system-linux: handle hotplug event socket ENOBUFS errors
[oweals/netifd.git] / system-linux.c
1 /*
2  * netifd - network interface daemon
3  * Copyright (C) 2012 Felix Fietkau <nbd@openwrt.org>
4  * Copyright (C) 2013 Jo-Philipp Wich <jow@openwrt.org>
5  * Copyright (C) 2013 Steven Barth <steven@midlink.org>
6  * Copyright (C) 2014 Gioacchino Mazzurco <gio@eigenlab.org>
7  * Copyright (C) 2017 Matthias Schiffer <mschiffer@universe-factory.net>
8  * Copyright (C) 2018 Hans Dedecker <dedeckeh@gmail.com>
9  *
10  * This program is free software; you can redistribute it and/or modify
11  * it under the terms of the GNU General Public License version 2
12  * as published by the Free Software Foundation
13  *
14  * This program is distributed in the hope that it will be useful,
15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
17  * GNU General Public License for more details.
18  */
19 #define _GNU_SOURCE
20
21 #include <sys/socket.h>
22 #include <sys/ioctl.h>
23 #include <sys/stat.h>
24 #include <sys/syscall.h>
25
26 #include <net/if.h>
27 #include <net/if_arp.h>
28
29 #include <arpa/inet.h>
30 #include <netinet/ether.h>
31 #include <netinet/in.h>
32
33 #include <linux/rtnetlink.h>
34 #include <linux/sockios.h>
35 #include <linux/ip.h>
36 #include <linux/if_addr.h>
37 #include <linux/if_link.h>
38 #include <linux/if_vlan.h>
39 #include <linux/if_bridge.h>
40 #include <linux/if_tunnel.h>
41 #include <linux/ip6_tunnel.h>
42 #include <linux/ethtool.h>
43 #include <linux/fib_rules.h>
44 #include <linux/veth.h>
45 #include <linux/version.h>
46
47 #ifndef RTN_FAILED_POLICY
48 #define RTN_FAILED_POLICY 12
49 #endif
50
51 #ifndef IFA_F_NOPREFIXROUTE
52 #define IFA_F_NOPREFIXROUTE 0x200
53 #endif
54
55 #ifndef IFA_FLAGS
56 #define IFA_FLAGS (IFA_MULTICAST + 1)
57 #endif
58
59 #include <string.h>
60 #include <fcntl.h>
61 #include <glob.h>
62 #include <time.h>
63 #include <unistd.h>
64
65 #include <netlink/msg.h>
66 #include <netlink/attr.h>
67 #include <netlink/socket.h>
68 #include <libubox/uloop.h>
69
70 #include "netifd.h"
71 #include "device.h"
72 #include "system.h"
73
74 struct event_socket {
75         struct uloop_fd uloop;
76         struct nl_sock *sock;
77         int bufsize;
78 };
79
/* Socket used for ioctl() requests; stays -1 until system_init() opens it */
static int sock_ioctl = -1;

/* rtnetlink socket used for requests; created by system_init() */
static struct nl_sock *sock_rtnl = NULL;

/* Scratch buffer used when formatting procfs/sysfs paths */
static char dev_buf[256];

/* Forward declarations for functions defined further down in this file */
static int cb_rtnl_event(struct nl_msg *msg, void *arg);
static void handle_hotplug_event(struct uloop_fd *u, unsigned int events);
static int system_add_proto_tunnel(const char *name, const uint8_t proto,
                                        const unsigned int link, struct blob_attr **tb);
static int __system_del_ip_tunnel(const char *name, struct blob_attr **tb);
90
91 static void
92 handler_nl_event(struct uloop_fd *u, unsigned int events)
93 {
94         struct event_socket *ev = container_of(u, struct event_socket, uloop);
95         int err;
96         socklen_t errlen = sizeof(err);
97
98         if (!u->error) {
99                 nl_recvmsgs_default(ev->sock);
100                 return;
101         }
102
103         if (getsockopt(u->fd, SOL_SOCKET, SO_ERROR, (void *)&err, &errlen))
104                 goto abort;
105
106         switch(err) {
107         case ENOBUFS:
108                 /* Increase rx buffer size on netlink socket */
109                 ev->bufsize *= 2;
110                 if (nl_socket_set_buffer_size(ev->sock, ev->bufsize, 0))
111                         goto abort;
112
113                 /* Request full dump since some info got dropped */
114                 struct rtgenmsg msg = { .rtgen_family = AF_UNSPEC };
115                 nl_send_simple(ev->sock, RTM_GETLINK, NLM_F_DUMP, &msg, sizeof(msg));
116                 break;
117
118         default:
119                 goto abort;
120         }
121         u->error = false;
122         return;
123
124 abort:
125         uloop_fd_delete(&ev->uloop);
126         return;
127 }
128
/*
 * Allocate a netlink socket, optionally join the multicast @groups bitmask
 * and connect it to @protocol.
 *
 * Returns the connected socket, or NULL on failure. The socket is released
 * again when connecting fails, so nothing is leaked on the error path.
 */
static struct nl_sock *
create_socket(int protocol, int groups)
{
        struct nl_sock *sock;

        sock = nl_socket_alloc();
        if (!sock)
                return NULL;

        if (groups)
                nl_join_groups(sock, groups);

        if (nl_connect(sock, protocol)) {
                nl_socket_free(sock);
                return NULL;
        }

        return sock;
}
146
147 static bool
148 create_raw_event_socket(struct event_socket *ev, int protocol, int groups,
149                         uloop_fd_handler cb, int flags)
150 {
151         ev->sock = create_socket(protocol, groups);
152         if (!ev->sock)
153                 return false;
154
155         ev->uloop.fd = nl_socket_get_fd(ev->sock);
156         ev->uloop.cb = cb;
157         if (uloop_fd_add(&ev->uloop, ULOOP_READ|flags))
158                 return false;
159
160         return true;
161 }
162
163 static bool
164 create_event_socket(struct event_socket *ev, int protocol,
165                     int (*cb)(struct nl_msg *msg, void *arg))
166 {
167         if (!create_raw_event_socket(ev, protocol, 0, handler_nl_event, ULOOP_ERROR_CB))
168                 return false;
169
170         /* Install the valid custom callback handler */
171         nl_socket_modify_cb(ev->sock, NL_CB_VALID, NL_CB_CUSTOM, cb, NULL);
172
173         /* Disable sequence number checking on event sockets */
174         nl_socket_disable_seq_check(ev->sock);
175
176         /* Increase rx buffer size to 65K on event sockets */
177         ev->bufsize = 65535;
178         if (nl_socket_set_buffer_size(ev->sock, ev->bufsize, 0))
179                 return false;
180
181         return true;
182 }
183
184 static bool
185 create_hotplug_event_socket(struct event_socket *ev, int protocol,
186                             void (*cb)(struct uloop_fd *u, unsigned int events))
187 {
188         if (!create_raw_event_socket(ev, protocol, 1, cb, ULOOP_ERROR_CB))
189                 return false;
190
191         /* Increase rx buffer size to 65K on event sockets */
192         ev->bufsize = 65535;
193         if (nl_socket_set_buffer_size(ev->sock, ev->bufsize, 0))
194                 return false;
195
196         return true;
197 }
198
/*
 * Convert a route type given as symbolic name or as number into its RTN_*
 * value.
 *
 * @src: NUL-terminated route type ("local", "unicast", ... or a number in
 *       any base understood by strtoul() with base 0)
 * @dst: receives the value; only written on success
 *
 * Returns true on success, false if @src is neither a known name nor a
 * number in the range 0..255.
 */
static bool
system_rtn_aton(const char *src, unsigned int *dst)
{
        static const struct {
                const char *name;
                unsigned int type;
        } rtn_names[] = {
                { "local", RTN_LOCAL },
                { "nat", RTN_NAT },
                { "broadcast", RTN_BROADCAST },
                { "anycast", RTN_ANYCAST },
                { "multicast", RTN_MULTICAST },
                { "prohibit", RTN_PROHIBIT },
                { "unreachable", RTN_UNREACHABLE },
                { "blackhole", RTN_BLACKHOLE },
                { "xresolve", RTN_XRESOLVE },
                { "unicast", RTN_UNICAST },
                { "throw", RTN_THROW },
                { "failed_policy", RTN_FAILED_POLICY },
        };
        unsigned long n;
        size_t i;
        char *e;

        for (i = 0; i < sizeof(rtn_names) / sizeof(rtn_names[0]); i++) {
                if (!strcmp(src, rtn_names[i].name)) {
                        *dst = rtn_names[i].type;
                        return true;
                }
        }

        /*
         * Keep the full unsigned long result for the range check; storing it
         * in an unsigned int first would let values such as 2^32 wrap to 0
         * and pass the check.
         */
        n = strtoul(src, &e, 0);
        if (e == src || *e || n > 255)
                return false;

        *dst = n;
        return true;
}
238
/*
 * Parse a TOS value given as hexadecimal string.
 *
 * @src: NUL-terminated hexadecimal number
 * @dst: receives the value; only written on success
 *
 * Returns true on success, false if @src is not a complete hexadecimal
 * number or exceeds 255.
 */
static bool
system_tos_aton(const char *src, unsigned *dst)
{
        unsigned long tos;
        char *e;

        /*
         * Range-check the untruncated unsigned long: assigning straight to
         * *dst would wrap values like 0x100000000 to 0 and accept them.
         */
        tos = strtoul(src, &e, 16);
        if (e == src || *e || tos > 255)
                return false;

        *dst = tos;
        return true;
}
250
251 int system_init(void)
252 {
253         static struct event_socket rtnl_event;
254         static struct event_socket hotplug_event;
255
256         sock_ioctl = socket(AF_LOCAL, SOCK_DGRAM, 0);
257         system_fd_set_cloexec(sock_ioctl);
258
259         /* Prepare socket for routing / address control */
260         sock_rtnl = create_socket(NETLINK_ROUTE, 0);
261         if (!sock_rtnl)
262                 return -1;
263
264         if (!create_event_socket(&rtnl_event, NETLINK_ROUTE, cb_rtnl_event))
265                 return -1;
266
267         if (!create_hotplug_event_socket(&hotplug_event, NETLINK_KOBJECT_UEVENT,
268                                          handle_hotplug_event))
269                 return -1;
270
271         /* Receive network link events form kernel */
272         nl_socket_add_membership(rtnl_event.sock, RTNLGRP_LINK);
273
274         return 0;
275 }
276
/*
 * Write the string @val to the existing file @path.
 * Best effort: a file that cannot be opened or a failing write is ignored.
 */
static void system_set_sysctl(const char *path, const char *val)
{
        ssize_t written;
        int fd = open(path, O_WRONLY);

        if (fd >= 0) {
                written = write(fd, val, strlen(val));
                (void)written; /* result intentionally unused */
                close(fd);
        }
}
288
289 static void system_set_dev_sysctl(const char *path, const char *device, const char *val)
290 {
291         snprintf(dev_buf, sizeof(dev_buf), path, device);
292         system_set_sysctl(dev_buf, val);
293 }
294
295 static void system_set_disable_ipv6(struct device *dev, const char *val)
296 {
297         system_set_dev_sysctl("/proc/sys/net/ipv6/conf/%s/disable_ipv6", dev->ifname, val);
298 }
299
300 static void system_set_rpfilter(struct device *dev, const char *val)
301 {
302         system_set_dev_sysctl("/proc/sys/net/ipv4/conf/%s/rp_filter", dev->ifname, val);
303 }
304
305 static void system_set_acceptlocal(struct device *dev, const char *val)
306 {
307         system_set_dev_sysctl("/proc/sys/net/ipv4/conf/%s/accept_local", dev->ifname, val);
308 }
309
310 static void system_set_igmpversion(struct device *dev, const char *val)
311 {
312         system_set_dev_sysctl("/proc/sys/net/ipv4/conf/%s/force_igmp_version", dev->ifname, val);
313 }
314
315 static void system_set_mldversion(struct device *dev, const char *val)
316 {
317         system_set_dev_sysctl("/proc/sys/net/ipv6/conf/%s/force_mld_version", dev->ifname, val);
318 }
319
320 static void system_set_neigh4reachabletime(struct device *dev, const char *val)
321 {
322         system_set_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/base_reachable_time_ms", dev->ifname, val);
323 }
324
325 static void system_set_neigh6reachabletime(struct device *dev, const char *val)
326 {
327         system_set_dev_sysctl("/proc/sys/net/ipv6/neigh/%s/base_reachable_time_ms", dev->ifname, val);
328 }
329
330 static void system_set_neigh4gcstaletime(struct device *dev, const char *val)
331 {
332         system_set_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/gc_stale_time", dev->ifname, val);
333 }
334
335 static void system_set_neigh6gcstaletime(struct device *dev, const char *val)
336 {
337         system_set_dev_sysctl("/proc/sys/net/ipv6/neigh/%s/gc_stale_time", dev->ifname, val);
338 }
339
340 static void system_set_neigh4locktime(struct device *dev, const char *val)
341 {
342         system_set_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/locktime", dev->ifname, val);
343 }
344
345 static void system_set_dadtransmits(struct device *dev, const char *val)
346 {
347         system_set_dev_sysctl("/proc/sys/net/ipv6/conf/%s/dad_transmits", dev->ifname, val);
348 }
349
350 static void system_bridge_set_multicast_to_unicast(struct device *dev, const char *val)
351 {
352         system_set_dev_sysctl("/sys/class/net/%s/brport/multicast_to_unicast", dev->ifname, val);
353 }
354
355 static void system_bridge_set_multicast_fast_leave(struct device *dev, const char *val)
356 {
357         system_set_dev_sysctl("/sys/class/net/%s/brport/multicast_fast_leave", dev->ifname, val);
358 }
359
360 static void system_bridge_set_hairpin_mode(struct device *dev, const char *val)
361 {
362         system_set_dev_sysctl("/sys/class/net/%s/brport/hairpin_mode", dev->ifname, val);
363 }
364
365 static void system_bridge_set_isolated(struct device *dev, const char *val)
366 {
367         system_set_dev_sysctl("/sys/class/net/%s/brport/isolated", dev->ifname, val);
368 }
369
370 static void system_bridge_set_multicast_router(struct device *dev, const char *val, bool bridge)
371 {
372         system_set_dev_sysctl(bridge ? "/sys/class/net/%s/bridge/multicast_router" :
373                                        "/sys/class/net/%s/brport/multicast_router",
374                               dev->ifname, val);
375 }
376
377 static void system_bridge_set_robustness(struct device *dev, const char *val)
378 {
379         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_startup_query_count",
380                               dev->ifname, val);
381         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_last_member_count",
382                               dev->ifname, val);
383 }
384
385 static void system_bridge_set_query_interval(struct device *dev, const char *val)
386 {
387         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_query_interval",
388                               dev->ifname, val);
389 }
390
391 static void system_bridge_set_query_response_interval(struct device *dev, const char *val)
392 {
393         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_query_response_interval",
394                               dev->ifname, val);
395 }
396
397 static void system_bridge_set_last_member_interval(struct device *dev, const char *val)
398 {
399         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_last_member_interval",
400                               dev->ifname, val);
401 }
402
403 static void system_bridge_set_membership_interval(struct device *dev, const char *val)
404 {
405         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_membership_interval",
406                               dev->ifname, val);
407 }
408
409 static void system_bridge_set_other_querier_timeout(struct device *dev, const char *val)
410 {
411         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_querier_interval",
412                               dev->ifname, val);
413 }
414
415 static void system_bridge_set_startup_query_interval(struct device *dev, const char *val)
416 {
417         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_startup_query_interval",
418                               dev->ifname, val);
419 }
420
421 static void system_bridge_set_stp_state(struct device *dev, const char *val)
422 {
423         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/stp_state", dev->ifname, val);
424 }
425
426 static void system_bridge_set_forward_delay(struct device *dev, const char *val)
427 {
428         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/forward_delay", dev->ifname, val);
429 }
430
431 static void system_bridge_set_priority(struct device *dev, const char *val)
432 {
433         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/priority", dev->ifname, val);
434 }
435
436 static void system_bridge_set_ageing_time(struct device *dev, const char *val)
437 {
438         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/ageing_time", dev->ifname, val);
439 }
440
441 static void system_bridge_set_hello_time(struct device *dev, const char *val)
442 {
443         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/hello_time", dev->ifname, val);
444 }
445
446 static void system_bridge_set_max_age(struct device *dev, const char *val)
447 {
448         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/max_age", dev->ifname, val);
449 }
450
451 static void system_bridge_set_learning(struct device *dev, const char *val)
452 {
453         system_set_dev_sysctl("/sys/class/net/%s/brport/learning", dev->ifname, val);
454 }
455
456 static void system_bridge_set_unicast_flood(struct device *dev, const char *val)
457 {
458         system_set_dev_sysctl("/sys/class/net/%s/brport/unicast_flood", dev->ifname, val);
459 }
460
461 static void system_set_sendredirects(struct device *dev, const char *val)
462 {
463         system_set_dev_sysctl("/proc/sys/net/ipv4/conf/%s/send_redirects", dev->ifname, val);
464 }
465
/*
 * Read the beginning of the file @path into @buf and NUL-terminate it.
 *
 * @path:   file to read
 * @buf:    destination buffer
 * @buf_sz: size of @buf in bytes; at most @buf_sz - 1 bytes are read
 *
 * Returns 0 on success, -1 if @buf_sz is 0 or the file cannot be opened or
 * read. A zero-sized buffer is rejected up front because @buf_sz - 1 would
 * otherwise wrap around and allow an unbounded read into @buf.
 */
static int system_get_sysctl(const char *path, char *buf, const size_t buf_sz)
{
        ssize_t len;
        int fd;

        if (!buf_sz)
                return -1;

        fd = open(path, O_RDONLY);
        if (fd < 0)
                return -1;

        len = read(fd, buf, buf_sz - 1);
        close(fd);

        if (len < 0)
                return -1;

        buf[len] = 0;
        return 0;
}
486
487 static int
488 system_get_dev_sysctl(const char *path, const char *device, char *buf, const size_t buf_sz)
489 {
490         snprintf(dev_buf, sizeof(dev_buf), path, device);
491         return system_get_sysctl(dev_buf, buf, buf_sz);
492 }
493
494 static int system_get_disable_ipv6(struct device *dev, char *buf, const size_t buf_sz)
495 {
496         return system_get_dev_sysctl("/proc/sys/net/ipv6/conf/%s/disable_ipv6",
497                         dev->ifname, buf, buf_sz);
498 }
499
500 static int system_get_rpfilter(struct device *dev, char *buf, const size_t buf_sz)
501 {
502         return system_get_dev_sysctl("/proc/sys/net/ipv4/conf/%s/rp_filter",
503                         dev->ifname, buf, buf_sz);
504 }
505
506 static int system_get_acceptlocal(struct device *dev, char *buf, const size_t buf_sz)
507 {
508         return system_get_dev_sysctl("/proc/sys/net/ipv4/conf/%s/accept_local",
509                         dev->ifname, buf, buf_sz);
510 }
511
512 static int system_get_igmpversion(struct device *dev, char *buf, const size_t buf_sz)
513 {
514         return system_get_dev_sysctl("/proc/sys/net/ipv4/conf/%s/force_igmp_version",
515                         dev->ifname, buf, buf_sz);
516 }
517
518 static int system_get_mldversion(struct device *dev, char *buf, const size_t buf_sz)
519 {
520         return system_get_dev_sysctl("/proc/sys/net/ipv6/conf/%s/force_mld_version",
521                         dev->ifname, buf, buf_sz);
522 }
523
524 static int system_get_neigh4reachabletime(struct device *dev, char *buf, const size_t buf_sz)
525 {
526         return system_get_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/base_reachable_time_ms",
527                         dev->ifname, buf, buf_sz);
528 }
529
530 static int system_get_neigh6reachabletime(struct device *dev, char *buf, const size_t buf_sz)
531 {
532         return system_get_dev_sysctl("/proc/sys/net/ipv6/neigh/%s/base_reachable_time_ms",
533                         dev->ifname, buf, buf_sz);
534 }
535
536 static int system_get_neigh4gcstaletime(struct device *dev, char *buf, const size_t buf_sz)
537 {
538         return system_get_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/gc_stale_time",
539                         dev->ifname, buf, buf_sz);
540 }
541
542 static int system_get_neigh6gcstaletime(struct device *dev, char *buf, const size_t buf_sz)
543 {
544         return system_get_dev_sysctl("/proc/sys/net/ipv6/neigh/%s/gc_stale_time",
545                         dev->ifname, buf, buf_sz);
546 }
547
548 static int system_get_neigh4locktime(struct device *dev, char *buf, const size_t buf_sz)
549 {
550         return system_get_dev_sysctl("/proc/sys/net/ipv4/neigh/%s/locktime",
551                         dev->ifname, buf, buf_sz);
552 }
553
554 static int system_get_dadtransmits(struct device *dev, char *buf, const size_t buf_sz)
555 {
556         return system_get_dev_sysctl("/proc/sys/net/ipv6/conf/%s/dad_transmits",
557                         dev->ifname, buf, buf_sz);
558 }
559
560 static int system_get_sendredirects(struct device *dev, char *buf, const size_t buf_sz)
561 {
562         return system_get_dev_sysctl("/proc/sys/net/ipv4/conf/%s/send_redirects",
563                         dev->ifname, buf, buf_sz);
564 }
565
566 /* Evaluate netlink messages */
567 static int cb_rtnl_event(struct nl_msg *msg, void *arg)
568 {
569         struct nlmsghdr *nh = nlmsg_hdr(msg);
570         struct nlattr *nla[__IFLA_MAX];
571         int link_state = 0;
572         char buf[10];
573
574         if (nh->nlmsg_type != RTM_NEWLINK)
575                 goto out;
576
577         nlmsg_parse(nh, sizeof(struct ifinfomsg), nla, __IFLA_MAX - 1, NULL);
578         if (!nla[IFLA_IFNAME])
579                 goto out;
580
581         struct device *dev = device_find(nla_data(nla[IFLA_IFNAME]));
582         if (!dev)
583                 goto out;
584
585         if (!system_get_dev_sysctl("/sys/class/net/%s/carrier", dev->ifname, buf, sizeof(buf)))
586                 link_state = strtoul(buf, NULL, 0);
587
588         device_set_link(dev, link_state ? true : false);
589
590 out:
591         return 0;
592 }
593
594 static void
595 handle_hotplug_msg(char *data, int size)
596 {
597         const char *subsystem = NULL, *interface = NULL, *interface_old = NULL;
598         char *cur, *end, *sep;
599         struct device *dev;
600         int skip;
601         bool add, move = false;
602
603         if (!strncmp(data, "add@", 4))
604                 add = true;
605         else if (!strncmp(data, "remove@", 7))
606                 add = false;
607         else if (!strncmp(data, "move@", 5)) {
608                 add = true;
609                 move = true;
610         }
611         else
612                 return;
613
614         skip = strlen(data) + 1;
615         end = data + size;
616
617         for (cur = data + skip; cur < end; cur += skip) {
618                 skip = strlen(cur) + 1;
619
620                 sep = strchr(cur, '=');
621                 if (!sep)
622                         continue;
623
624                 *sep = 0;
625                 if (!strcmp(cur, "INTERFACE"))
626                         interface = sep + 1;
627                 else if (!strcmp(cur, "SUBSYSTEM")) {
628                         subsystem = sep + 1;
629                         if (strcmp(subsystem, "net") != 0)
630                                 return;
631                 } else if (!strcmp(cur, "DEVPATH_OLD")) {
632                         interface_old = strrchr(sep + 1, '/');
633                         if (interface_old)
634                                 interface_old++;
635                 }
636         }
637
638         if (subsystem && interface) {
639                 if (move && interface_old)
640                         goto move;
641                 else
642                         goto found;
643         }
644
645         return;
646
647 move:
648         dev = device_find(interface_old);
649         if (!dev)
650                 goto found;
651
652         if (dev->type != &simple_device_type)
653                 goto found;
654
655         device_set_present(dev, false);
656
657 found:
658         dev = device_find(interface);
659         if (!dev)
660                 return;
661
662         if (dev->type != &simple_device_type)
663                 return;
664
665         if (add && system_if_force_external(dev->ifname))
666                 return;
667
668         device_set_present(dev, add);
669 }
670
671 static void
672 handle_hotplug_event(struct uloop_fd *u, unsigned int events)
673 {
674         struct event_socket *ev = container_of(u, struct event_socket, uloop);
675         struct sockaddr_nl nla;
676         unsigned char *buf = NULL;
677         int size;
678         int err;
679         socklen_t errlen = sizeof(err);
680
681         if (!u->error) {
682                 while ((size = nl_recv(ev->sock, &nla, &buf, NULL)) > 0) {
683                         if (nla.nl_pid == 0)
684                                 handle_hotplug_msg((char *) buf, size);
685
686                         free(buf);
687                 }
688                 return;
689         }
690
691         if (getsockopt(u->fd, SOL_SOCKET, SO_ERROR, (void *)&err, &errlen))
692                 goto abort;
693
694         switch(err) {
695         case ENOBUFS:
696                 /* Increase rx buffer size on netlink socket */
697                 ev->bufsize *= 2;
698                 if (nl_socket_set_buffer_size(ev->sock, ev->bufsize, 0))
699                         goto abort;
700                 break;
701
702         default:
703                 goto abort;
704         }
705         u->error = false;
706         return;
707
708 abort:
709         uloop_fd_delete(&ev->uloop);
710         return;
711 }
712
713 static int system_rtnl_call(struct nl_msg *msg)
714 {
715         int ret;
716
717         ret = nl_send_auto_complete(sock_rtnl, msg);
718         nlmsg_free(msg);
719
720         if (ret < 0)
721                 return ret;
722
723         return nl_wait_for_ack(sock_rtnl);
724 }
725
726 int system_bridge_delbr(struct device *bridge)
727 {
728         return ioctl(sock_ioctl, SIOCBRDELBR, bridge->ifname);
729 }
730
731 static int system_bridge_if(const char *bridge, struct device *dev, int cmd, void *data)
732 {
733         struct ifreq ifr;
734
735         memset(&ifr, 0, sizeof(ifr));
736         if (dev)
737                 ifr.ifr_ifindex = dev->ifindex;
738         else
739                 ifr.ifr_data = data;
740         strncpy(ifr.ifr_name, bridge, sizeof(ifr.ifr_name) - 1);
741         return ioctl(sock_ioctl, cmd, &ifr);
742 }
743
/*
 * Report whether /sys/devices/virtual/net/<name>/bridge exists.
 * The path is formatted into @buf (of size @buflen) as a side effect.
 */
static bool system_is_bridge(const char *name, char *buf, int buflen)
{
        struct stat info;

        snprintf(buf, buflen, "/sys/devices/virtual/net/%s/bridge", name);

        return stat(buf, &info) >= 0;
}
754
/*
 * Look up the bridge that the port @name is attached to.
 *
 * The first match of /sys/devices/virtual/net/<any>/brif/<name>/bridge is
 * resolved with readlink() and the last component of the link target is
 * returned.
 *
 * @buf/@buflen: scratch buffer, used for the glob pattern and afterwards
 *               for the link target; the returned pointer points into it.
 *
 * Returns NULL if @buflen is not positive, nothing matches, the link cannot
 * be read or the target contains no '/'.
 */
static char *system_get_bridge(const char *name, char *buf, int buflen)
{
        char *path;
        ssize_t len = -1;
        glob_t gl;

        if (buflen <= 0)
                return NULL;

        snprintf(buf, buflen, "/sys/devices/virtual/net/*/brif/%s/bridge", name);
        if (glob(buf, GLOB_NOSORT, NULL, &gl) < 0)
                return NULL;

        /*
         * readlink() does not NUL-terminate and may fill the whole buffer,
         * so reserve one byte for the terminator written below.
         */
        if (gl.gl_pathc > 0)
                len = readlink(gl.gl_pathv[0], buf, buflen - 1);

        globfree(&gl);

        if (len < 0)
                return NULL;

        buf[len] = 0;
        path = strrchr(buf, '/');
        if (!path)
                return NULL;

        return path + 1;
}
780
781 static void
782 system_bridge_set_wireless(struct device *bridge, struct device *dev)
783 {
784         bool mcast_to_ucast = dev->wireless_ap;
785         bool hairpin = true;
786
787         if (bridge->settings.flags & DEV_OPT_MULTICAST_TO_UNICAST &&
788             !bridge->settings.multicast_to_unicast)
789                 mcast_to_ucast = false;
790
791         if (!mcast_to_ucast || dev->wireless_isolate)
792                 hairpin = false;
793
794         system_bridge_set_multicast_to_unicast(dev, mcast_to_ucast ? "1" : "0");
795         system_bridge_set_hairpin_mode(dev, hairpin ? "1" : "0");
796 }
797
798 int system_bridge_addif(struct device *bridge, struct device *dev)
799 {
800         char buf[64];
801         char *oldbr;
802         int ret = 0;
803
804         oldbr = system_get_bridge(dev->ifname, dev_buf, sizeof(dev_buf));
805         if (!oldbr || strcmp(oldbr, bridge->ifname) != 0)
806                 ret = system_bridge_if(bridge->ifname, dev, SIOCBRADDIF, NULL);
807
808         if (dev->wireless)
809                 system_bridge_set_wireless(bridge, dev);
810
811         if (dev->settings.flags & DEV_OPT_MULTICAST_ROUTER) {
812                 snprintf(buf, sizeof(buf), "%u", dev->settings.multicast_router);
813                 system_bridge_set_multicast_router(dev, buf, false);
814         }
815
816         if (dev->settings.flags & DEV_OPT_MULTICAST_FAST_LEAVE &&
817             dev->settings.multicast_fast_leave)
818                 system_bridge_set_multicast_fast_leave(dev, "1");
819
820         if (dev->settings.flags & DEV_OPT_LEARNING &&
821             !dev->settings.learning)
822                 system_bridge_set_learning(dev, "0");
823
824         if (dev->settings.flags & DEV_OPT_UNICAST_FLOOD &&
825             !dev->settings.unicast_flood)
826                 system_bridge_set_unicast_flood(dev, "0");
827
828         if (dev->settings.flags & DEV_OPT_ISOLATE &&
829             dev->settings.isolate)
830                 system_bridge_set_isolated(dev, "1");
831
832         return ret;
833 }
834
835 int system_bridge_delif(struct device *bridge, struct device *dev)
836 {
837         return system_bridge_if(bridge->ifname, dev, SIOCBRDELIF, NULL);
838 }
839
840 int system_if_resolve(struct device *dev)
841 {
842         struct ifreq ifr;
843         strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name) - 1);
844         if (!ioctl(sock_ioctl, SIOCGIFINDEX, &ifr))
845                 return ifr.ifr_ifindex;
846         else
847                 return 0;
848 }
849
850 static int system_if_flags(const char *ifname, unsigned add, unsigned rem)
851 {
852         struct ifreq ifr;
853
854         memset(&ifr, 0, sizeof(ifr));
855         strncpy(ifr.ifr_name, ifname, sizeof(ifr.ifr_name) - 1);
856         if (ioctl(sock_ioctl, SIOCGIFFLAGS, &ifr) < 0)
857                 return -1;
858
859         ifr.ifr_flags |= add;
860         ifr.ifr_flags &= ~rem;
861         return ioctl(sock_ioctl, SIOCSIFFLAGS, &ifr);
862 }
863
/*
 * State handed to cb_clear_event() while entries are being cleared.
 */
struct clear_data {
        /* message buffer reused for the delete requests */
        struct nl_msg *msg;
        /* device whose entries are matched; may be NULL */
        struct device *dev;
        /* RTM_GET* type of the dump being processed */
        int type;
        /* size of the request header appended to the dump request */
        int size;
        /* address family of the dump */
        int af;
};
871
872
/* Return true if the address message @hdr belongs to interface @ifindex */
static bool check_ifaddr(struct nlmsghdr *hdr, int ifindex)
{
        const struct ifaddrmsg *addr = NLMSG_DATA(hdr);
        bool same_dev = (addr->ifa_index == ifindex);

        return same_dev;
}
879
/*
 * Return true if the route message @hdr should be removed for interface
 * @ifindex: its RTA_OIF attribute must equal @ifindex, and IPv6 routes with
 * protocol RTPROT_KERNEL are never matched. Messages whose attributes
 * cannot be parsed do not match.
 */
static bool check_route(struct nlmsghdr *hdr, int ifindex)
{
        struct rtmsg *r = NLMSG_DATA(hdr);
        struct nlattr *tb[__RTA_MAX];

        if (r->rtm_protocol == RTPROT_KERNEL &&
            r->rtm_family == AF_INET6)
                return false;

        /* On a parse error the attribute table must not be looked at */
        if (nlmsg_parse(hdr, sizeof(struct rtmsg), tb, __RTA_MAX - 1, NULL) < 0)
                return false;

        if (!tb[RTA_OIF])
                return false;

        return *(int *)RTA_DATA(tb[RTA_OIF]) == ifindex;
}
895
/* Rules are not filtered by interface: every rule message matches */
static bool check_rule(struct nlmsghdr *hdr, int ifindex)
{
        (void)hdr;
        (void)ifindex;

        return true;
}
900
901 static int cb_clear_event(struct nl_msg *msg, void *arg)
902 {
903         struct clear_data *clr = arg;
904         struct nlmsghdr *hdr = nlmsg_hdr(msg);
905         bool (*cb)(struct nlmsghdr *, int ifindex);
906         int type;
907
908         switch(clr->type) {
909         case RTM_GETADDR:
910                 type = RTM_DELADDR;
911                 if (hdr->nlmsg_type != RTM_NEWADDR)
912                         return NL_SKIP;
913
914                 cb = check_ifaddr;
915                 break;
916         case RTM_GETROUTE:
917                 type = RTM_DELROUTE;
918                 if (hdr->nlmsg_type != RTM_NEWROUTE)
919                         return NL_SKIP;
920
921                 cb = check_route;
922                 break;
923         case RTM_GETRULE:
924                 type = RTM_DELRULE;
925                 if (hdr->nlmsg_type != RTM_NEWRULE)
926                         return NL_SKIP;
927
928                 cb = check_rule;
929                 break;
930         default:
931                 return NL_SKIP;
932         }
933
934         if (!cb(hdr, clr->dev ? clr->dev->ifindex : 0))
935                 return NL_SKIP;
936
937         if (type == RTM_DELRULE)
938                 D(SYSTEM, "Remove a rule\n");
939         else
940                 D(SYSTEM, "Remove %s from device %s\n",
941                   type == RTM_DELADDR ? "an address" : "a route",
942                   clr->dev->ifname);
943         memcpy(nlmsg_hdr(clr->msg), hdr, hdr->nlmsg_len);
944         hdr = nlmsg_hdr(clr->msg);
945         hdr->nlmsg_type = type;
946         hdr->nlmsg_flags = NLM_F_REQUEST;
947
948         nl_socket_disable_auto_ack(sock_rtnl);
949         nl_send_auto_complete(sock_rtnl, clr->msg);
950         nl_socket_enable_auto_ack(sock_rtnl);
951
952         return NL_SKIP;
953 }
954
955 static int
956 cb_finish_event(struct nl_msg *msg, void *arg)
957 {
958         int *pending = arg;
959         *pending = 0;
960         return NL_STOP;
961 }
962
963 static int
964 error_handler(struct sockaddr_nl *nla, struct nlmsgerr *err, void *arg)
965 {
966         int *pending = arg;
967         *pending = err->error;
968         return NL_STOP;
969 }
970
971 static void
972 system_if_clear_entries(struct device *dev, int type, int af)
973 {
974         struct clear_data clr;
975         struct nl_cb *cb = nl_cb_alloc(NL_CB_DEFAULT);
976         struct rtmsg rtm = {
977                 .rtm_family = af,
978                 .rtm_flags = RTM_F_CLONED,
979         };
980         int flags = NLM_F_DUMP;
981         int pending = 1;
982
983         clr.af = af;
984         clr.dev = dev;
985         clr.type = type;
986         switch (type) {
987         case RTM_GETADDR:
988         case RTM_GETRULE:
989                 clr.size = sizeof(struct rtgenmsg);
990                 break;
991         case RTM_GETROUTE:
992                 clr.size = sizeof(struct rtmsg);
993                 break;
994         default:
995                 return;
996         }
997
998         if (!cb)
999                 return;
1000
1001         clr.msg = nlmsg_alloc_simple(type, flags);
1002         if (!clr.msg)
1003                 goto out;
1004
1005         nlmsg_append(clr.msg, &rtm, clr.size, 0);
1006         nl_cb_set(cb, NL_CB_VALID, NL_CB_CUSTOM, cb_clear_event, &clr);
1007         nl_cb_set(cb, NL_CB_FINISH, NL_CB_CUSTOM, cb_finish_event, &pending);
1008         nl_cb_err(cb, NL_CB_CUSTOM, error_handler, &pending);
1009
1010         nl_send_auto_complete(sock_rtnl, clr.msg);
1011         while (pending > 0)
1012                 nl_recvmsgs(sock_rtnl, cb);
1013
1014         nlmsg_free(clr.msg);
1015 out:
1016         nl_cb_put(cb);
1017 }
1018
1019 /*
1020  * Clear bridge (membership) state and bring down device
1021  */
1022 void system_if_clear_state(struct device *dev)
1023 {
1024         static char buf[256];
1025         char *bridge;
1026
1027         device_set_ifindex(dev, system_if_resolve(dev));
1028         if (dev->external || !dev->ifindex)
1029                 return;
1030
1031         system_if_flags(dev->ifname, 0, IFF_UP);
1032
1033         if (system_is_bridge(dev->ifname, buf, sizeof(buf))) {
1034                 D(SYSTEM, "Delete existing bridge named '%s'\n", dev->ifname);
1035                 system_bridge_delbr(dev);
1036                 return;
1037         }
1038
1039         bridge = system_get_bridge(dev->ifname, buf, sizeof(buf));
1040         if (bridge) {
1041                 D(SYSTEM, "Remove device '%s' from bridge '%s'\n", dev->ifname, bridge);
1042                 system_bridge_if(bridge, dev, SIOCBRDELIF, NULL);
1043         }
1044
1045         system_if_clear_entries(dev, RTM_GETROUTE, AF_INET);
1046         system_if_clear_entries(dev, RTM_GETADDR, AF_INET);
1047         system_if_clear_entries(dev, RTM_GETROUTE, AF_INET6);
1048         system_if_clear_entries(dev, RTM_GETADDR, AF_INET6);
1049         system_set_disable_ipv6(dev, "0");
1050 }
1051
/*
 * Scale a value in seconds by 100.
 * NOTE(review): presumably the bridge interface expects 1/100 s units -
 * confirm against the kernel side.
 */
static inline unsigned long
sec_to_jiffies(int val)
{
	unsigned long secs = (unsigned long) val;

	return secs * 100;
}
1057
1058 static void system_bridge_conf_multicast_deps(struct device *bridge,
1059                                               struct bridge_config *cfg,
1060                                               char *buf,
1061                                               int buf_len)
1062 {
1063         int val;
1064
1065         if (cfg->flags & BRIDGE_OPT_ROBUSTNESS ||
1066             cfg->flags & BRIDGE_OPT_QUERY_INTERVAL ||
1067             cfg->flags & BRIDGE_OPT_QUERY_RESPONSE_INTERVAL) {
1068                 val = cfg->robustness * cfg->query_interval +
1069                         cfg->query_response_interval;
1070
1071                 snprintf(buf, buf_len, "%i", val);
1072                 system_bridge_set_membership_interval(bridge, buf);
1073
1074                 val = cfg->robustness * cfg->query_interval +
1075                         cfg->query_response_interval / 2;
1076
1077                 snprintf(buf, buf_len, "%i", val);
1078                 system_bridge_set_other_querier_timeout(bridge, buf);
1079         }
1080
1081         if (cfg->flags & BRIDGE_OPT_QUERY_INTERVAL) {
1082                 val = cfg->query_interval / 4;
1083
1084                 snprintf(buf, buf_len, "%i", val);
1085                 system_bridge_set_startup_query_interval(bridge, buf);
1086         }
1087 }
1088
1089 static void system_bridge_conf_multicast(struct device *bridge,
1090                                          struct bridge_config *cfg,
1091                                          char *buf,
1092                                          int buf_len)
1093 {
1094         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_snooping",
1095                 bridge->ifname, cfg->igmp_snoop ? "1" : "0");
1096
1097         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_querier",
1098                 bridge->ifname, cfg->multicast_querier ? "1" : "0");
1099
1100         snprintf(buf, buf_len, "%i", cfg->hash_max);
1101         system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/hash_max",
1102                 bridge->ifname, buf);
1103
1104         if (bridge->settings.flags & DEV_OPT_MULTICAST_ROUTER) {
1105                 snprintf(buf, buf_len, "%u", bridge->settings.multicast_router);
1106                 system_bridge_set_multicast_router(bridge, buf, true);
1107         }
1108
1109         if (cfg->flags & BRIDGE_OPT_ROBUSTNESS) {
1110                 snprintf(buf, buf_len, "%i", cfg->robustness);
1111                 system_bridge_set_robustness(bridge, buf);
1112         }
1113
1114         if (cfg->flags & BRIDGE_OPT_QUERY_INTERVAL) {
1115                 snprintf(buf, buf_len, "%i", cfg->query_interval);
1116                 system_bridge_set_query_interval(bridge, buf);
1117         }
1118
1119         if (cfg->flags & BRIDGE_OPT_QUERY_RESPONSE_INTERVAL) {
1120                 snprintf(buf, buf_len, "%i", cfg->query_response_interval);
1121                 system_bridge_set_query_response_interval(bridge, buf);
1122         }
1123
1124         if (cfg->flags & BRIDGE_OPT_LAST_MEMBER_INTERVAL) {
1125                 snprintf(buf, buf_len, "%i", cfg->last_member_interval);
1126                 system_bridge_set_last_member_interval(bridge, buf);
1127         }
1128
1129         system_bridge_conf_multicast_deps(bridge, cfg, buf, buf_len);
1130 }
1131
1132 int system_bridge_addbr(struct device *bridge, struct bridge_config *cfg)
1133 {
1134         char buf[64];
1135
1136         if (ioctl(sock_ioctl, SIOCBRADDBR, bridge->ifname) < 0)
1137                 return -1;
1138
1139         system_bridge_set_stp_state(bridge, cfg->stp ? "1" : "0");
1140
1141         snprintf(buf, sizeof(buf), "%lu", sec_to_jiffies(cfg->forward_delay));
1142         system_bridge_set_forward_delay(bridge, buf);
1143
1144         system_bridge_conf_multicast(bridge, cfg, buf, sizeof(buf));
1145
1146         snprintf(buf, sizeof(buf), "%d", cfg->priority);
1147         system_bridge_set_priority(bridge, buf);
1148
1149         if (cfg->flags & BRIDGE_OPT_AGEING_TIME) {
1150                 snprintf(buf, sizeof(buf), "%lu", sec_to_jiffies(cfg->ageing_time));
1151                 system_bridge_set_ageing_time(bridge, buf);
1152         }
1153
1154         if (cfg->flags & BRIDGE_OPT_HELLO_TIME) {
1155                 snprintf(buf, sizeof(buf), "%lu", sec_to_jiffies(cfg->hello_time));
1156                 system_bridge_set_hello_time(bridge, buf);
1157         }
1158
1159         if (cfg->flags & BRIDGE_OPT_MAX_AGE) {
1160                 snprintf(buf, sizeof(buf), "%lu", sec_to_jiffies(cfg->max_age));
1161                 system_bridge_set_max_age(bridge, buf);
1162         }
1163
1164         return 0;
1165 }
1166
1167 int system_macvlan_add(struct device *macvlan, struct device *dev, struct macvlan_config *cfg)
1168 {
1169         struct nl_msg *msg;
1170         struct nlattr *linkinfo, *data;
1171         struct ifinfomsg iim = { .ifi_family = AF_UNSPEC, };
1172         int i, rv;
1173         static const struct {
1174                 const char *name;
1175                 enum macvlan_mode val;
1176         } modes[] = {
1177                 { "private", MACVLAN_MODE_PRIVATE },
1178                 { "vepa", MACVLAN_MODE_VEPA },
1179                 { "bridge", MACVLAN_MODE_BRIDGE },
1180                 { "passthru", MACVLAN_MODE_PASSTHRU },
1181         };
1182
1183         msg = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_CREATE | NLM_F_EXCL);
1184
1185         if (!msg)
1186                 return -1;
1187
1188         nlmsg_append(msg, &iim, sizeof(iim), 0);
1189
1190         if (cfg->flags & MACVLAN_OPT_MACADDR)
1191                 nla_put(msg, IFLA_ADDRESS, sizeof(cfg->macaddr), cfg->macaddr);
1192         nla_put_string(msg, IFLA_IFNAME, macvlan->ifname);
1193         nla_put_u32(msg, IFLA_LINK, dev->ifindex);
1194
1195         if (!(linkinfo = nla_nest_start(msg, IFLA_LINKINFO)))
1196                 goto nla_put_failure;
1197
1198         nla_put_string(msg, IFLA_INFO_KIND, "macvlan");
1199
1200         if (!(data = nla_nest_start(msg, IFLA_INFO_DATA)))
1201                 goto nla_put_failure;
1202
1203         if (cfg->mode) {
1204                 for (i = 0; i < ARRAY_SIZE(modes); i++) {
1205                         if (strcmp(cfg->mode, modes[i].name) != 0)
1206                                 continue;
1207
1208                         nla_put_u32(msg, IFLA_MACVLAN_MODE, modes[i].val);
1209                         break;
1210                 }
1211         }
1212
1213         nla_nest_end(msg, data);
1214         nla_nest_end(msg, linkinfo);
1215
1216         rv = system_rtnl_call(msg);
1217         if (rv)
1218                 D(SYSTEM, "Error adding macvlan '%s' over '%s': %d\n", macvlan->ifname, dev->ifname, rv);
1219
1220         return rv;
1221
1222 nla_put_failure:
1223         nlmsg_free(msg);
1224         return -ENOMEM;
1225 }
1226
/*
 * Delete a link by name via an RTM_DELLINK request.
 *
 * Returns -1 if the message cannot be allocated, otherwise the result of
 * system_rtnl_call().
 */
static int system_link_del(const char *ifname)
{
	struct ifinfomsg iim = {
		.ifi_family = AF_UNSPEC,
		.ifi_index = 0,
	};
	struct nl_msg *req = nlmsg_alloc_simple(RTM_DELLINK, NLM_F_REQUEST);

	if (!req)
		return -1;

	/* The link is identified by name; ifi_index stays 0 */
	nlmsg_append(req, &iim, sizeof(iim), 0);
	nla_put_string(req, IFLA_IFNAME, ifname);

	return system_rtnl_call(req);
}
1244
1245 int system_macvlan_del(struct device *macvlan)
1246 {
1247         return system_link_del(macvlan->ifname);
1248 }
1249
1250 int system_veth_add(struct device *veth, struct veth_config *cfg)
1251 {
1252         struct nl_msg *msg;
1253         struct ifinfomsg empty_iim = {};
1254         struct nlattr *linkinfo, *data, *veth_info;
1255         int rv;
1256
1257         msg = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_CREATE | NLM_F_EXCL);
1258
1259         if (!msg)
1260                 return -1;
1261
1262         nlmsg_append(msg, &empty_iim, sizeof(empty_iim), 0);
1263
1264         if (cfg->flags & VETH_OPT_MACADDR)
1265                 nla_put(msg, IFLA_ADDRESS, sizeof(cfg->macaddr), cfg->macaddr);
1266         nla_put_string(msg, IFLA_IFNAME, veth->ifname);
1267
1268         if (!(linkinfo = nla_nest_start(msg, IFLA_LINKINFO)))
1269                 goto nla_put_failure;
1270
1271         nla_put_string(msg, IFLA_INFO_KIND, "veth");
1272
1273         if (!(data = nla_nest_start(msg, IFLA_INFO_DATA)))
1274                 goto nla_put_failure;
1275
1276         if (!(veth_info = nla_nest_start(msg, VETH_INFO_PEER)))
1277                 goto nla_put_failure;
1278
1279         nlmsg_append(msg, &empty_iim, sizeof(empty_iim), 0);
1280
1281         if (cfg->flags & VETH_OPT_PEER_NAME)
1282                 nla_put_string(msg, IFLA_IFNAME, cfg->peer_name);
1283         if (cfg->flags & VETH_OPT_PEER_MACADDR)
1284                 nla_put(msg, IFLA_ADDRESS, sizeof(cfg->peer_macaddr), cfg->peer_macaddr);
1285
1286         nla_nest_end(msg, veth_info);
1287         nla_nest_end(msg, data);
1288         nla_nest_end(msg, linkinfo);
1289
1290         rv = system_rtnl_call(msg);
1291         if (rv) {
1292                 if (cfg->flags & VETH_OPT_PEER_NAME)
1293                         D(SYSTEM, "Error adding veth '%s' with peer '%s': %d\n", veth->ifname, cfg->peer_name, rv);
1294                 else
1295                         D(SYSTEM, "Error adding veth '%s': %d\n", veth->ifname, rv);
1296         }
1297
1298         return rv;
1299
1300 nla_put_failure:
1301         nlmsg_free(msg);
1302         return -ENOMEM;
1303 }
1304
1305 int system_veth_del(struct device *veth)
1306 {
1307         return system_link_del(veth->ifname);
1308 }
1309
1310 static int system_vlan(struct device *dev, int id)
1311 {
1312         struct vlan_ioctl_args ifr = {
1313                 .cmd = SET_VLAN_NAME_TYPE_CMD,
1314                 .u.name_type = VLAN_NAME_TYPE_RAW_PLUS_VID_NO_PAD,
1315         };
1316
1317         if (ioctl(sock_ioctl, SIOCSIFVLAN, &ifr) < 0)
1318                 return -1;
1319
1320         if (id < 0) {
1321                 ifr.cmd = DEL_VLAN_CMD;
1322                 ifr.u.VID = 0;
1323         } else {
1324                 ifr.cmd = ADD_VLAN_CMD;
1325                 ifr.u.VID = id;
1326         }
1327         strncpy(ifr.device1, dev->ifname, sizeof(ifr.device1));
1328         return ioctl(sock_ioctl, SIOCSIFVLAN, &ifr);
1329 }
1330
/* Add VLAN @id for @dev; returns the result of system_vlan(). */
int system_vlan_add(struct device *dev, int id)
{
	int rc = system_vlan(dev, id);

	return rc;
}
1335
/* Issue the VLAN delete request for @dev (system_vlan() with a negative id). */
int system_vlan_del(struct device *dev)
{
	int rc = system_vlan(dev, -1);

	return rc;
}
1340
1341 int system_vlandev_add(struct device *vlandev, struct device *dev, struct vlandev_config *cfg)
1342 {
1343         struct nl_msg *msg;
1344         struct nlattr *linkinfo, *data;
1345         struct ifinfomsg iim = { .ifi_family = AF_UNSPEC };
1346         int rv;
1347
1348         msg = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_CREATE | NLM_F_EXCL);
1349
1350         if (!msg)
1351                 return -1;
1352
1353         nlmsg_append(msg, &iim, sizeof(iim), 0);
1354         nla_put_string(msg, IFLA_IFNAME, vlandev->ifname);
1355         nla_put_u32(msg, IFLA_LINK, dev->ifindex);
1356
1357         if (!(linkinfo = nla_nest_start(msg, IFLA_LINKINFO)))
1358                 goto nla_put_failure;
1359
1360         nla_put_string(msg, IFLA_INFO_KIND, "vlan");
1361
1362         if (!(data = nla_nest_start(msg, IFLA_INFO_DATA)))
1363                 goto nla_put_failure;
1364
1365         nla_put_u16(msg, IFLA_VLAN_ID, cfg->vid);
1366
1367 #if LINUX_VERSION_CODE >= KERNEL_VERSION(3,10,0)
1368         nla_put_u16(msg, IFLA_VLAN_PROTOCOL, htons(cfg->proto));
1369 #else
1370         if(cfg->proto == VLAN_PROTO_8021AD)
1371                 netifd_log_message(L_WARNING, "%s Your kernel is older than linux 3.10.0, 802.1ad is not supported defaulting to 802.1q", vlandev->type->name);
1372 #endif
1373
1374         nla_nest_end(msg, data);
1375         nla_nest_end(msg, linkinfo);
1376
1377         rv = system_rtnl_call(msg);
1378         if (rv)
1379                 D(SYSTEM, "Error adding vlandev '%s' over '%s': %d\n", vlandev->ifname, dev->ifname, rv);
1380
1381         return rv;
1382
1383 nla_put_failure:
1384         nlmsg_free(msg);
1385         return -ENOMEM;
1386 }
1387
1388 int system_vlandev_del(struct device *vlandev)
1389 {
1390         return system_link_del(vlandev->ifname);
1391 }
1392
1393 void
1394 system_if_get_settings(struct device *dev, struct device_settings *s)
1395 {
1396         struct ifreq ifr;
1397         char buf[10];
1398
1399         memset(&ifr, 0, sizeof(ifr));
1400         strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name) - 1);
1401
1402         if (ioctl(sock_ioctl, SIOCGIFMTU, &ifr) == 0) {
1403                 s->mtu = ifr.ifr_mtu;
1404                 s->flags |= DEV_OPT_MTU;
1405         }
1406
1407         s->mtu6 = system_update_ipv6_mtu(dev, 0);
1408         if (s->mtu6 > 0)
1409                 s->flags |= DEV_OPT_MTU6;
1410
1411         if (ioctl(sock_ioctl, SIOCGIFTXQLEN, &ifr) == 0) {
1412                 s->txqueuelen = ifr.ifr_qlen;
1413                 s->flags |= DEV_OPT_TXQUEUELEN;
1414         }
1415
1416         if (ioctl(sock_ioctl, SIOCGIFHWADDR, &ifr) == 0) {
1417                 memcpy(s->macaddr, &ifr.ifr_hwaddr.sa_data, sizeof(s->macaddr));
1418                 s->flags |= DEV_OPT_MACADDR;
1419         }
1420
1421         if (!system_get_disable_ipv6(dev, buf, sizeof(buf))) {
1422                 s->ipv6 = !strtoul(buf, NULL, 0);
1423                 s->flags |= DEV_OPT_IPV6;
1424         }
1425
1426         if (ioctl(sock_ioctl, SIOCGIFFLAGS, &ifr) == 0) {
1427                 s->promisc = ifr.ifr_flags & IFF_PROMISC;
1428                 s->flags |= DEV_OPT_PROMISC;
1429
1430                 s->multicast = ifr.ifr_flags & IFF_MULTICAST;
1431                 s->flags |= DEV_OPT_MULTICAST;
1432         }
1433
1434         if (!system_get_rpfilter(dev, buf, sizeof(buf))) {
1435                 s->rpfilter = strtoul(buf, NULL, 0);
1436                 s->flags |= DEV_OPT_RPFILTER;
1437         }
1438
1439         if (!system_get_acceptlocal(dev, buf, sizeof(buf))) {
1440                 s->acceptlocal = strtoul(buf, NULL, 0);
1441                 s->flags |= DEV_OPT_ACCEPTLOCAL;
1442         }
1443
1444         if (!system_get_igmpversion(dev, buf, sizeof(buf))) {
1445                 s->igmpversion = strtoul(buf, NULL, 0);
1446                 s->flags |= DEV_OPT_IGMPVERSION;
1447         }
1448
1449         if (!system_get_mldversion(dev, buf, sizeof(buf))) {
1450                 s->mldversion = strtoul(buf, NULL, 0);
1451                 s->flags |= DEV_OPT_MLDVERSION;
1452         }
1453
1454         if (!system_get_neigh4reachabletime(dev, buf, sizeof(buf))) {
1455                 s->neigh4reachabletime = strtoul(buf, NULL, 0);
1456                 s->flags |= DEV_OPT_NEIGHREACHABLETIME;
1457         }
1458
1459         if (!system_get_neigh6reachabletime(dev, buf, sizeof(buf))) {
1460                 s->neigh6reachabletime = strtoul(buf, NULL, 0);
1461                 s->flags |= DEV_OPT_NEIGHREACHABLETIME;
1462         }
1463
1464         if (!system_get_neigh4locktime(dev, buf, sizeof(buf))) {
1465                 s->neigh4locktime = strtol(buf, NULL, 0);
1466                 s->flags |= DEV_OPT_NEIGHLOCKTIME;
1467         }
1468
1469         if (!system_get_neigh4gcstaletime(dev, buf, sizeof(buf))) {
1470                 s->neigh4gcstaletime = strtoul(buf, NULL, 0);
1471                 s->flags |= DEV_OPT_NEIGHGCSTALETIME;
1472         }
1473
1474         if (!system_get_neigh6gcstaletime(dev, buf, sizeof(buf))) {
1475                 s->neigh6gcstaletime = strtoul(buf, NULL, 0);
1476                 s->flags |= DEV_OPT_NEIGHGCSTALETIME;
1477         }
1478
1479         if (!system_get_dadtransmits(dev, buf, sizeof(buf))) {
1480                 s->dadtransmits = strtoul(buf, NULL, 0);
1481                 s->flags |= DEV_OPT_DADTRANSMITS;
1482         }
1483
1484         if (!system_get_sendredirects(dev, buf, sizeof(buf))) {
1485                 s->sendredirects = strtoul(buf, NULL, 0);
1486                 s->flags |= DEV_OPT_SENDREDIRECTS;
1487         }
1488 }
1489
1490 void
1491 system_if_apply_settings(struct device *dev, struct device_settings *s, unsigned int apply_mask)
1492 {
1493         struct ifreq ifr;
1494         char buf[12];
1495
1496         memset(&ifr, 0, sizeof(ifr));
1497         strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name) - 1);
1498         if (s->flags & DEV_OPT_MTU & apply_mask) {
1499                 ifr.ifr_mtu = s->mtu;
1500                 if (ioctl(sock_ioctl, SIOCSIFMTU, &ifr) < 0)
1501                         s->flags &= ~DEV_OPT_MTU;
1502         }
1503         if (s->flags & DEV_OPT_MTU6 & apply_mask) {
1504                 system_update_ipv6_mtu(dev, s->mtu6);
1505         }
1506         if (s->flags & DEV_OPT_TXQUEUELEN & apply_mask) {
1507                 ifr.ifr_qlen = s->txqueuelen;
1508                 if (ioctl(sock_ioctl, SIOCSIFTXQLEN, &ifr) < 0)
1509                         s->flags &= ~DEV_OPT_TXQUEUELEN;
1510         }
1511         if ((s->flags & DEV_OPT_MACADDR & apply_mask) && !dev->external) {
1512                 ifr.ifr_hwaddr.sa_family = ARPHRD_ETHER;
1513                 memcpy(&ifr.ifr_hwaddr.sa_data, s->macaddr, sizeof(s->macaddr));
1514                 if (ioctl(sock_ioctl, SIOCSIFHWADDR, &ifr) < 0)
1515                         s->flags &= ~DEV_OPT_MACADDR;
1516         }
1517         if (s->flags & DEV_OPT_IPV6 & apply_mask)
1518                 system_set_disable_ipv6(dev, s->ipv6 ? "0" : "1");
1519         if (s->flags & DEV_OPT_PROMISC & apply_mask) {
1520                 if (system_if_flags(dev->ifname, s->promisc ? IFF_PROMISC : 0,
1521                                     !s->promisc ? IFF_PROMISC : 0) < 0)
1522                         s->flags &= ~DEV_OPT_PROMISC;
1523         }
1524         if (s->flags & DEV_OPT_RPFILTER & apply_mask) {
1525                 snprintf(buf, sizeof(buf), "%u", s->rpfilter);
1526                 system_set_rpfilter(dev, buf);
1527         }
1528         if (s->flags & DEV_OPT_ACCEPTLOCAL & apply_mask)
1529                 system_set_acceptlocal(dev, s->acceptlocal ? "1" : "0");
1530         if (s->flags & DEV_OPT_IGMPVERSION & apply_mask) {
1531                 snprintf(buf, sizeof(buf), "%u", s->igmpversion);
1532                 system_set_igmpversion(dev, buf);
1533         }
1534         if (s->flags & DEV_OPT_MLDVERSION & apply_mask) {
1535                 snprintf(buf, sizeof(buf), "%u", s->mldversion);
1536                 system_set_mldversion(dev, buf);
1537         }
1538         if (s->flags & DEV_OPT_NEIGHREACHABLETIME & apply_mask) {
1539                 snprintf(buf, sizeof(buf), "%u", s->neigh4reachabletime);
1540                 system_set_neigh4reachabletime(dev, buf);
1541                 snprintf(buf, sizeof(buf), "%u", s->neigh6reachabletime);
1542                 system_set_neigh6reachabletime(dev, buf);
1543         }
1544         if (s->flags & DEV_OPT_NEIGHLOCKTIME & apply_mask) {
1545                 snprintf(buf, sizeof(buf), "%d", s->neigh4locktime);
1546                 system_set_neigh4locktime(dev, buf);
1547         }
1548         if (s->flags & DEV_OPT_NEIGHGCSTALETIME & apply_mask) {
1549                 snprintf(buf, sizeof(buf), "%u", s->neigh4gcstaletime);
1550                 system_set_neigh4gcstaletime(dev, buf);
1551                 snprintf(buf, sizeof(buf), "%u", s->neigh6gcstaletime);
1552                 system_set_neigh6gcstaletime(dev, buf);
1553         }
1554         if (s->flags & DEV_OPT_DADTRANSMITS & apply_mask) {
1555                 snprintf(buf, sizeof(buf), "%u", s->dadtransmits);
1556                 system_set_dadtransmits(dev, buf);
1557         }
1558         if (s->flags & DEV_OPT_MULTICAST & apply_mask) {
1559                 if (system_if_flags(dev->ifname, s->multicast ? IFF_MULTICAST : 0,
1560                                     !s->multicast ? IFF_MULTICAST : 0) < 0)
1561                         s->flags &= ~DEV_OPT_MULTICAST;
1562         }
1563         if (s->flags & DEV_OPT_SENDREDIRECTS & apply_mask)
1564                 system_set_sendredirects(dev, s->sendredirects ? "1" : "0");
1565 }
1566
1567 int system_if_up(struct device *dev)
1568 {
1569         system_if_get_settings(dev, &dev->orig_settings);
1570         /* Only keep orig settings based on what needs to be set */
1571         dev->orig_settings.valid_flags = dev->orig_settings.flags;
1572         dev->orig_settings.flags &= dev->settings.flags;
1573         system_if_apply_settings(dev, &dev->settings, dev->settings.flags);
1574         return system_if_flags(dev->ifname, IFF_UP, 0);
1575 }
1576
1577 int system_if_down(struct device *dev)
1578 {
1579         int ret = system_if_flags(dev->ifname, 0, IFF_UP);
1580         system_if_apply_settings(dev, &dev->orig_settings, dev->orig_settings.flags);
1581         return ret;
1582 }
1583
/* State shared between system_if_check() and its netlink callbacks */
struct if_check_data {
	struct device *dev;	/* device whose presence/link state is updated */
	int pending;		/* > 0 while waiting; 0 on ACK, error code on failure */
	int ret;		/* not referenced by the callbacks in this part of the file */
};
1589
1590 #ifndef IFF_LOWER_UP
1591 #define IFF_LOWER_UP    0x10000
1592 #endif
1593
1594 static int cb_if_check_valid(struct nl_msg *msg, void *arg)
1595 {
1596         struct nlmsghdr *nh = nlmsg_hdr(msg);
1597         struct ifinfomsg *ifi = NLMSG_DATA(nh);
1598         struct if_check_data *chk = (struct if_check_data *)arg;
1599
1600         if (nh->nlmsg_type != RTM_NEWLINK)
1601                 return NL_SKIP;
1602
1603         device_set_present(chk->dev, ifi->ifi_index > 0 ? true : false);
1604         device_set_link(chk->dev, ifi->ifi_flags & IFF_LOWER_UP ? true : false);
1605
1606         return NL_OK;
1607 }
1608
1609 static int cb_if_check_ack(struct nl_msg *msg, void *arg)
1610 {
1611         struct if_check_data *chk = (struct if_check_data *)arg;
1612         chk->pending = 0;
1613         return NL_STOP;
1614 }
1615
1616 static int cb_if_check_error(struct sockaddr_nl *nla, struct nlmsgerr *err, void *arg)
1617 {
1618         struct if_check_data *chk = (struct if_check_data *)arg;
1619
1620         device_set_present(chk->dev, false);
1621         device_set_link(chk->dev, false);
1622         chk->pending = err->error;
1623
1624         return NL_STOP;
1625 }
1626
1627 int system_if_check(struct device *dev)
1628 {
1629         struct nl_cb *cb = nl_cb_alloc(NL_CB_DEFAULT);
1630         struct nl_msg *msg;
1631         struct ifinfomsg ifi = {
1632                 .ifi_family = AF_UNSPEC,
1633                 .ifi_index = 0,
1634         };
1635         struct if_check_data chk = {
1636                 .dev = dev,
1637                 .pending = 1,
1638         };
1639         int ret = 1;
1640
1641         if (!cb)
1642                 return ret;
1643
1644         msg = nlmsg_alloc_simple(RTM_GETLINK, 0);
1645         if (!msg)
1646                 goto out;
1647
1648         if (nlmsg_append(msg, &ifi, sizeof(ifi), 0) ||
1649             nla_put_string(msg, IFLA_IFNAME, dev->ifname))
1650                 goto free;
1651
1652         nl_cb_set(cb, NL_CB_VALID, NL_CB_CUSTOM, cb_if_check_valid, &chk);
1653         nl_cb_set(cb, NL_CB_ACK, NL_CB_CUSTOM, cb_if_check_ack, &chk);
1654         nl_cb_err(cb, NL_CB_CUSTOM, cb_if_check_error, &chk);
1655
1656         nl_send_auto_complete(sock_rtnl, msg);
1657         while (chk.pending > 0)
1658                 nl_recvmsgs(sock_rtnl, cb);
1659
1660         ret = chk.pending;
1661
1662 free:
1663         nlmsg_free(msg);
1664 out:
1665         nl_cb_put(cb);
1666         return ret;
1667 }
1668
1669 struct device *
1670 system_if_get_parent(struct device *dev)
1671 {
1672         char buf[64], *devname;
1673         int ifindex, iflink, len;
1674         FILE *f;
1675
1676         snprintf(buf, sizeof(buf), "/sys/class/net/%s/iflink", dev->ifname);
1677         f = fopen(buf, "r");
1678         if (!f)
1679                 return NULL;
1680
1681         len = fread(buf, 1, sizeof(buf) - 1, f);
1682         fclose(f);
1683
1684         if (len <= 0)
1685                 return NULL;
1686
1687         buf[len] = 0;
1688         iflink = strtoul(buf, NULL, 0);
1689         ifindex = system_if_resolve(dev);
1690         if (!iflink || iflink == ifindex)
1691                 return NULL;
1692
1693         devname = if_indextoname(iflink, buf);
1694         if (!devname)
1695                 return NULL;
1696
1697         return device_get(devname, true);
1698 }
1699
/*
 * Read the first line of a file into a caller supplied buffer.
 *
 * @dir_fd: directory file descriptor that @file is resolved against
 * @file:   file name passed to openat()
 * @buf:    destination buffer
 * @len:    size of @buf in bytes, including room for the terminator
 *
 * At most len - 1 bytes are read with a single read(); the result is
 * NUL-terminated and cut at the first newline.
 *
 * Returns true if at least one byte was read, false if @len is too small to
 * hold any data, the file cannot be opened, is empty or cannot be read.
 */
static bool
read_string_file(int dir_fd, const char *file, char *buf, int len)
{
	bool ret = false;
	ssize_t nread;
	char *c;
	int fd;

	/* Need room for at least one data byte plus the terminator */
	if (len < 2)
		return false;

	fd = openat(dir_fd, file, O_RDONLY);
	if (fd < 0)
		return false;

	/* Keep the read result separate from len so that a retry after
	 * EINTR asks for the same number of bytes again */
	do {
		nread = read(fd, buf, len - 1);
	} while (nread < 0 && errno == EINTR);

	if (nread > 0) {
		buf[nread] = 0;

		c = strchr(buf, '\n');
		if (c)
			*c = 0;

		ret = true;
	}

	close(fd);

	return ret;
}
1730
/*
 * Read a file through read_string_file() and parse its content as an
 * unsigned 64-bit number (base auto-detected by strtoull()).
 *
 * *val is only written when the file could be read. Returns whether the
 * read succeeded; the parse itself is not validated.
 */
static bool
read_uint64_file(int dir_fd, const char *file, uint64_t *val)
{
	char text[64];

	if (!read_string_file(dir_fd, file, text, sizeof(text)))
		return false;

	*val = strtoull(text, NULL, 0);

	return true;
}
1743
/*
 * Display names for ethtool link mode bits.
 *
 * Only the ADVERTISED_* constants are listed; they are assumed to use the
 * same bit positions as the corresponding "supported" flags.
 */
static const struct {
	uint32_t mask;
	const char *name;
} ethtool_link_modes[] = {
	{ .mask = ADVERTISED_10baseT_Half,       .name = "10baseT-H" },
	{ .mask = ADVERTISED_10baseT_Full,       .name = "10baseT-F" },
	{ .mask = ADVERTISED_100baseT_Half,      .name = "100baseT-H" },
	{ .mask = ADVERTISED_100baseT_Full,      .name = "100baseT-F" },
	{ .mask = ADVERTISED_1000baseT_Half,     .name = "1000baseT-H" },
	{ .mask = ADVERTISED_1000baseT_Full,     .name = "1000baseT-F" },
	{ .mask = ADVERTISED_1000baseKX_Full,    .name = "1000baseKX-F" },
	{ .mask = ADVERTISED_2500baseX_Full,     .name = "2500baseX-F" },
	{ .mask = ADVERTISED_10000baseT_Full,    .name = "10000baseT-F" },
	{ .mask = ADVERTISED_10000baseKX4_Full,  .name = "10000baseKX4-F" },
	{ .mask = ADVERTISED_10000baseKR_Full,   .name = "10000baseKR-F" },
	{ .mask = ADVERTISED_20000baseMLD2_Full, .name = "20000baseMLD2-F" },
	{ .mask = ADVERTISED_20000baseKR2_Full,  .name = "20000baseKR2-F" },
	{ .mask = ADVERTISED_40000baseKR4_Full,  .name = "40000baseKR4-F" },
	{ .mask = ADVERTISED_40000baseCR4_Full,  .name = "40000baseCR4-F" },
	{ .mask = ADVERTISED_40000baseSR4_Full,  .name = "40000baseSR4-F" },
	{ .mask = ADVERTISED_40000baseLR4_Full,  .name = "40000baseLR4-F" },
#ifdef ADVERTISED_56000baseKR4_Full
	{ .mask = ADVERTISED_56000baseKR4_Full,  .name = "56000baseKR4-F" },
	{ .mask = ADVERTISED_56000baseCR4_Full,  .name = "56000baseCR4-F" },
	{ .mask = ADVERTISED_56000baseSR4_Full,  .name = "56000baseSR4-F" },
	{ .mask = ADVERTISED_56000baseLR4_Full,  .name = "56000baseLR4-F" },
#endif
};
1773
1774 static void system_add_link_modes(struct blob_buf *b, __u32 mask)
1775 {
1776         int i;
1777         for (i = 0; i < ARRAY_SIZE(ethtool_link_modes); i++) {
1778                 if (mask & ethtool_link_modes[i].mask)
1779                         blobmsg_add_string(b, NULL, ethtool_link_modes[i].name);
1780         }
1781 }
1782
/*
 * Report whether /sys/class/net/<ifname>/phy80211 exists, i.e. whether
 * stat() on that path succeeds.
 */
bool
system_if_force_external(const char *ifname)
{
	struct stat st;
	char path[64];

	snprintf(path, sizeof(path), "/sys/class/net/%s/phy80211", ifname);
	if (stat(path, &st) != 0)
		return false;

	return true;
}
1792
1793 int
1794 system_if_dump_info(struct device *dev, struct blob_buf *b)
1795 {
1796         struct ethtool_cmd ecmd;
1797         struct ifreq ifr;
1798         char *s;
1799         void *c;
1800
1801         memset(&ecmd, 0, sizeof(ecmd));
1802         memset(&ifr, 0, sizeof(ifr));
1803         strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name) - 1);
1804         ifr.ifr_data = (caddr_t) &ecmd;
1805         ecmd.cmd = ETHTOOL_GSET;
1806
1807         if (ioctl(sock_ioctl, SIOCETHTOOL, &ifr) == 0) {
1808                 c = blobmsg_open_array(b, "link-advertising");
1809                 system_add_link_modes(b, ecmd.advertising);
1810                 blobmsg_close_array(b, c);
1811
1812                 c = blobmsg_open_array(b, "link-partner-advertising");
1813                 system_add_link_modes(b, ecmd.lp_advertising);
1814                 blobmsg_close_array(b, c);
1815
1816                 c = blobmsg_open_array(b, "link-supported");
1817                 system_add_link_modes(b, ecmd.supported);
1818                 blobmsg_close_array(b, c);
1819
1820                 s = blobmsg_alloc_string_buffer(b, "speed", 8);
1821                 snprintf(s, 8, "%d%c", ethtool_cmd_speed(&ecmd),
1822                         ecmd.duplex == DUPLEX_HALF ? 'H' : 'F');
1823                 blobmsg_add_string_buffer(b);
1824
1825                 blobmsg_add_u8(b, "autoneg", !!ecmd.autoneg);
1826         }
1827
1828         return 0;
1829 }
1830
1831 int
1832 system_if_dump_stats(struct device *dev, struct blob_buf *b)
1833 {
1834         const char *const counters[] = {
1835                 "collisions",     "rx_frame_errors",   "tx_compressed",
1836                 "multicast",      "rx_length_errors",  "tx_dropped",
1837                 "rx_bytes",       "rx_missed_errors",  "tx_errors",
1838                 "rx_compressed",  "rx_over_errors",    "tx_fifo_errors",
1839                 "rx_crc_errors",  "rx_packets",        "tx_heartbeat_errors",
1840                 "rx_dropped",     "tx_aborted_errors", "tx_packets",
1841                 "rx_errors",      "tx_bytes",          "tx_window_errors",
1842                 "rx_fifo_errors", "tx_carrier_errors",
1843         };
1844         char buf[64];
1845         int stats_dir;
1846         int i;
1847         uint64_t val = 0;
1848
1849         snprintf(buf, sizeof(buf), "/sys/class/net/%s/statistics", dev->ifname);
1850         stats_dir = open(buf, O_DIRECTORY);
1851         if (stats_dir < 0)
1852                 return -1;
1853
1854         for (i = 0; i < ARRAY_SIZE(counters); i++)
1855                 if (read_uint64_file(stats_dir, counters[i], &val))
1856                         blobmsg_add_u64(b, counters[i], val);
1857
1858         close(stats_dir);
1859         return 0;
1860 }
1861
1862 static int system_addr(struct device *dev, struct device_addr *addr, int cmd)
1863 {
1864         bool v4 = ((addr->flags & DEVADDR_FAMILY) == DEVADDR_INET4);
1865         int alen = v4 ? 4 : 16;
1866         unsigned int flags = 0;
1867         struct ifaddrmsg ifa = {
1868                 .ifa_family = (alen == 4) ? AF_INET : AF_INET6,
1869                 .ifa_prefixlen = addr->mask,
1870                 .ifa_index = dev->ifindex,
1871         };
1872
1873         struct nl_msg *msg;
1874         if (cmd == RTM_NEWADDR)
1875                 flags |= NLM_F_CREATE | NLM_F_REPLACE;
1876
1877         msg = nlmsg_alloc_simple(cmd, flags);
1878         if (!msg)
1879                 return -1;
1880
1881         nlmsg_append(msg, &ifa, sizeof(ifa), 0);
1882         nla_put(msg, IFA_LOCAL, alen, &addr->addr);
1883         if (v4) {
1884                 if (addr->broadcast)
1885                         nla_put_u32(msg, IFA_BROADCAST, addr->broadcast);
1886                 if (addr->point_to_point)
1887                         nla_put_u32(msg, IFA_ADDRESS, addr->point_to_point);
1888         } else {
1889                 time_t now = system_get_rtime();
1890                 struct ifa_cacheinfo cinfo = {0xffffffffU, 0xffffffffU, 0, 0};
1891
1892                 if (addr->preferred_until) {
1893                         int64_t preferred = addr->preferred_until - now;
1894                         if (preferred < 0)
1895                                 preferred = 0;
1896                         else if (preferred > UINT32_MAX)
1897                                 preferred = UINT32_MAX;
1898
1899                         cinfo.ifa_prefered = preferred;
1900                 }
1901
1902                 if (addr->valid_until) {
1903                         int64_t valid = addr->valid_until - now;
1904                         if (valid <= 0) {
1905                                 nlmsg_free(msg);
1906                                 return -1;
1907                         }
1908                         else if (valid > UINT32_MAX)
1909                                 valid = UINT32_MAX;
1910
1911                         cinfo.ifa_valid = valid;
1912                 }
1913
1914                 nla_put(msg, IFA_CACHEINFO, sizeof(cinfo), &cinfo);
1915
1916                 if (cmd == RTM_NEWADDR && (addr->flags & DEVADDR_OFFLINK))
1917                         nla_put_u32(msg, IFA_FLAGS, IFA_F_NOPREFIXROUTE);
1918         }
1919
1920         return system_rtnl_call(msg);
1921 }
1922
/* Submit @addr on @dev through system_addr() as an RTM_NEWADDR request. */
int system_add_address(struct device *dev, struct device_addr *addr)
{
	const int cmd = RTM_NEWADDR;

	return system_addr(dev, addr, cmd);
}
1927
/* Submit @addr on @dev through system_addr() as an RTM_DELADDR request. */
int system_del_address(struct device *dev, struct device_addr *addr)
{
	const int cmd = RTM_DELADDR;

	return system_addr(dev, addr, cmd);
}
1932
1933 static int system_rt(struct device *dev, struct device_route *route, int cmd)
1934 {
1935         int alen = ((route->flags & DEVADDR_FAMILY) == DEVADDR_INET4) ? 4 : 16;
1936         bool have_gw;
1937         unsigned int flags = 0;
1938
1939         if (alen == 4)
1940                 have_gw = !!route->nexthop.in.s_addr;
1941         else
1942                 have_gw = route->nexthop.in6.s6_addr32[0] ||
1943                         route->nexthop.in6.s6_addr32[1] ||
1944                         route->nexthop.in6.s6_addr32[2] ||
1945                         route->nexthop.in6.s6_addr32[3];
1946
1947         unsigned int table = (route->flags & (DEVROUTE_TABLE | DEVROUTE_SRCTABLE))
1948                         ? route->table : RT_TABLE_MAIN;
1949
1950         struct rtmsg rtm = {
1951                 .rtm_family = (alen == 4) ? AF_INET : AF_INET6,
1952                 .rtm_dst_len = route->mask,
1953                 .rtm_src_len = route->sourcemask,
1954                 .rtm_table = (table < 256) ? table : RT_TABLE_UNSPEC,
1955                 .rtm_protocol = (route->flags & DEVROUTE_PROTO) ? route->proto : RTPROT_STATIC,
1956                 .rtm_scope = RT_SCOPE_NOWHERE,
1957                 .rtm_type = (cmd == RTM_DELROUTE) ? 0: RTN_UNICAST,
1958                 .rtm_flags = (route->flags & DEVROUTE_ONLINK) ? RTNH_F_ONLINK : 0,
1959         };
1960         struct nl_msg *msg;
1961
1962         if (cmd == RTM_NEWROUTE) {
1963                 flags |= NLM_F_CREATE | NLM_F_REPLACE;
1964
1965                 if (!dev) { /* Add null-route */
1966                         rtm.rtm_scope = RT_SCOPE_UNIVERSE;
1967                         rtm.rtm_type = RTN_UNREACHABLE;
1968                 }
1969                 else
1970                         rtm.rtm_scope = (have_gw) ? RT_SCOPE_UNIVERSE : RT_SCOPE_LINK;
1971         }
1972
1973         if (route->flags & DEVROUTE_TYPE) {
1974                 rtm.rtm_type = route->type;
1975                 if (!(route->flags & (DEVROUTE_TABLE | DEVROUTE_SRCTABLE))) {
1976                         if (rtm.rtm_type == RTN_LOCAL || rtm.rtm_type == RTN_BROADCAST ||
1977                             rtm.rtm_type == RTN_NAT || rtm.rtm_type == RTN_ANYCAST)
1978                                 rtm.rtm_table = RT_TABLE_LOCAL;
1979                 }
1980
1981                 if (rtm.rtm_type == RTN_LOCAL || rtm.rtm_type == RTN_NAT) {
1982                         rtm.rtm_scope = RT_SCOPE_HOST;
1983                 } else if (rtm.rtm_type == RTN_BROADCAST || rtm.rtm_type == RTN_MULTICAST ||
1984                                 rtm.rtm_type == RTN_ANYCAST) {
1985                         rtm.rtm_scope = RT_SCOPE_LINK;
1986                 } else if (rtm.rtm_type == RTN_BLACKHOLE || rtm.rtm_type == RTN_UNREACHABLE ||
1987                                 rtm.rtm_type == RTN_PROHIBIT || rtm.rtm_type == RTN_FAILED_POLICY ||
1988                                 rtm.rtm_type == RTN_THROW) {
1989                         rtm.rtm_scope = RT_SCOPE_UNIVERSE;
1990                         dev = NULL;
1991                 }
1992         }
1993
1994         msg = nlmsg_alloc_simple(cmd, flags);
1995         if (!msg)
1996                 return -1;
1997
1998         nlmsg_append(msg, &rtm, sizeof(rtm), 0);
1999
2000         if (route->mask)
2001                 nla_put(msg, RTA_DST, alen, &route->addr);
2002
2003         if (route->sourcemask) {
2004                 if (rtm.rtm_family == AF_INET)
2005                         nla_put(msg, RTA_PREFSRC, alen, &route->source);
2006                 else
2007                         nla_put(msg, RTA_SRC, alen, &route->source);
2008         }
2009
2010         if (route->metric > 0)
2011                 nla_put_u32(msg, RTA_PRIORITY, route->metric);
2012
2013         if (have_gw)
2014                 nla_put(msg, RTA_GATEWAY, alen, &route->nexthop);
2015
2016         if (dev)
2017                 nla_put_u32(msg, RTA_OIF, dev->ifindex);
2018
2019         if (table >= 256)
2020                 nla_put_u32(msg, RTA_TABLE, table);
2021
2022         if (route->flags & DEVROUTE_MTU) {
2023                 struct nlattr *metrics;
2024
2025                 if (!(metrics = nla_nest_start(msg, RTA_METRICS)))
2026                         goto nla_put_failure;
2027
2028                 nla_put_u32(msg, RTAX_MTU, route->mtu);
2029
2030                 nla_nest_end(msg, metrics);
2031         }
2032
2033         return system_rtnl_call(msg);
2034
2035 nla_put_failure:
2036         nlmsg_free(msg);
2037         return -ENOMEM;
2038 }
2039
/* Submit @route on @dev through system_rt() as an RTM_NEWROUTE request. */
int system_add_route(struct device *dev, struct device_route *route)
{
	const int cmd = RTM_NEWROUTE;

	return system_rt(dev, route, cmd);
}
2044
/* Submit @route on @dev through system_rt() as an RTM_DELROUTE request. */
int system_del_route(struct device *dev, struct device_route *route)
{
	const int cmd = RTM_DELROUTE;

	return system_rt(dev, route, cmd);
}
2049
/*
 * Write "-1" to the IPv4 and IPv6 route flush files under /proc/sys/net.
 *
 * This is best effort: a file that cannot be opened is skipped and the
 * result of the write is ignored.  Always returns 0.
 */
int system_flush_routes(void)
{
	static const char *const flush_paths[] = {
		"/proc/sys/net/ipv4/route/flush",
		"/proc/sys/net/ipv6/route/flush"
	};
	int idx;

	for (idx = 0; idx < ARRAY_SIZE(flush_paths); idx++) {
		int fd = open(flush_paths[idx], O_WRONLY);

		if (fd >= 0) {
			/* empty body: the write result is deliberately discarded */
			if (write(fd, "-1", 2)) {}
			close(fd);
		}
	}

	return 0;
}
2068
/* Resolve the route type @type into *@id by delegating to system_rtn_aton(). */
bool system_resolve_rt_type(const char *type, unsigned int *id)
{
	bool resolved = system_rtn_aton(type, id);

	return resolved;
}
2073
/*
 * Resolve a routing protocol identifier.
 *
 * @type may be a number (any base accepted by strtoul() with base 0), one
 * of the built-in names "unspec", "kernel", "boot" and "static", or a name
 * listed in the second column of /etc/iproute2/rt_protos.
 *
 * Returns true and stores the protocol (0..255) in *@id on success.
 * Returns false and leaves *@id untouched when @type cannot be resolved or
 * the resulting value does not fit into 0..255.
 */
bool system_resolve_rt_proto(const char *type, unsigned int *id)
{
	FILE *f;
	char *e, buf[128];
	unsigned long n;
	unsigned int proto = 256;

	/*
	 * Keep the parsed value in an unsigned long until it has been range
	 * checked: narrowing it to unsigned int first would let values such as
	 * 4294967297 wrap around to a seemingly valid protocol number.
	 */
	n = strtoul(type, &e, 0);
	if (!*e && e != type) {
		if (n <= 255)
			proto = n;
	}
	else if (!strcmp(type, "unspec"))
		proto = RTPROT_UNSPEC;
	else if (!strcmp(type, "kernel"))
		proto = RTPROT_KERNEL;
	else if (!strcmp(type, "boot"))
		proto = RTPROT_BOOT;
	else if (!strcmp(type, "static"))
		proto = RTPROT_STATIC;
	else if ((f = fopen("/etc/iproute2/rt_protos", "r")) != NULL) {
		/* fgets() already reserves room for the terminating NUL */
		while (fgets(buf, sizeof(buf), f) != NULL) {
			/* skip empty lines and comments */
			if ((e = strtok(buf, " \t\n")) == NULL || *e == '#')
				continue;

			/* first column: number, second column: name */
			n = strtoul(e, NULL, 10);
			e = strtok(NULL, " \t\n");

			if (e && !strcmp(e, type)) {
				if (n <= 255)
					proto = n;
				break;
			}
		}
		fclose(f);
	}

	if (proto > 255)
		return false;

	*id = proto;
	return true;
}
2112
/*
 * Resolve a routing table identifier.
 *
 * @name may be a non-zero number (any base accepted by strtoul() with base
 * 0), one of the aliases "default", "main" and "local", or a name listed in
 * the second column of /etc/iproute2/rt_tables.
 *
 * Returns true and stores the table id in *@id on success.  Returns false
 * and leaves *@id untouched when the name resolves to nothing or to
 * RT_TABLE_UNSPEC.
 */
bool system_resolve_rt_table(const char *name, unsigned int *id)
{
	FILE *f;
	char *e, buf[128];
	unsigned long n;
	unsigned int table = RT_TABLE_UNSPEC;

	/*
	 * first try to parse table as number; a value that does not survive
	 * narrowing to unsigned int (e.g. 4294967297 on 64 bit) is not treated
	 * as a number instead of silently wrapping to another table
	 */
	n = strtoul(name, &e, 0);
	if (n > 0 && !*e && n == (unsigned int) n)
		table = n;

	/* handle well known aliases */
	else if (!strcmp(name, "default"))
		table = RT_TABLE_DEFAULT;
	else if (!strcmp(name, "main"))
		table = RT_TABLE_MAIN;
	else if (!strcmp(name, "local"))
		table = RT_TABLE_LOCAL;

	/* try to look up name in /etc/iproute2/rt_tables */
	else if ((f = fopen("/etc/iproute2/rt_tables", "r")) != NULL)
	{
		/* fgets() already reserves room for the terminating NUL */
		while (fgets(buf, sizeof(buf), f) != NULL)
		{
			/* skip empty lines and comments */
			if ((e = strtok(buf, " \t\n")) == NULL || *e == '#')
				continue;

			/* first column: number, second column: name */
			n = strtoul(e, NULL, 10);
			e = strtok(NULL, " \t\n");

			if (e && !strcmp(e, name))
			{
				/* ignore ids that do not fit into unsigned int */
				if (n == (unsigned int) n)
					table = n;
				break;
			}
		}

		fclose(f);
	}

	if (table == RT_TABLE_UNSPEC)
		return false;

	*id = table;
	return true;
}
2158
/* Report whether @id is the main routing table (RT_TABLE_MAIN). */
bool system_is_default_rt_table(unsigned int id)
{
	if (id != RT_TABLE_MAIN)
		return false;

	return true;
}
2163
/*
 * Resolve a reverse path filter setting.
 *
 * @filter may be "strict" (1), "loose" (2) or a number in the range 0..2
 * (any base accepted by strtoul() with base 0).
 *
 * Returns true and stores the value in *@id on success; returns false and
 * leaves *@id untouched for anything else.
 */
bool system_resolve_rpfilter(const char *filter, unsigned int *id)
{
	char *e;
	unsigned long n;

	if (!strcmp(filter, "strict"))
		n = 1;
	else if (!strcmp(filter, "loose"))
		n = 2;
	else {
		/*
		 * Range-check the full unsigned long: narrowing to unsigned int
		 * before the comparison would accept inputs such as 4294967296
		 * or -4294967295, which wrap around to 0 and 1 on 64 bit.
		 */
		n = strtoul(filter, &e, 0);
		if (*e || e == filter || n > 2)
			return false;
	}

	*id = n;
	return true;
}
2182
2183 static int system_iprule(struct iprule *rule, int cmd)
2184 {
2185         int alen = ((rule->flags & IPRULE_FAMILY) == IPRULE_INET4) ? 4 : 16;
2186
2187         struct nl_msg *msg;
2188         struct rtmsg rtm = {
2189                 .rtm_family = (alen == 4) ? AF_INET : AF_INET6,
2190                 .rtm_protocol = RTPROT_STATIC,
2191                 .rtm_scope = RT_SCOPE_UNIVERSE,
2192                 .rtm_table = RT_TABLE_UNSPEC,
2193                 .rtm_type = RTN_UNSPEC,
2194                 .rtm_flags = 0,
2195         };
2196
2197         if (cmd == RTM_NEWRULE)
2198                 rtm.rtm_type = RTN_UNICAST;
2199
2200         if (rule->invert)
2201                 rtm.rtm_flags |= FIB_RULE_INVERT;
2202
2203         if (rule->flags & IPRULE_SRC)
2204                 rtm.rtm_src_len = rule->src_mask;
2205
2206         if (rule->flags & IPRULE_DEST)
2207                 rtm.rtm_dst_len = rule->dest_mask;
2208
2209         if (rule->flags & IPRULE_TOS)
2210                 rtm.rtm_tos = rule->tos;
2211
2212         if (rule->flags & IPRULE_LOOKUP) {
2213                 if (rule->lookup < 256)
2214                         rtm.rtm_table = rule->lookup;
2215         }
2216
2217         if (rule->flags & IPRULE_ACTION)
2218                 rtm.rtm_type = rule->action;
2219         else if (rule->flags & IPRULE_GOTO)
2220                 rtm.rtm_type = FR_ACT_GOTO;
2221         else if (!(rule->flags & (IPRULE_LOOKUP | IPRULE_ACTION | IPRULE_GOTO)))
2222                 rtm.rtm_type = FR_ACT_NOP;
2223
2224         msg = nlmsg_alloc_simple(cmd, NLM_F_REQUEST);
2225
2226         if (!msg)
2227                 return -1;
2228
2229         nlmsg_append(msg, &rtm, sizeof(rtm), 0);
2230
2231         if (rule->flags & IPRULE_IN)
2232                 nla_put(msg, FRA_IFNAME, strlen(rule->in_dev) + 1, rule->in_dev);
2233
2234         if (rule->flags & IPRULE_OUT)
2235                 nla_put(msg, FRA_OIFNAME, strlen(rule->out_dev) + 1, rule->out_dev);
2236
2237         if (rule->flags & IPRULE_SRC)
2238                 nla_put(msg, FRA_SRC, alen, &rule->src_addr);
2239
2240         if (rule->flags & IPRULE_DEST)
2241                 nla_put(msg, FRA_DST, alen, &rule->dest_addr);
2242
2243         if (rule->flags & IPRULE_PRIORITY)
2244                 nla_put_u32(msg, FRA_PRIORITY, rule->priority);
2245         else if (cmd == RTM_NEWRULE)
2246                 nla_put_u32(msg, FRA_PRIORITY, rule->order);
2247
2248         if (rule->flags & IPRULE_FWMARK)
2249                 nla_put_u32(msg, FRA_FWMARK, rule->fwmark);
2250
2251         if (rule->flags & IPRULE_FWMASK)
2252                 nla_put_u32(msg, FRA_FWMASK, rule->fwmask);
2253
2254         if (rule->flags & IPRULE_LOOKUP) {
2255                 if (rule->lookup >= 256)
2256                         nla_put_u32(msg, FRA_TABLE, rule->lookup);
2257         }
2258
2259         if (rule->flags & IPRULE_SUP_PREFIXLEN)
2260                 nla_put_u32(msg, FRA_SUPPRESS_PREFIXLEN, rule->sup_prefixlen);
2261
2262         if (rule->flags & IPRULE_GOTO)
2263                 nla_put_u32(msg, FRA_GOTO, rule->gotoid);
2264
2265         return system_rtnl_call(msg);
2266 }
2267
/* Submit @rule through system_iprule() as an RTM_NEWRULE request. */
int system_add_iprule(struct iprule *rule)
{
	const int cmd = RTM_NEWRULE;

	return system_iprule(rule, cmd);
}
2272
/* Submit @rule through system_iprule() as an RTM_DELRULE request. */
int system_del_iprule(struct iprule *rule)
{
	const int cmd = RTM_DELRULE;

	return system_iprule(rule, cmd);
}
2277
2278 int system_flush_iprules(void)
2279 {
2280         int rv = 0;
2281         struct iprule rule;
2282
2283         system_if_clear_entries(NULL, RTM_GETRULE, AF_INET);
2284         system_if_clear_entries(NULL, RTM_GETRULE, AF_INET6);
2285
2286         memset(&rule, 0, sizeof(rule));
2287
2288
2289         rule.flags = IPRULE_INET4 | IPRULE_PRIORITY | IPRULE_LOOKUP;
2290
2291         rule.priority = 0;
2292         rule.lookup = RT_TABLE_LOCAL;
2293         rv |= system_iprule(&rule, RTM_NEWRULE);
2294
2295         rule.priority = 32766;
2296         rule.lookup = RT_TABLE_MAIN;
2297         rv |= system_iprule(&rule, RTM_NEWRULE);
2298
2299         rule.priority = 32767;
2300         rule.lookup = RT_TABLE_DEFAULT;
2301         rv |= system_iprule(&rule, RTM_NEWRULE);
2302
2303
2304         rule.flags = IPRULE_INET6 | IPRULE_PRIORITY | IPRULE_LOOKUP;
2305
2306         rule.priority = 0;
2307         rule.lookup = RT_TABLE_LOCAL;
2308         rv |= system_iprule(&rule, RTM_NEWRULE);
2309
2310         rule.priority = 32766;
2311         rule.lookup = RT_TABLE_MAIN;
2312         rv |= system_iprule(&rule, RTM_NEWRULE);
2313
2314         return rv;
2315 }
2316
/* Resolve the rule action @action into *@id by delegating to system_rtn_aton(). */
bool system_resolve_iprule_action(const char *action, unsigned int *id)
{
	bool resolved = system_rtn_aton(action, id);

	return resolved;
}
2321
/*
 * Return the current time in whole seconds.
 *
 * The monotonic clock is preferred; when it cannot be read the wall clock
 * from gettimeofday() is used instead, and 0 is returned when both fail.
 *
 * clock_gettime() is called through libc rather than as a raw syscall: a
 * raw __NR_clock_gettime call hands the kernel a struct timespec in the
 * layout libc uses, which does not match the kernel's layout for that
 * syscall number on 32-bit systems with a 64-bit time_t.
 */
time_t system_get_rtime(void)
{
	struct timespec ts;
	struct timeval tv;

	if (clock_gettime(CLOCK_MONOTONIC, &ts) == 0)
		return ts.tv_sec;

	if (gettimeofday(&tv, NULL) == 0)
		return tv.tv_sec;

	return 0;
}
2335
2336 #ifndef IP_DF
2337 #define IP_DF       0x4000
2338 #endif
2339
2340 static int tunnel_ioctl(const char *name, int cmd, void *p)
2341 {
2342         struct ifreq ifr;
2343
2344         memset(&ifr, 0, sizeof(ifr));
2345         strncpy(ifr.ifr_name, name, sizeof(ifr.ifr_name) - 1);
2346         ifr.ifr_ifru.ifru_data = p;
2347         return ioctl(sock_ioctl, cmd, &ifr);
2348 }
2349
2350 #ifdef IFLA_IPTUN_MAX
2351 static int system_add_ip6_tunnel(const char *name, const unsigned int link,
2352                                  struct blob_attr **tb)
2353 {
2354         struct nl_msg *nlm = nlmsg_alloc_simple(RTM_NEWLINK,
2355                                 NLM_F_REQUEST | NLM_F_REPLACE | NLM_F_CREATE);
2356         struct ifinfomsg ifi = { .ifi_family = AF_UNSPEC };
2357         struct blob_attr *cur;
2358         int ret = 0, ttl = 0;
2359
2360         if (!nlm)
2361                 return -1;
2362
2363         nlmsg_append(nlm, &ifi, sizeof(ifi), 0);
2364         nla_put_string(nlm, IFLA_IFNAME, name);
2365
2366         if (link)
2367                 nla_put_u32(nlm, IFLA_LINK, link);
2368
2369         struct nlattr *linkinfo = nla_nest_start(nlm, IFLA_LINKINFO);
2370         if (!linkinfo) {
2371                 ret = -ENOMEM;
2372                 goto failure;
2373         }
2374
2375         nla_put_string(nlm, IFLA_INFO_KIND, "ip6tnl");
2376         struct nlattr *infodata = nla_nest_start(nlm, IFLA_INFO_DATA);
2377         if (!infodata) {
2378                 ret = -ENOMEM;
2379                 goto failure;
2380         }
2381
2382         if (link)
2383                 nla_put_u32(nlm, IFLA_IPTUN_LINK, link);
2384
2385         if ((cur = tb[TUNNEL_ATTR_TTL]))
2386                 ttl = blobmsg_get_u32(cur);
2387
2388         nla_put_u8(nlm, IFLA_IPTUN_PROTO, IPPROTO_IPIP);
2389         nla_put_u8(nlm, IFLA_IPTUN_TTL, (ttl) ? ttl : 64);
2390
2391         struct in6_addr in6buf;
2392         if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2393                 if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2394                         ret = -EINVAL;
2395                         goto failure;
2396                 }
2397                 nla_put(nlm, IFLA_IPTUN_LOCAL, sizeof(in6buf), &in6buf);
2398         }
2399
2400         if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2401                 if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2402                         ret = -EINVAL;
2403                         goto failure;
2404                 }
2405                 nla_put(nlm, IFLA_IPTUN_REMOTE, sizeof(in6buf), &in6buf);
2406         }
2407
2408         if ((cur = tb[TUNNEL_ATTR_DATA])) {
2409                 struct blob_attr *tb_data[__IPIP6_DATA_ATTR_MAX];
2410                 uint32_t tun_flags = IP6_TNL_F_IGN_ENCAP_LIMIT;
2411
2412                 blobmsg_parse(ipip6_data_attr_list.params, __IPIP6_DATA_ATTR_MAX, tb_data,
2413                         blobmsg_data(cur), blobmsg_len(cur));
2414
2415                 if ((cur = tb_data[IPIP6_DATA_ENCAPLIMIT])) {
2416                         char *str = blobmsg_get_string(cur);
2417
2418                         if (strcmp(str, "ignore")) {
2419                                 char *e;
2420                                 unsigned encap_limit = strtoul(str, &e, 0);
2421
2422                                 if (e == str || *e || encap_limit > 255) {
2423                                         ret = -EINVAL;
2424                                         goto failure;
2425                                 }
2426
2427                                 nla_put_u8(nlm, IFLA_IPTUN_ENCAP_LIMIT, encap_limit);
2428                                 tun_flags &= ~IP6_TNL_F_IGN_ENCAP_LIMIT;
2429                         }
2430                 }
2431
2432 #ifdef IFLA_IPTUN_FMR_MAX
2433                 if ((cur = tb_data[IPIP6_DATA_FMRS])) {
2434                         struct blob_attr *rcur;
2435                         unsigned rrem, fmrcnt = 0;
2436                         struct nlattr *fmrs = nla_nest_start(nlm, IFLA_IPTUN_FMRS);
2437
2438                         if (!fmrs) {
2439                                 ret = -ENOMEM;
2440                                 goto failure;
2441                         }
2442
2443                         blobmsg_for_each_attr(rcur, cur, rrem) {
2444                                 struct blob_attr *tb_fmr[__FMR_DATA_ATTR_MAX], *tb_cur;
2445                                 struct in6_addr ip6prefix;
2446                                 struct in_addr ip4prefix;
2447                                 unsigned ip4len, ip6len, ealen, offset;
2448
2449                                 blobmsg_parse(fmr_data_attr_list.params, __FMR_DATA_ATTR_MAX, tb_fmr,
2450                                                 blobmsg_data(rcur), blobmsg_len(rcur));
2451
2452                                 if (!(tb_cur = tb_fmr[FMR_DATA_PREFIX6]) ||
2453                                                 !parse_ip_and_netmask(AF_INET6,
2454                                                         blobmsg_data(tb_cur), &ip6prefix,
2455                                                         &ip6len)) {
2456                                         ret = -EINVAL;
2457                                         goto failure;
2458                                 }
2459
2460                                 if (!(tb_cur = tb_fmr[FMR_DATA_PREFIX4]) ||
2461                                                 !parse_ip_and_netmask(AF_INET,
2462                                                         blobmsg_data(tb_cur), &ip4prefix,
2463                                                         &ip4len)) {
2464                                         ret = -EINVAL;
2465                                         goto failure;
2466                                 }
2467
2468                                 if (!(tb_cur = tb_fmr[FMR_DATA_EALEN])) {
2469                                         ret = -EINVAL;
2470                                         goto failure;
2471                                 }
2472                                 ealen = blobmsg_get_u32(tb_cur);
2473
2474                                 if (!(tb_cur = tb_fmr[FMR_DATA_OFFSET])) {
2475                                         ret = -EINVAL;
2476                                         goto failure;
2477                                 }
2478                                 offset = blobmsg_get_u32(tb_cur);
2479
2480                                 struct nlattr *rule = nla_nest_start(nlm, ++fmrcnt);
2481                                 if (!rule) {
2482                                         ret = -ENOMEM;
2483                                         goto failure;
2484                                 }
2485
2486                                 nla_put(nlm, IFLA_IPTUN_FMR_IP6_PREFIX, sizeof(ip6prefix), &ip6prefix);
2487                                 nla_put(nlm, IFLA_IPTUN_FMR_IP4_PREFIX, sizeof(ip4prefix), &ip4prefix);
2488                                 nla_put_u8(nlm, IFLA_IPTUN_FMR_IP6_PREFIX_LEN, ip6len);
2489                                 nla_put_u8(nlm, IFLA_IPTUN_FMR_IP4_PREFIX_LEN, ip4len);
2490                                 nla_put_u8(nlm, IFLA_IPTUN_FMR_EA_LEN, ealen);
2491                                 nla_put_u8(nlm, IFLA_IPTUN_FMR_OFFSET, offset);
2492
2493                                 nla_nest_end(nlm, rule);
2494                         }
2495
2496                         nla_nest_end(nlm, fmrs);
2497                 }
2498 #endif
2499                 if (tun_flags)
2500                         nla_put_u32(nlm, IFLA_IPTUN_FLAGS, tun_flags);
2501         }
2502
2503         nla_nest_end(nlm, infodata);
2504         nla_nest_end(nlm, linkinfo);
2505
2506         return system_rtnl_call(nlm);
2507
2508 failure:
2509         nlmsg_free(nlm);
2510         return ret;
2511 }
2512 #endif
2513
2514 #ifdef IFLA_IPTUN_MAX
2515 #define IP6_FLOWINFO_TCLASS     htonl(0x0FF00000)
2516 static int system_add_gre_tunnel(const char *name, const char *kind,
2517                                  const unsigned int link, struct blob_attr **tb, bool v6)
2518 {
2519         struct nl_msg *nlm;
2520         struct ifinfomsg ifi = { .ifi_family = AF_UNSPEC, };
2521         struct blob_attr *cur;
2522         uint32_t ikey = 0, okey = 0, flowinfo = 0, flags6 = IP6_TNL_F_IGN_ENCAP_LIMIT;
2523         uint16_t iflags = 0, oflags = 0;
2524         uint8_t tos = 0;
2525         int ret = 0, ttl = 0;
2526         unsigned encap_limit = 0;
2527
2528         nlm = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_REPLACE | NLM_F_CREATE);
2529         if (!nlm)
2530                 return -1;
2531
2532         nlmsg_append(nlm, &ifi, sizeof(ifi), 0);
2533         nla_put_string(nlm, IFLA_IFNAME, name);
2534
2535         struct nlattr *linkinfo = nla_nest_start(nlm, IFLA_LINKINFO);
2536         if (!linkinfo) {
2537                 ret = -ENOMEM;
2538                 goto failure;
2539         }
2540
2541         nla_put_string(nlm, IFLA_INFO_KIND, kind);
2542         struct nlattr *infodata = nla_nest_start(nlm, IFLA_INFO_DATA);
2543         if (!infodata) {
2544                 ret = -ENOMEM;
2545                 goto failure;
2546         }
2547
2548         if (link)
2549                 nla_put_u32(nlm, IFLA_GRE_LINK, link);
2550
2551         if ((cur = tb[TUNNEL_ATTR_TTL]))
2552                 ttl = blobmsg_get_u32(cur);
2553
2554         if ((cur = tb[TUNNEL_ATTR_TOS])) {
2555                 char *str = blobmsg_get_string(cur);
2556                 if (strcmp(str, "inherit")) {
2557                         unsigned uval;
2558
2559                         if (!system_tos_aton(str, &uval)) {
2560                                 ret = -EINVAL;
2561                                 goto failure;
2562                         }
2563
2564                         if (v6)
2565                                 flowinfo |= htonl(uval << 20) & IP6_FLOWINFO_TCLASS;
2566                         else
2567                                 tos = uval;
2568                 } else {
2569                         if (v6)
2570                                 flags6 |= IP6_TNL_F_USE_ORIG_TCLASS;
2571                         else
2572                                 tos = 1;
2573                 }
2574         }
2575
2576         if ((cur = tb[TUNNEL_ATTR_DATA])) {
2577                 struct blob_attr *tb_data[__GRE_DATA_ATTR_MAX];
2578
2579                 blobmsg_parse(gre_data_attr_list.params, __GRE_DATA_ATTR_MAX, tb_data,
2580                         blobmsg_data(cur), blobmsg_len(cur));
2581
2582                 if ((cur = tb_data[GRE_DATA_IKEY])) {
2583                         if ((ikey = blobmsg_get_u32(cur)))
2584                                 iflags |= GRE_KEY;
2585                 }
2586
2587                 if ((cur = tb_data[GRE_DATA_OKEY])) {
2588                         if ((okey = blobmsg_get_u32(cur)))
2589                                 oflags |= GRE_KEY;
2590                 }
2591
2592                 if ((cur = tb_data[GRE_DATA_ICSUM])) {
2593                         if (blobmsg_get_bool(cur))
2594                                 iflags |= GRE_CSUM;
2595                 }
2596
2597                 if ((cur = tb_data[GRE_DATA_OCSUM])) {
2598                         if (blobmsg_get_bool(cur))
2599                                 oflags |= GRE_CSUM;
2600                 }
2601
2602                 if ((cur = tb_data[GRE_DATA_ISEQNO])) {
2603                         if (blobmsg_get_bool(cur))
2604                                 iflags |= GRE_SEQ;
2605                 }
2606
2607                 if ((cur = tb_data[GRE_DATA_OSEQNO])) {
2608                         if (blobmsg_get_bool(cur))
2609                                 oflags |= GRE_SEQ;
2610                 }
2611
2612                 if ((cur = tb_data[GRE_DATA_ENCAPLIMIT])) {
2613                         char *str = blobmsg_get_string(cur);
2614
2615                         if (strcmp(str, "ignore")) {
2616                                 char *e;
2617
2618                                 encap_limit = strtoul(str, &e, 0);
2619
2620                                 if (e == str || *e || encap_limit > 255) {
2621                                         ret = -EINVAL;
2622                                         goto failure;
2623                                 }
2624
2625                                 flags6 &= ~IP6_TNL_F_IGN_ENCAP_LIMIT;
2626                         }
2627                 }
2628         }
2629
2630         if (v6) {
2631                 struct in6_addr in6buf;
2632                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2633                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2634                                 ret = -EINVAL;
2635                                 goto failure;
2636                         }
2637                         nla_put(nlm, IFLA_GRE_LOCAL, sizeof(in6buf), &in6buf);
2638                 }
2639
2640                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2641                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2642                                 ret = -EINVAL;
2643                                 goto failure;
2644                         }
2645                         nla_put(nlm, IFLA_GRE_REMOTE, sizeof(in6buf), &in6buf);
2646                 }
2647
2648                 if (!(flags6 & IP6_TNL_F_IGN_ENCAP_LIMIT))
2649                         nla_put_u8(nlm, IFLA_GRE_ENCAP_LIMIT, encap_limit);
2650
2651                 if (flowinfo)
2652                         nla_put_u32(nlm, IFLA_GRE_FLOWINFO, flowinfo);
2653
2654                 if (flags6)
2655                         nla_put_u32(nlm, IFLA_GRE_FLAGS, flags6);
2656
2657                 if (!ttl)
2658                         ttl = 64;
2659         } else {
2660                 struct in_addr inbuf;
2661                 bool set_df = true;
2662
2663                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2664                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2665                                 ret = -EINVAL;
2666                                 goto failure;
2667                         }
2668                         nla_put(nlm, IFLA_GRE_LOCAL, sizeof(inbuf), &inbuf);
2669                 }
2670
2671                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2672                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2673                                 ret = -EINVAL;
2674                                 goto failure;
2675                         }
2676                         nla_put(nlm, IFLA_GRE_REMOTE, sizeof(inbuf), &inbuf);
2677
2678                         if (IN_MULTICAST(ntohl(inbuf.s_addr))) {
2679                                 if (!okey) {
2680                                         okey = inbuf.s_addr;
2681                                         oflags |= GRE_KEY;
2682                                 }
2683
2684                                 if (!ikey) {
2685                                         ikey = inbuf.s_addr;
2686                                         iflags |= GRE_KEY;
2687                                 }
2688                         }
2689                 }
2690
2691                 if ((cur = tb[TUNNEL_ATTR_DF]))
2692                         set_df = blobmsg_get_bool(cur);
2693
2694                 if (!set_df) {
2695                         /* ttl != 0 and nopmtudisc are incompatible */
2696                         if (ttl) {
2697                                 ret = -EINVAL;
2698                                 goto failure;
2699                         }
2700                 } else if (!ttl)
2701                         ttl = 64;
2702
2703                 nla_put_u8(nlm, IFLA_GRE_PMTUDISC, set_df ? 1 : 0);
2704
2705                 nla_put_u8(nlm, IFLA_GRE_TOS, tos);
2706         }
2707
2708         if (ttl)
2709                 nla_put_u8(nlm, IFLA_GRE_TTL, ttl);
2710
2711         if (oflags)
2712                 nla_put_u16(nlm, IFLA_GRE_OFLAGS, oflags);
2713
2714         if (iflags)
2715                 nla_put_u16(nlm, IFLA_GRE_IFLAGS, iflags);
2716
2717         if (okey)
2718                 nla_put_u32(nlm, IFLA_GRE_OKEY, htonl(okey));
2719
2720         if (ikey)
2721                 nla_put_u32(nlm, IFLA_GRE_IKEY, htonl(ikey));
2722
2723         nla_nest_end(nlm, infodata);
2724         nla_nest_end(nlm, linkinfo);
2725
2726         return system_rtnl_call(nlm);
2727
2728 failure:
2729         nlmsg_free(nlm);
2730         return ret;
2731 }
2732 #endif
2733
2734 #ifdef IFLA_VTI_MAX
2735 static int system_add_vti_tunnel(const char *name, const char *kind,
2736                                  const unsigned int link, struct blob_attr **tb, bool v6)
2737 {
2738         struct nl_msg *nlm;
2739         struct ifinfomsg ifi = { .ifi_family = AF_UNSPEC, };
2740         struct blob_attr *cur;
2741         int ret = 0;
2742
2743         nlm = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_REPLACE | NLM_F_CREATE);
2744         if (!nlm)
2745                 return -1;
2746
2747         nlmsg_append(nlm, &ifi, sizeof(ifi), 0);
2748         nla_put_string(nlm, IFLA_IFNAME, name);
2749
2750         struct nlattr *linkinfo = nla_nest_start(nlm, IFLA_LINKINFO);
2751         if (!linkinfo) {
2752                 ret = -ENOMEM;
2753                 goto failure;
2754         }
2755
2756         nla_put_string(nlm, IFLA_INFO_KIND, kind);
2757         struct nlattr *infodata = nla_nest_start(nlm, IFLA_INFO_DATA);
2758         if (!infodata) {
2759                 ret = -ENOMEM;
2760                 goto failure;
2761         }
2762
2763         if (link)
2764                 nla_put_u32(nlm, IFLA_VTI_LINK, link);
2765
2766         if (v6) {
2767                 struct in6_addr in6buf;
2768                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2769                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2770                                 ret = -EINVAL;
2771                                 goto failure;
2772                         }
2773                         nla_put(nlm, IFLA_VTI_LOCAL, sizeof(in6buf), &in6buf);
2774                 }
2775
2776                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2777                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2778                                 ret = -EINVAL;
2779                                 goto failure;
2780                         }
2781                         nla_put(nlm, IFLA_VTI_REMOTE, sizeof(in6buf), &in6buf);
2782                 }
2783
2784         } else {
2785                 struct in_addr inbuf;
2786
2787                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2788                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2789                                 ret = -EINVAL;
2790                                 goto failure;
2791                         }
2792                         nla_put(nlm, IFLA_VTI_LOCAL, sizeof(inbuf), &inbuf);
2793                 }
2794
2795                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2796                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2797                                 ret = -EINVAL;
2798                                 goto failure;
2799                         }
2800                         nla_put(nlm, IFLA_VTI_REMOTE, sizeof(inbuf), &inbuf);
2801                 }
2802
2803         }
2804
2805         if ((cur = tb[TUNNEL_ATTR_DATA])) {
2806                 struct blob_attr *tb_data[__VTI_DATA_ATTR_MAX];
2807                 uint32_t ikey = 0, okey = 0;
2808
2809                 blobmsg_parse(vti_data_attr_list.params, __VTI_DATA_ATTR_MAX, tb_data,
2810                         blobmsg_data(cur), blobmsg_len(cur));
2811
2812                 if ((cur = tb_data[VTI_DATA_IKEY])) {
2813                         if ((ikey = blobmsg_get_u32(cur)))
2814                                 nla_put_u32(nlm, IFLA_VTI_IKEY, htonl(ikey));
2815                 }
2816
2817                 if ((cur = tb_data[VTI_DATA_OKEY])) {
2818                         if ((okey = blobmsg_get_u32(cur)))
2819                                 nla_put_u32(nlm, IFLA_VTI_OKEY, htonl(okey));
2820                 }
2821         }
2822
2823         nla_nest_end(nlm, infodata);
2824         nla_nest_end(nlm, linkinfo);
2825
2826         return system_rtnl_call(nlm);
2827
2828 failure:
2829         nlmsg_free(nlm);
2830         return ret;
2831 }
2832 #endif
2833
2834 #ifdef IFLA_VXLAN_MAX
2835 static int system_add_vxlan(const char *name, const unsigned int link, struct blob_attr **tb, bool v6)
2836 {
2837         struct blob_attr *tb_data[__VXLAN_DATA_ATTR_MAX];
2838         struct nl_msg *msg;
2839         struct nlattr *linkinfo, *data;
2840         struct ifinfomsg iim = { .ifi_family = AF_UNSPEC, };
2841         struct blob_attr *cur;
2842         int ret = 0;
2843
2844         if ((cur = tb[TUNNEL_ATTR_DATA]))
2845                 blobmsg_parse(vxlan_data_attr_list.params, __VXLAN_DATA_ATTR_MAX, tb_data,
2846                         blobmsg_data(cur), blobmsg_len(cur));
2847         else
2848                 return -EINVAL;
2849
2850         msg = nlmsg_alloc_simple(RTM_NEWLINK, NLM_F_REQUEST | NLM_F_CREATE | NLM_F_EXCL);
2851
2852         if (!msg)
2853                 return -1;
2854
2855         nlmsg_append(msg, &iim, sizeof(iim), 0);
2856
2857         nla_put_string(msg, IFLA_IFNAME, name);
2858
2859         if ((cur = tb_data[VXLAN_DATA_ATTR_MACADDR])) {
2860                 struct ether_addr *ea = ether_aton(blobmsg_get_string(cur));
2861                 if (!ea) {
2862                         ret = -EINVAL;
2863                         goto failure;
2864                 }
2865
2866                 nla_put(msg, IFLA_ADDRESS, ETH_ALEN, ea);
2867         }
2868
2869         if ((cur = tb[TUNNEL_ATTR_MTU])) {
2870                 uint32_t mtu = blobmsg_get_u32(cur);
2871                 nla_put_u32(msg, IFLA_MTU, mtu);
2872         }
2873
2874         if (!(linkinfo = nla_nest_start(msg, IFLA_LINKINFO))) {
2875                 ret = -ENOMEM;
2876                 goto failure;
2877         }
2878
2879         nla_put_string(msg, IFLA_INFO_KIND, "vxlan");
2880
2881         if (!(data = nla_nest_start(msg, IFLA_INFO_DATA))) {
2882                 ret = -ENOMEM;
2883                 goto failure;
2884         }
2885
2886         if (link)
2887                 nla_put_u32(msg, IFLA_VXLAN_LINK, link);
2888
2889         if ((cur = tb_data[VXLAN_DATA_ATTR_ID])) {
2890                 uint32_t id = blobmsg_get_u32(cur);
2891                 if (id >= (1u << 24) - 1) {
2892                         ret = -EINVAL;
2893                         goto failure;
2894                 }
2895
2896                 nla_put_u32(msg, IFLA_VXLAN_ID, id);
2897         }
2898
2899         if (v6) {
2900                 struct in6_addr in6buf;
2901                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2902                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2903                                 ret = -EINVAL;
2904                                 goto failure;
2905                         }
2906                         nla_put(msg, IFLA_VXLAN_LOCAL6, sizeof(in6buf), &in6buf);
2907                 }
2908
2909                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2910                         if (inet_pton(AF_INET6, blobmsg_data(cur), &in6buf) < 1) {
2911                                 ret = -EINVAL;
2912                                 goto failure;
2913                         }
2914                         nla_put(msg, IFLA_VXLAN_GROUP6, sizeof(in6buf), &in6buf);
2915                 }
2916         } else {
2917                 struct in_addr inbuf;
2918
2919                 if ((cur = tb[TUNNEL_ATTR_LOCAL])) {
2920                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2921                                 ret = -EINVAL;
2922                                 goto failure;
2923                         }
2924                         nla_put(msg, IFLA_VXLAN_LOCAL, sizeof(inbuf), &inbuf);
2925                 }
2926
2927                 if ((cur = tb[TUNNEL_ATTR_REMOTE])) {
2928                         if (inet_pton(AF_INET, blobmsg_data(cur), &inbuf) < 1) {
2929                                 ret = -EINVAL;
2930                                 goto failure;
2931                         }
2932                         nla_put(msg, IFLA_VXLAN_GROUP, sizeof(inbuf), &inbuf);
2933                 }
2934         }
2935
2936         uint32_t port = 4789;
2937         if ((cur = tb_data[VXLAN_DATA_ATTR_PORT])) {
2938                 port = blobmsg_get_u32(cur);
2939                 if (port < 1 || port > 65535) {
2940                         ret = -EINVAL;
2941                         goto failure;
2942                 }
2943         }
2944         nla_put_u16(msg, IFLA_VXLAN_PORT, htons(port));
2945
2946         if ((cur = tb_data[VXLAN_DATA_ATTR_RXCSUM])) {
2947                 bool rxcsum = blobmsg_get_bool(cur);
2948                 nla_put_u8(msg, IFLA_VXLAN_UDP_ZERO_CSUM6_RX, !rxcsum);
2949         }
2950
2951         if ((cur = tb_data[VXLAN_DATA_ATTR_TXCSUM])) {
2952                 bool txcsum = blobmsg_get_bool(cur);
2953                 nla_put_u8(msg, IFLA_VXLAN_UDP_CSUM, txcsum);
2954                 nla_put_u8(msg, IFLA_VXLAN_UDP_ZERO_CSUM6_TX, !txcsum);
2955         }
2956
2957         if ((cur = tb[TUNNEL_ATTR_TOS])) {
2958                 char *str = blobmsg_get_string(cur);
2959                 unsigned tos = 1;
2960
2961                 if (strcmp(str, "inherit")) {
2962                         if (!system_tos_aton(str, &tos)) {
2963                                 ret = -EINVAL;
2964                                 goto failure;
2965                         }
2966                 }
2967
2968                 nla_put_u8(msg, IFLA_VXLAN_TOS, tos);
2969         }
2970
2971         if ((cur = tb[TUNNEL_ATTR_TTL])) {
2972                 uint32_t ttl = blobmsg_get_u32(cur);
2973                 if (ttl < 1 || ttl > 255) {
2974                         ret = -EINVAL;
2975                         goto failure;
2976                 }
2977
2978                 nla_put_u8(msg, IFLA_VXLAN_TTL, ttl);
2979         }
2980
2981         nla_nest_end(msg, data);
2982         nla_nest_end(msg, linkinfo);
2983
2984         ret = system_rtnl_call(msg);
2985         if (ret)
2986                 D(SYSTEM, "Error adding vxlan '%s': %d\n", name, ret);
2987
2988         return ret;
2989
2990 failure:
2991         nlmsg_free(msg);
2992         return ret;
2993 }
2994 #endif
2995
/*
 * Create a SIT (IPv6-in-IPv4) tunnel and, when SIOCADD6RD is available
 * and a data attribute is present, configure its 6rd parameters.
 *
 * @name: interface name of the tunnel device
 * @link: ifindex of the underlying device, 0 if none
 * @tb:   parsed tunnel attributes (indexed by TUNNEL_ATTR_*)
 *
 * Returns 0 on success, -1 if the tunnel cannot be created or the 6rd
 * ioctl fails, and -EINVAL if a 6rd prefix is malformed. When the 6rd
 * setup fails the tunnel that was just created is deleted again.
 */
static int system_add_sit_tunnel(const char *name, const unsigned int link, struct blob_attr **tb)
{
	if (system_add_proto_tunnel(name, IPPROTO_IPV6, link, tb) < 0)
		return -1;

#ifdef SIOCADD6RD
	struct blob_attr *data = tb[TUNNEL_ATTR_DATA];

	if (data) {
		struct blob_attr *opts[__SIXRD_DATA_ATTR_MAX];
		struct blob_attr *opt;
		struct ip_tunnel_6rd sixrd;
		unsigned int bits;
		int err = 0;

		blobmsg_parse(sixrd_data_attr_list.params, __SIXRD_DATA_ATTR_MAX, opts,
			blobmsg_data(data), blobmsg_len(data));

		memset(&sixrd, 0, sizeof(sixrd));

		/* 6rd IPv6 prefix: at most 128 bits */
		opt = opts[SIXRD_DATA_PREFIX];
		if (opt) {
			if (parse_ip_and_netmask(AF_INET6, blobmsg_data(opt),
						&sixrd.prefix, &bits) && bits <= 128)
				sixrd.prefixlen = bits;
			else
				err = -EINVAL;
		}

		/* IPv4 relay prefix: at most 32 bits */
		opt = opts[SIXRD_DATA_RELAY_PREFIX];
		if (!err && opt) {
			if (parse_ip_and_netmask(AF_INET, blobmsg_data(opt),
						&sixrd.relay_prefix, &bits) && bits <= 32)
				sixrd.relay_prefixlen = bits;
			else
				err = -EINVAL;
		}

		if (!err && tunnel_ioctl(name, SIOCADD6RD, &sixrd) < 0)
			err = -1;

		if (err) {
			/* Roll back the tunnel created above */
			__system_del_ip_tunnel(name, tb);
			return err;
		}
	}
#endif

	return 0;
}
3048
3049 static int system_add_proto_tunnel(const char *name, const uint8_t proto, const unsigned int link, struct blob_attr **tb)
3050 {
3051         struct blob_attr *cur;
3052         bool set_df = true;
3053         struct ip_tunnel_parm p  = {
3054                 .link = link,
3055                 .iph = {
3056                         .version = 4,
3057                         .ihl = 5,
3058                         .protocol = proto,
3059                 }
3060         };
3061
3062         if ((cur = tb[TUNNEL_ATTR_LOCAL]) &&
3063                         inet_pton(AF_INET, blobmsg_data(cur), &p.iph.saddr) < 1)
3064                 return -EINVAL;
3065
3066         if ((cur = tb[TUNNEL_ATTR_REMOTE]) &&
3067                         inet_pton(AF_INET, blobmsg_data(cur), &p.iph.daddr) < 1)
3068                 return -EINVAL;
3069
3070         if ((cur = tb[TUNNEL_ATTR_DF]))
3071                 set_df = blobmsg_get_bool(cur);
3072
3073         if ((cur = tb[TUNNEL_ATTR_TTL]))
3074                 p.iph.ttl = blobmsg_get_u32(cur);
3075
3076         if ((cur = tb[TUNNEL_ATTR_TOS])) {
3077                 char *str = blobmsg_get_string(cur);
3078                 if (strcmp(str, "inherit")) {
3079                         unsigned uval;
3080
3081                         if (!system_tos_aton(str, &uval))
3082                                 return -EINVAL;
3083
3084                         p.iph.tos = uval;
3085                 } else
3086                         p.iph.tos = 1;
3087         }
3088
3089         p.iph.frag_off = set_df ? htons(IP_DF) : 0;
3090         /* ttl !=0 and nopmtudisc are incompatible */
3091         if (p.iph.ttl && p.iph.frag_off == 0)
3092                 return -EINVAL;
3093
3094         strncpy(p.name, name, sizeof(p.name) - 1);
3095
3096         switch (p.iph.protocol) {
3097         case IPPROTO_IPIP:
3098                 return tunnel_ioctl("tunl0", SIOCADDTUNNEL, &p);
3099         case IPPROTO_IPV6:
3100                 return tunnel_ioctl("sit0", SIOCADDTUNNEL, &p);
3101         default:
3102                 break;
3103         }
3104         return -1;
3105 }
3106
3107 static int __system_del_ip_tunnel(const char *name, struct blob_attr **tb)
3108 {
3109         struct blob_attr *cur;
3110         const char *str;
3111
3112         if (!(cur = tb[TUNNEL_ATTR_TYPE]))
3113                 return -EINVAL;
3114         str = blobmsg_data(cur);
3115
3116         if (!strcmp(str, "greip") || !strcmp(str, "gretapip") ||
3117             !strcmp(str, "greip6") || !strcmp(str, "gretapip6") ||
3118             !strcmp(str, "vtiip") || !strcmp(str, "vtiip6") ||
3119             !strcmp(str, "vxlan") || !strcmp(str, "vxlan6"))
3120                 return system_link_del(name);
3121         else
3122                 return tunnel_ioctl(name, SIOCDELTUNNEL, NULL);
3123 }
3124
3125 int system_del_ip_tunnel(const char *name, struct blob_attr *attr)
3126 {
3127         struct blob_attr *tb[__TUNNEL_ATTR_MAX];
3128
3129         blobmsg_parse(tunnel_attr_list.params, __TUNNEL_ATTR_MAX, tb,
3130                 blob_data(attr), blob_len(attr));
3131
3132         return __system_del_ip_tunnel(name, tb);
3133 }
3134
3135 int system_update_ipv6_mtu(struct device *dev, int mtu)
3136 {
3137         int ret = -1;
3138         char buf[64];
3139         int fd;
3140
3141         snprintf(buf, sizeof(buf), "/proc/sys/net/ipv6/conf/%s/mtu",
3142                         dev->ifname);
3143
3144         fd = open(buf, O_RDWR);
3145         if (fd < 0)
3146                 return ret;
3147
3148         if (!mtu) {
3149                 ssize_t len = read(fd, buf, sizeof(buf) - 1);
3150                 if (len < 0)
3151                         goto out;
3152
3153                 buf[len] = 0;
3154                 ret = atoi(buf);
3155         } else {
3156                 if (write(fd, buf, snprintf(buf, sizeof(buf), "%i", mtu)) > 0)
3157                         ret = mtu;
3158         }
3159
3160 out:
3161         close(fd);
3162         return ret;
3163 }
3164
3165 int system_add_ip_tunnel(const char *name, struct blob_attr *attr)
3166 {
3167         struct blob_attr *tb[__TUNNEL_ATTR_MAX];
3168         struct blob_attr *cur;
3169         const char *str;
3170
3171         blobmsg_parse(tunnel_attr_list.params, __TUNNEL_ATTR_MAX, tb,
3172                 blob_data(attr), blob_len(attr));
3173
3174         __system_del_ip_tunnel(name, tb);
3175
3176         if (!(cur = tb[TUNNEL_ATTR_TYPE]))
3177                 return -EINVAL;
3178         str = blobmsg_data(cur);
3179
3180         unsigned int ttl = 0;
3181         if ((cur = tb[TUNNEL_ATTR_TTL])) {
3182                 ttl = blobmsg_get_u32(cur);
3183                 if (ttl > 255)
3184                         return -EINVAL;
3185         }
3186
3187         unsigned int link = 0;
3188         if ((cur = tb[TUNNEL_ATTR_LINK])) {
3189                 struct interface *iface = vlist_find(&interfaces, blobmsg_data(cur), iface, node);
3190                 if (!iface)
3191                         return -EINVAL;
3192
3193                 if (iface->l3_dev.dev)
3194                         link = iface->l3_dev.dev->ifindex;
3195         }
3196
3197         if (!strcmp(str, "sit"))
3198                 return system_add_sit_tunnel(name, link, tb);
3199 #ifdef IFLA_IPTUN_MAX
3200         else if (!strcmp(str, "ipip6")) {
3201                 return system_add_ip6_tunnel(name, link, tb);
3202         } else if (!strcmp(str, "greip")) {
3203                 return system_add_gre_tunnel(name, "gre", link, tb, false);
3204         } else if (!strcmp(str, "gretapip"))  {
3205                 return system_add_gre_tunnel(name, "gretap", link, tb, false);
3206         } else if (!strcmp(str, "greip6")) {
3207                 return system_add_gre_tunnel(name, "ip6gre", link, tb, true);
3208         } else if (!strcmp(str, "gretapip6")) {
3209                 return system_add_gre_tunnel(name, "ip6gretap", link, tb, true);
3210 #ifdef IFLA_VTI_MAX
3211         } else if (!strcmp(str, "vtiip")) {
3212                 return system_add_vti_tunnel(name, "vti", link, tb, false);
3213         } else if (!strcmp(str, "vtiip6")) {
3214                 return system_add_vti_tunnel(name, "vti6", link, tb, true);
3215 #endif
3216 #ifdef IFLA_VXLAN_MAX
3217         } else if(!strcmp(str, "vxlan")) {
3218                 return system_add_vxlan(name, link, tb, false);
3219         } else if(!strcmp(str, "vxlan6")) {
3220                 return system_add_vxlan(name, link, tb, true);
3221 #endif
3222 #endif
3223         } else if (!strcmp(str, "ipip")) {
3224                 return system_add_proto_tunnel(name, IPPROTO_IPIP, link, tb);
3225         }
3226         else
3227                 return -EINVAL;
3228
3229         return 0;
3230 }