Add support for ip rules
[project/netifd.git] / system-linux.c
1 /*
2 * netifd - network interface daemon
3 * Copyright (C) 2012 Felix Fietkau <nbd@openwrt.org>
4 * Copyright (C) 2013 Jo-Philipp Wich <jow@openwrt.org>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2
8 * as published by the Free Software Foundation
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 */
15 #define _GNU_SOURCE
16
17 #include <sys/socket.h>
18 #include <sys/ioctl.h>
19 #include <sys/stat.h>
20 #include <sys/syscall.h>
21
22 #include <net/if.h>
23 #include <net/if_arp.h>
24
25 #include <arpa/inet.h>
26 #include <netinet/in.h>
27
28 #include <linux/rtnetlink.h>
29 #include <linux/sockios.h>
30 #include <linux/ip.h>
31 #include <linux/if_vlan.h>
32 #include <linux/if_bridge.h>
33 #include <linux/if_tunnel.h>
34 #include <linux/ethtool.h>
35 #include <linux/fib_rules.h>
36
37 #include <unistd.h>
38 #include <string.h>
39 #include <fcntl.h>
40 #include <glob.h>
41 #include <time.h>
42
43 #include <netlink/msg.h>
44 #include <netlink/attr.h>
45 #include <netlink/socket.h>
46 #include <libubox/uloop.h>
47
48 #include "netifd.h"
49 #include "device.h"
50 #include "system.h"
51
52 struct event_socket {
53 struct uloop_fd uloop;
54 struct nl_sock *sock;
55 struct nl_cb *cb;
56 };
57
/* Event handlers that system_init() wires up before they are defined. */
static void handle_hotplug_event(struct uloop_fd *u, unsigned int events);
static int cb_rtnl_event(struct nl_msg *msg, void *arg);

/* Socket used for interface ioctl() requests; -1 until system_init() ran. */
static int sock_ioctl = -1;

/* rtnetlink socket used for synchronous requests. */
static struct nl_sock *sock_rtnl = NULL;

/* Shared scratch buffer for building sysfs/procfs paths. */
static char dev_buf[256];
65
66 static void
67 handler_nl_event(struct uloop_fd *u, unsigned int events)
68 {
69 struct event_socket *ev = container_of(u, struct event_socket, uloop);
70 nl_recvmsgs(ev->sock, ev->cb);
71 }
72
/*
 * Allocate a netlink socket and connect it to the given protocol.
 *
 * @protocol: netlink protocol passed to nl_connect()
 * @groups: multicast group mask joined before connecting; 0 joins nothing
 *
 * Returns the connected socket, or NULL if allocation or connecting failed.
 */
static struct nl_sock *
create_socket(int protocol, int groups)
{
	struct nl_sock *sock;

	sock = nl_socket_alloc();
	if (!sock)
		return NULL;

	if (groups)
		nl_join_groups(sock, groups);

	if (nl_connect(sock, protocol)) {
		/* the socket is useless now; release it instead of leaking it */
		nl_socket_free(sock);
		return NULL;
	}

	return sock;
}
90
91 static bool
92 create_raw_event_socket(struct event_socket *ev, int protocol, int groups,
93 uloop_fd_handler cb)
94 {
95 ev->sock = create_socket(protocol, groups);
96 if (!ev->sock)
97 return false;
98
99 ev->uloop.fd = nl_socket_get_fd(ev->sock);
100 ev->uloop.cb = cb;
101 uloop_fd_add(&ev->uloop, ULOOP_READ | ULOOP_EDGE_TRIGGER);
102 return true;
103 }
104
105 static bool
106 create_event_socket(struct event_socket *ev, int protocol,
107 int (*cb)(struct nl_msg *msg, void *arg))
108 {
109 // Prepare socket for link events
110 ev->cb = nl_cb_alloc(NL_CB_DEFAULT);
111 if (!ev->cb)
112 return false;
113
114 nl_cb_set(ev->cb, NL_CB_VALID, NL_CB_CUSTOM, cb, NULL);
115
116 return create_raw_event_socket(ev, protocol, 0, handler_nl_event);
117 }
118
119 int system_init(void)
120 {
121 static struct event_socket rtnl_event;
122 static struct event_socket hotplug_event;
123
124 sock_ioctl = socket(AF_LOCAL, SOCK_DGRAM, 0);
125 fcntl(sock_ioctl, F_SETFD, fcntl(sock_ioctl, F_GETFD) | FD_CLOEXEC);
126
127 // Prepare socket for routing / address control
128 sock_rtnl = create_socket(NETLINK_ROUTE, 0);
129 if (!sock_rtnl)
130 return -1;
131
132 if (!create_event_socket(&rtnl_event, NETLINK_ROUTE, cb_rtnl_event))
133 return -1;
134
135 if (!create_raw_event_socket(&hotplug_event, NETLINK_KOBJECT_UEVENT, 1,
136 handle_hotplug_event))
137 return -1;
138
139 // Receive network link events form kernel
140 nl_socket_add_membership(rtnl_event.sock, RTNLGRP_LINK);
141
142 return 0;
143 }
144
/*
 * Write the string @val to the file at @path.
 * Best effort: nothing happens if the file cannot be opened, and the result
 * of the write is not reported.
 */
static void system_set_sysctl(const char *path, const char *val)
{
	int fd = open(path, O_WRONLY);

	if (fd >= 0) {
		write(fd, val, strlen(val));
		close(fd);
	}
}
156
157 static void system_set_dev_sysctl(const char *path, const char *device, const char *val)
158 {
159 snprintf(dev_buf, sizeof(dev_buf), path, device);
160 system_set_sysctl(dev_buf, val);
161 }
162
163 static void system_set_disable_ipv6(struct device *dev, const char *val)
164 {
165 system_set_dev_sysctl("/proc/sys/net/ipv6/conf/%s/disable_ipv6", dev->ifname, val);
166 }
167
168 // Evaluate netlink messages
169 static int cb_rtnl_event(struct nl_msg *msg, void *arg)
170 {
171 struct nlmsghdr *nh = nlmsg_hdr(msg);
172 struct ifinfomsg *ifi = NLMSG_DATA(nh);
173 struct nlattr *nla[__IFLA_MAX];
174
175 if (nh->nlmsg_type != RTM_DELLINK && nh->nlmsg_type != RTM_NEWLINK)
176 goto out;
177
178 nlmsg_parse(nh, sizeof(*ifi), nla, __IFLA_MAX - 1, NULL);
179 if (!nla[IFLA_IFNAME])
180 goto out;
181
182 struct device *dev = device_get(RTA_DATA(nla[IFLA_IFNAME]), false);
183 if (!dev)
184 goto out;
185
186 dev->ifindex = ifi->ifi_index;
187 /* TODO: parse link status */
188
189 out:
190 return 0;
191 }
192
193 static void
194 handle_hotplug_msg(char *data, int size)
195 {
196 const char *subsystem = NULL, *interface = NULL;
197 char *cur, *end, *sep;
198 struct device *dev;
199 int skip;
200 bool add;
201
202 if (!strncmp(data, "add@", 4))
203 add = true;
204 else if (!strncmp(data, "remove@", 7))
205 add = false;
206 else
207 return;
208
209 skip = strlen(data) + 1;
210 end = data + size;
211
212 for (cur = data + skip; cur < end; cur += skip) {
213 skip = strlen(cur) + 1;
214
215 sep = strchr(cur, '=');
216 if (!sep)
217 continue;
218
219 *sep = 0;
220 if (!strcmp(cur, "INTERFACE"))
221 interface = sep + 1;
222 else if (!strcmp(cur, "SUBSYSTEM")) {
223 subsystem = sep + 1;
224 if (strcmp(subsystem, "net") != 0)
225 return;
226 }
227 if (subsystem && interface)
228 goto found;
229 }
230 return;
231
232 found:
233 dev = device_get(interface, false);
234 if (!dev)
235 return;
236
237 if (dev->type != &simple_device_type)
238 return;
239
240 if (add && system_if_force_external(dev->ifname))
241 return;
242
243 device_set_present(dev, add);
244 }
245
246 static void
247 handle_hotplug_event(struct uloop_fd *u, unsigned int events)
248 {
249 struct event_socket *ev = container_of(u, struct event_socket, uloop);
250 struct sockaddr_nl nla;
251 unsigned char *buf = NULL;
252 int size;
253
254 while ((size = nl_recv(ev->sock, &nla, &buf, NULL)) > 0) {
255 if (nla.nl_pid == 0)
256 handle_hotplug_msg((char *) buf, size);
257
258 free(buf);
259 }
260 }
261
262 static int system_rtnl_call(struct nl_msg *msg)
263 {
264 int ret;
265
266 ret = nl_send_auto_complete(sock_rtnl, msg);
267 nlmsg_free(msg);
268
269 if (ret < 0)
270 return ret;
271
272 return nl_wait_for_ack(sock_rtnl);
273 }
274
275 int system_bridge_delbr(struct device *bridge)
276 {
277 return ioctl(sock_ioctl, SIOCBRDELBR, bridge->ifname);
278 }
279
280 static int system_bridge_if(const char *bridge, struct device *dev, int cmd, void *data)
281 {
282 struct ifreq ifr;
283
284 memset(&ifr, 0, sizeof(ifr));
285 if (dev)
286 ifr.ifr_ifindex = dev->ifindex;
287 else
288 ifr.ifr_data = data;
289 strncpy(ifr.ifr_name, bridge, sizeof(ifr.ifr_name));
290 return ioctl(sock_ioctl, cmd, &ifr);
291 }
292
/*
 * Check whether /sys/devices/virtual/net/<name>/bridge exists.
 *
 * @buf, @buflen: scratch buffer the sysfs path is built in
 *
 * Returns true if stat() on that path succeeds.
 */
static bool system_is_bridge(const char *name, char *buf, int buflen)
{
	struct stat info;

	snprintf(buf, buflen, "/sys/devices/virtual/net/%s/bridge", name);

	return stat(buf, &info) >= 0;
}
303
/*
 * Find the bridge that the port @name is currently attached to.
 *
 * Globs for /sys/devices/virtual/net/<any>/brif/<name>/bridge, reads the
 * symlink found there and takes the last path component of its target.
 *
 * @buf, @buflen: scratch buffer; on success the result points into it
 *
 * Returns the bridge name, or NULL if no match was found or the link could
 * not be read.
 */
static char *system_get_bridge(const char *name, char *buf, int buflen)
{
	char *path = NULL;
	ssize_t len;
	glob_t gl;

	if (buflen <= 0)
		return NULL;

	snprintf(buf, buflen, "/sys/devices/virtual/net/*/brif/%s/bridge", name);

	memset(&gl, 0, sizeof(gl));

	/* glob() reports failures as non-zero (positive) codes, never negative */
	if (glob(buf, GLOB_NOSORT, NULL, &gl) != 0 || gl.gl_pathc == 0)
		goto out;

	/* readlink() does not terminate; reserve one byte for the terminator */
	len = readlink(gl.gl_pathv[0], buf, buflen - 1);
	if (len < 0)
		goto out;

	buf[len] = 0;
	path = strrchr(buf, '/');
	if (path)
		path++;

out:
	/* release the path list on every exit path */
	globfree(&gl);
	return path;
}
328
329 int system_bridge_addif(struct device *bridge, struct device *dev)
330 {
331 char *oldbr;
332
333 system_set_disable_ipv6(dev, "1");
334 oldbr = system_get_bridge(dev->ifname, dev_buf, sizeof(dev_buf));
335 if (oldbr && !strcmp(oldbr, bridge->ifname))
336 return 0;
337
338 return system_bridge_if(bridge->ifname, dev, SIOCBRADDIF, NULL);
339 }
340
341 int system_bridge_delif(struct device *bridge, struct device *dev)
342 {
343 system_set_disable_ipv6(dev, "0");
344 return system_bridge_if(bridge->ifname, dev, SIOCBRDELIF, NULL);
345 }
346
347 static int system_if_resolve(struct device *dev)
348 {
349 struct ifreq ifr;
350 strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name));
351 if (!ioctl(sock_ioctl, SIOCGIFINDEX, &ifr))
352 return ifr.ifr_ifindex;
353 else
354 return 0;
355 }
356
357 static int system_if_flags(const char *ifname, unsigned add, unsigned rem)
358 {
359 struct ifreq ifr;
360
361 memset(&ifr, 0, sizeof(ifr));
362 strncpy(ifr.ifr_name, ifname, sizeof(ifr.ifr_name));
363 ioctl(sock_ioctl, SIOCGIFFLAGS, &ifr);
364 ifr.ifr_flags |= add;
365 ifr.ifr_flags &= ~rem;
366 return ioctl(sock_ioctl, SIOCSIFFLAGS, &ifr);
367 }
368
/*
 * State shared between system_if_clear_entries() and cb_clear_event() while
 * a dump is being turned into delete requests.
 */
struct clear_data {
	/* message buffer the delete requests are built in */
	struct nl_msg *msg;
	/* device whose entries are removed; NULL when flushing rules */
	struct device *dev;
	/* dump request type: RTM_GETADDR, RTM_GETROUTE or RTM_GETRULE */
	int type;
	/* number of header bytes appended to the dump request */
	int size;
	/* address family of the dump */
	int af;
};

376
377
378 static bool check_ifaddr(struct nlmsghdr *hdr, int ifindex)
379 {
380 struct ifaddrmsg *ifa = NLMSG_DATA(hdr);
381
382 return ifa->ifa_index == ifindex;
383 }
384
385 static bool check_route(struct nlmsghdr *hdr, int ifindex)
386 {
387 struct rtmsg *r = NLMSG_DATA(hdr);
388 struct nlattr *tb[__RTA_MAX];
389
390 if (r->rtm_protocol == RTPROT_KERNEL &&
391 r->rtm_family == AF_INET6)
392 return false;
393
394 nlmsg_parse(hdr, sizeof(struct rtmsg), tb, __RTA_MAX - 1, NULL);
395 if (!tb[RTA_OIF])
396 return false;
397
398 return *(int *)RTA_DATA(tb[RTA_OIF]) == ifindex;
399 }
400
/* Rule filter for cb_clear_event(): accepts every rule, ignoring both arguments. */
static bool check_rule(struct nlmsghdr *hdr, int ifindex)
{
	(void) hdr;
	(void) ifindex;

	return true;
}
405
406 static int cb_clear_event(struct nl_msg *msg, void *arg)
407 {
408 struct clear_data *clr = arg;
409 struct nlmsghdr *hdr = nlmsg_hdr(msg);
410 bool (*cb)(struct nlmsghdr *, int ifindex);
411 int type;
412
413 switch(clr->type) {
414 case RTM_GETADDR:
415 type = RTM_DELADDR;
416 if (hdr->nlmsg_type != RTM_NEWADDR)
417 return NL_SKIP;
418
419 cb = check_ifaddr;
420 break;
421 case RTM_GETROUTE:
422 type = RTM_DELROUTE;
423 if (hdr->nlmsg_type != RTM_NEWROUTE)
424 return NL_SKIP;
425
426 cb = check_route;
427 break;
428 case RTM_GETRULE:
429 type = RTM_DELRULE;
430 if (hdr->nlmsg_type != RTM_NEWRULE)
431 return NL_SKIP;
432
433 cb = check_rule;
434 break;
435 default:
436 return NL_SKIP;
437 }
438
439 if (!cb(hdr, clr->dev ? clr->dev->ifindex : 0))
440 return NL_SKIP;
441
442 if (type == RTM_DELRULE)
443 D(SYSTEM, "Remove a rule\n");
444 else
445 D(SYSTEM, "Remove %s from device %s\n",
446 type == RTM_DELADDR ? "an address" : "a route",
447 clr->dev->ifname);
448 memcpy(nlmsg_hdr(clr->msg), hdr, hdr->nlmsg_len);
449 hdr = nlmsg_hdr(clr->msg);
450 hdr->nlmsg_type = type;
451 hdr->nlmsg_flags = NLM_F_REQUEST;
452
453 if (!nl_send_auto_complete(sock_rtnl, clr->msg))
454 nl_wait_for_ack(sock_rtnl);
455
456 return NL_SKIP;
457 }
458
459 static int
460 cb_finish_event(struct nl_msg *msg, void *arg)
461 {
462 int *pending = arg;
463 *pending = 0;
464 return NL_STOP;
465 }
466
467 static int
468 error_handler(struct sockaddr_nl *nla, struct nlmsgerr *err, void *arg)
469 {
470 int *pending = arg;
471 *pending = err->error;
472 return NL_STOP;
473 }
474
475 static void
476 system_if_clear_entries(struct device *dev, int type, int af)
477 {
478 struct clear_data clr;
479 struct nl_cb *cb = nl_cb_alloc(NL_CB_DEFAULT);
480 struct rtmsg rtm = {
481 .rtm_family = af,
482 .rtm_flags = RTM_F_CLONED,
483 };
484 int flags = NLM_F_DUMP;
485 int pending = 1;
486
487 clr.af = af;
488 clr.dev = dev;
489 clr.type = type;
490 switch (type) {
491 case RTM_GETADDR:
492 case RTM_GETRULE:
493 clr.size = sizeof(struct rtgenmsg);
494 break;
495 case RTM_GETROUTE:
496 clr.size = sizeof(struct rtmsg);
497 break;
498 default:
499 return;
500 }
501
502 if (!cb)
503 return;
504
505 clr.msg = nlmsg_alloc_simple(type, flags);
506 if (!clr.msg)
507 goto out;
508
509 nlmsg_append(clr.msg, &rtm, clr.size, 0);
510 nl_cb_set(cb, NL_CB_VALID, NL_CB_CUSTOM, cb_clear_event, &clr);
511 nl_cb_set(cb, NL_CB_FINISH, NL_CB_CUSTOM, cb_finish_event, &pending);
512 nl_cb_err(cb, NL_CB_CUSTOM, error_handler, &pending);
513
514 nl_send_auto_complete(sock_rtnl, clr.msg);
515 while (pending > 0)
516 nl_recvmsgs(sock_rtnl, cb);
517
518 nlmsg_free(clr.msg);
519 out:
520 nl_cb_put(cb);
521 }
522
523 /*
524 * Clear bridge (membership) state and bring down device
525 */
526 void system_if_clear_state(struct device *dev)
527 {
528 static char buf[256];
529 char *bridge;
530
531 if (dev->external)
532 return;
533
534 dev->ifindex = system_if_resolve(dev);
535 if (!dev->ifindex)
536 return;
537
538 system_if_flags(dev->ifname, 0, IFF_UP);
539
540 if (system_is_bridge(dev->ifname, buf, sizeof(buf))) {
541 D(SYSTEM, "Delete existing bridge named '%s'\n", dev->ifname);
542 system_bridge_delbr(dev);
543 return;
544 }
545
546 bridge = system_get_bridge(dev->ifname, buf, sizeof(buf));
547 if (bridge) {
548 D(SYSTEM, "Remove device '%s' from bridge '%s'\n", dev->ifname, bridge);
549 system_bridge_if(bridge, dev, SIOCBRDELIF, NULL);
550 }
551
552 system_if_clear_entries(dev, RTM_GETROUTE, AF_INET);
553 system_if_clear_entries(dev, RTM_GETADDR, AF_INET);
554 system_if_clear_entries(dev, RTM_GETROUTE, AF_INET6);
555 system_if_clear_entries(dev, RTM_GETADDR, AF_INET6);
556 system_set_disable_ipv6(dev, "0");
557 }
558
/* Convert a number of seconds into ticks by multiplying it by 100. */
static inline unsigned long
sec_to_jiffies(int val)
{
	unsigned long secs = (unsigned long) val;

	return secs * 100;
}
564
565 int system_bridge_addbr(struct device *bridge, struct bridge_config *cfg)
566 {
567 unsigned long args[4] = {};
568
569 if (ioctl(sock_ioctl, SIOCBRADDBR, bridge->ifname) < 0)
570 return -1;
571
572 args[0] = BRCTL_SET_BRIDGE_STP_STATE;
573 args[1] = !!cfg->stp;
574 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
575
576 args[0] = BRCTL_SET_BRIDGE_FORWARD_DELAY;
577 args[1] = sec_to_jiffies(cfg->forward_delay);
578 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
579
580 system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_snooping",
581 bridge->ifname, cfg->igmp_snoop ? "1" : "0");
582
583 if (cfg->flags & BRIDGE_OPT_AGEING_TIME) {
584 args[0] = BRCTL_SET_AGEING_TIME;
585 args[1] = sec_to_jiffies(cfg->ageing_time);
586 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
587 }
588
589 if (cfg->flags & BRIDGE_OPT_HELLO_TIME) {
590 args[0] = BRCTL_SET_BRIDGE_HELLO_TIME;
591 args[1] = sec_to_jiffies(cfg->hello_time);
592 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
593 }
594
595 if (cfg->flags & BRIDGE_OPT_MAX_AGE) {
596 args[0] = BRCTL_SET_BRIDGE_MAX_AGE;
597 args[1] = sec_to_jiffies(cfg->max_age);
598 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
599 }
600
601 return 0;
602 }
603
604 static int system_vlan(struct device *dev, int id)
605 {
606 struct vlan_ioctl_args ifr = {
607 .cmd = SET_VLAN_NAME_TYPE_CMD,
608 .u.name_type = VLAN_NAME_TYPE_RAW_PLUS_VID_NO_PAD,
609 };
610
611 ioctl(sock_ioctl, SIOCSIFVLAN, &ifr);
612
613 if (id < 0) {
614 ifr.cmd = DEL_VLAN_CMD;
615 ifr.u.VID = 0;
616 } else {
617 ifr.cmd = ADD_VLAN_CMD;
618 ifr.u.VID = id;
619 }
620 strncpy(ifr.device1, dev->ifname, sizeof(ifr.device1));
621 return ioctl(sock_ioctl, SIOCSIFVLAN, &ifr);
622 }
623
/* Add VLAN @id on top of @dev; returns the result of system_vlan(). */
int system_vlan_add(struct device *dev, int id)
{
	int ret = system_vlan(dev, id);

	return ret;
}
628
/* Delete the VLAN device @dev; returns the result of system_vlan(). */
int system_vlan_del(struct device *dev)
{
	/* a negative id selects the delete operation */
	const int delete_id = -1;

	return system_vlan(dev, delete_id);
}
633
634 static void
635 system_if_get_settings(struct device *dev, struct device_settings *s)
636 {
637 struct ifreq ifr;
638
639 memset(&ifr, 0, sizeof(ifr));
640 strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name));
641
642 if (ioctl(sock_ioctl, SIOCGIFMTU, &ifr) == 0) {
643 s->mtu = ifr.ifr_mtu;
644 s->flags |= DEV_OPT_MTU;
645 }
646
647 if (ioctl(sock_ioctl, SIOCGIFTXQLEN, &ifr) == 0) {
648 s->txqueuelen = ifr.ifr_qlen;
649 s->flags |= DEV_OPT_TXQUEUELEN;
650 }
651
652 if (ioctl(sock_ioctl, SIOCGIFHWADDR, &ifr) == 0) {
653 memcpy(s->macaddr, &ifr.ifr_hwaddr.sa_data, sizeof(s->macaddr));
654 s->flags |= DEV_OPT_MACADDR;
655 }
656 }
657
658 void
659 system_if_apply_settings(struct device *dev, struct device_settings *s)
660 {
661 struct ifreq ifr;
662
663 memset(&ifr, 0, sizeof(ifr));
664 strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name));
665 if (s->flags & DEV_OPT_MTU) {
666 ifr.ifr_mtu = s->mtu;
667 if (ioctl(sock_ioctl, SIOCSIFMTU, &ifr) < 0)
668 s->flags &= ~DEV_OPT_MTU;
669 }
670 if (s->flags & DEV_OPT_TXQUEUELEN) {
671 ifr.ifr_qlen = s->txqueuelen;
672 if (ioctl(sock_ioctl, SIOCSIFTXQLEN, &ifr) < 0)
673 s->flags &= ~DEV_OPT_TXQUEUELEN;
674 }
675 if ((s->flags & DEV_OPT_MACADDR) && !dev->external) {
676 ifr.ifr_hwaddr.sa_family = ARPHRD_ETHER;
677 memcpy(&ifr.ifr_hwaddr.sa_data, s->macaddr, sizeof(s->macaddr));
678 if (ioctl(sock_ioctl, SIOCSIFHWADDR, &ifr) < 0)
679 s->flags &= ~DEV_OPT_MACADDR;
680 }
681 }
682
683 int system_if_up(struct device *dev)
684 {
685 system_if_get_settings(dev, &dev->orig_settings);
686 system_if_apply_settings(dev, &dev->settings);
687 dev->ifindex = system_if_resolve(dev);
688 return system_if_flags(dev->ifname, IFF_UP, 0);
689 }
690
691 int system_if_down(struct device *dev)
692 {
693 int ret = system_if_flags(dev->ifname, 0, IFF_UP);
694 dev->orig_settings.flags &= dev->settings.flags;
695 system_if_apply_settings(dev, &dev->orig_settings);
696 return ret;
697 }
698
/*
 * Update the presence state of @dev: it counts as present when its name
 * resolves to an interface index. Always returns 0.
 */
int system_if_check(struct device *dev)
{
	bool present = system_if_resolve(dev) > 0;

	device_set_present(dev, present);

	return 0;
}
704
705 struct device *
706 system_if_get_parent(struct device *dev)
707 {
708 char buf[64], *devname;
709 int ifindex, iflink, len;
710 FILE *f;
711
712 snprintf(buf, sizeof(buf), "/sys/class/net/%s/iflink", dev->ifname);
713 f = fopen(buf, "r");
714 if (!f)
715 return NULL;
716
717 len = fread(buf, 1, sizeof(buf) - 1, f);
718 fclose(f);
719
720 if (len <= 0)
721 return NULL;
722
723 buf[len] = 0;
724 iflink = strtoul(buf, NULL, 0);
725 ifindex = system_if_resolve(dev);
726 if (!iflink || iflink == ifindex)
727 return NULL;
728
729 devname = if_indextoname(iflink, buf);
730 if (!devname)
731 return NULL;
732
733 return device_get(devname, true);
734 }
735
/*
 * Read the first line of a file into @buf.
 *
 * @dir_fd: directory descriptor that @file is resolved against (openat)
 * @file: file name
 * @buf: destination; terminated, and cut at the first newline
 * @len: size of @buf in bytes
 *
 * Returns true if at least one byte was read, false otherwise.
 */
static bool
read_string_file(int dir_fd, const char *file, char *buf, int len)
{
	ssize_t n;
	char *c;
	int fd;

	if (len <= 0)
		return false;

	fd = openat(dir_fd, file, O_RDONLY);
	if (fd < 0)
		return false;

	/*
	 * The result is kept in its own variable: retrying after EINTR must
	 * use the original buffer size, not the -1 returned by the failed read.
	 */
	do {
		n = read(fd, buf, len - 1);
	} while (n < 0 && errno == EINTR);

	close(fd);

	if (n <= 0)
		return false;

	buf[n] = 0;

	c = strchr(buf, '\n');
	if (c)
		*c = 0;

	return true;
}
766
/*
 * Read an unsigned integer from a file below @dir_fd.
 *
 * @val is only written when the file could be read; the text is converted
 * with strtoull() using automatic base detection.
 *
 * Returns true if the file could be read.
 */
static bool
read_uint64_file(int dir_fd, const char *file, uint64_t *val)
{
	char text[64];

	if (!read_string_file(dir_fd, file, text, sizeof(text)))
		return false;

	*val = strtoull(text, NULL, 0);
	return true;
}
779
780 /* Assume advertised flags == supported flags */
781 static const struct {
782 uint32_t mask;
783 const char *name;
784 } ethtool_link_modes[] = {
785 { ADVERTISED_10baseT_Half, "10H" },
786 { ADVERTISED_10baseT_Full, "10F" },
787 { ADVERTISED_100baseT_Half, "100H" },
788 { ADVERTISED_100baseT_Full, "100F" },
789 { ADVERTISED_1000baseT_Half, "1000H" },
790 { ADVERTISED_1000baseT_Full, "1000F" },
791 };
792
793 static void system_add_link_modes(struct blob_buf *b, __u32 mask)
794 {
795 int i;
796 for (i = 0; i < ARRAY_SIZE(ethtool_link_modes); i++) {
797 if (mask & ethtool_link_modes[i].mask)
798 blobmsg_add_string(b, NULL, ethtool_link_modes[i].name);
799 }
800 }
801
/*
 * Report whether @ifname must be treated as an external device, which is
 * the case when /sys/class/net/<ifname>/phy80211 exists.
 */
bool
system_if_force_external(const char *ifname)
{
	struct stat info;
	char path[64];

	snprintf(path, sizeof(path), "/sys/class/net/%s/phy80211", ifname);

	if (stat(path, &info) != 0)
		return false;

	return true;
}
811
812 int
813 system_if_dump_info(struct device *dev, struct blob_buf *b)
814 {
815 struct ethtool_cmd ecmd;
816 struct ifreq ifr;
817 char buf[64], *s;
818 void *c;
819 int dir_fd;
820 uint64_t val = 0;
821
822 snprintf(buf, sizeof(buf), "/sys/class/net/%s", dev->ifname);
823 dir_fd = open(buf, O_DIRECTORY);
824
825 if (read_uint64_file(dir_fd, "carrier", &val))
826 blobmsg_add_u8(b, "link", !!val);
827
828 memset(&ecmd, 0, sizeof(ecmd));
829 memset(&ifr, 0, sizeof(ifr));
830 strcpy(ifr.ifr_name, dev->ifname);
831 ifr.ifr_data = (caddr_t) &ecmd;
832 ecmd.cmd = ETHTOOL_GSET;
833
834 if (ioctl(sock_ioctl, SIOCETHTOOL, &ifr) == 0) {
835 c = blobmsg_open_array(b, "link-advertising");
836 system_add_link_modes(b, ecmd.advertising);
837 blobmsg_close_array(b, c);
838
839 c = blobmsg_open_array(b, "link-supported");
840 system_add_link_modes(b, ecmd.supported);
841 blobmsg_close_array(b, c);
842
843 s = blobmsg_alloc_string_buffer(b, "speed", 8);
844 snprintf(s, 8, "%d%c", ethtool_cmd_speed(&ecmd),
845 ecmd.duplex == DUPLEX_HALF ? 'H' : 'F');
846 blobmsg_add_string_buffer(b);
847 }
848
849 close(dir_fd);
850 return 0;
851 }
852
853 int
854 system_if_dump_stats(struct device *dev, struct blob_buf *b)
855 {
856 const char *const counters[] = {
857 "collisions", "rx_frame_errors", "tx_compressed",
858 "multicast", "rx_length_errors", "tx_dropped",
859 "rx_bytes", "rx_missed_errors", "tx_errors",
860 "rx_compressed", "rx_over_errors", "tx_fifo_errors",
861 "rx_crc_errors", "rx_packets", "tx_heartbeat_errors",
862 "rx_dropped", "tx_aborted_errors", "tx_packets",
863 "rx_errors", "tx_bytes", "tx_window_errors",
864 "rx_fifo_errors", "tx_carrier_errors",
865 };
866 char buf[64];
867 int stats_dir;
868 int i;
869 uint64_t val = 0;
870
871 snprintf(buf, sizeof(buf), "/sys/class/net/%s/statistics", dev->ifname);
872 stats_dir = open(buf, O_DIRECTORY);
873 if (stats_dir < 0)
874 return -1;
875
876 for (i = 0; i < ARRAY_SIZE(counters); i++)
877 if (read_uint64_file(stats_dir, counters[i], &val))
878 blobmsg_add_u64(b, counters[i], val);
879
880 close(stats_dir);
881 return 0;
882 }
883
884 static int system_addr(struct device *dev, struct device_addr *addr, int cmd)
885 {
886 bool v4 = ((addr->flags & DEVADDR_FAMILY) == DEVADDR_INET4);
887 int alen = v4 ? 4 : 16;
888 unsigned int flags = 0;
889 struct ifaddrmsg ifa = {
890 .ifa_family = (alen == 4) ? AF_INET : AF_INET6,
891 .ifa_prefixlen = addr->mask,
892 .ifa_index = dev->ifindex,
893 };
894
895 struct nl_msg *msg;
896 if (cmd == RTM_NEWADDR)
897 flags |= NLM_F_CREATE | NLM_F_REPLACE;
898
899 msg = nlmsg_alloc_simple(cmd, flags);
900 if (!msg)
901 return -1;
902
903 nlmsg_append(msg, &ifa, sizeof(ifa), 0);
904 nla_put(msg, IFA_LOCAL, alen, &addr->addr);
905 if (v4) {
906 if (addr->broadcast)
907 nla_put_u32(msg, IFA_BROADCAST, addr->broadcast);
908 if (addr->point_to_point)
909 nla_put_u32(msg, IFA_ADDRESS, addr->point_to_point);
910 } else {
911 time_t now = system_get_rtime();
912 struct ifa_cacheinfo cinfo = {0xffffffffU, 0xffffffffU, 0, 0};
913
914 if (addr->preferred_until) {
915 int preferred = addr->preferred_until - now;
916 if (preferred < 0)
917 preferred = 0;
918
919 cinfo.ifa_prefered = preferred;
920 }
921
922 if (addr->valid_until) {
923 int valid = addr->valid_until - now;
924 if (valid <= 0)
925 return -1;
926
927 cinfo.ifa_valid = valid;
928 }
929
930 nla_put(msg, IFA_CACHEINFO, sizeof(cinfo), &cinfo);
931 }
932
933 return system_rtnl_call(msg);
934 }
935
936 int system_add_address(struct device *dev, struct device_addr *addr)
937 {
938 return system_addr(dev, addr, RTM_NEWADDR);
939 }
940
941 int system_del_address(struct device *dev, struct device_addr *addr)
942 {
943 return system_addr(dev, addr, RTM_DELADDR);
944 }
945
946 static int system_rt(struct device *dev, struct device_route *route, int cmd)
947 {
948 int alen = ((route->flags & DEVADDR_FAMILY) == DEVADDR_INET4) ? 4 : 16;
949 bool have_gw;
950 unsigned int flags = 0;
951
952 if (alen == 4)
953 have_gw = !!route->nexthop.in.s_addr;
954 else
955 have_gw = route->nexthop.in6.s6_addr32[0] ||
956 route->nexthop.in6.s6_addr32[1] ||
957 route->nexthop.in6.s6_addr32[2] ||
958 route->nexthop.in6.s6_addr32[3];
959
960 unsigned char scope = (cmd == RTM_DELROUTE) ? RT_SCOPE_NOWHERE :
961 (have_gw) ? RT_SCOPE_UNIVERSE : RT_SCOPE_LINK;
962
963 unsigned int table = (route->flags & DEVROUTE_TABLE) ? route->table : RT_TABLE_MAIN;
964
965 struct rtmsg rtm = {
966 .rtm_family = (alen == 4) ? AF_INET : AF_INET6,
967 .rtm_dst_len = route->mask,
968 .rtm_table = (table < 256) ? table : RT_TABLE_UNSPEC,
969 .rtm_protocol = (route->flags & DEVADDR_KERNEL) ? RTPROT_KERNEL : RTPROT_STATIC,
970 .rtm_scope = scope,
971 .rtm_type = (cmd == RTM_DELROUTE) ? 0: RTN_UNICAST,
972 };
973 struct nl_msg *msg;
974
975 if (cmd == RTM_NEWROUTE) {
976 flags |= NLM_F_CREATE | NLM_F_REPLACE;
977
978 if (!dev) { // Add null-route
979 rtm.rtm_scope = RT_SCOPE_UNIVERSE;
980 rtm.rtm_type = RTN_UNREACHABLE;
981 }
982 }
983
984 msg = nlmsg_alloc_simple(cmd, flags);
985 if (!msg)
986 return -1;
987
988 nlmsg_append(msg, &rtm, sizeof(rtm), 0);
989
990 if (route->mask)
991 nla_put(msg, RTA_DST, alen, &route->addr);
992
993 if (route->metric > 0)
994 nla_put_u32(msg, RTA_PRIORITY, route->metric);
995
996 if (have_gw)
997 nla_put(msg, RTA_GATEWAY, alen, &route->nexthop);
998
999 if (dev)
1000 nla_put_u32(msg, RTA_OIF, dev->ifindex);
1001
1002 if (table >= 256)
1003 nla_put_u32(msg, RTA_TABLE, table);
1004
1005 return system_rtnl_call(msg);
1006 }
1007
1008 int system_add_route(struct device *dev, struct device_route *route)
1009 {
1010 return system_rt(dev, route, RTM_NEWROUTE);
1011 }
1012
1013 int system_del_route(struct device *dev, struct device_route *route)
1014 {
1015 return system_rt(dev, route, RTM_DELROUTE);
1016 }
1017
/*
 * Write "-1" to the IPv4 and IPv6 route flush files in /proc.
 * Files that cannot be opened are skipped. Always returns 0.
 */
int system_flush_routes(void)
{
	static const char *const flush_files[] = {
		"/proc/sys/net/ipv4/route/flush",
		"/proc/sys/net/ipv6/route/flush"
	};
	size_t idx;

	for (idx = 0; idx < ARRAY_SIZE(flush_files); idx++) {
		int fd = open(flush_files[idx], O_WRONLY);

		if (fd >= 0) {
			write(fd, "-1", 2);
			close(fd);
		}
	}

	return 0;
}
1036
/*
 * Resolve a routing table given by number or name.
 *
 * @name: a positive number (any base understood by strtoul with base 0),
 *        one of the aliases "default", "main", "local", or a name listed in
 *        /etc/iproute2/rt_tables
 * @id: receives the table id; the main table is reported as RT_TABLE_UNSPEC
 *
 * Returns false if the name cannot be resolved (or resolves to table 0),
 * in which case @id is not written.
 */
bool system_resolve_rt_table(const char *name, unsigned int *id)
{
	FILE *f;
	char *e, buf[128];
	unsigned long val;
	unsigned int n, table = RT_TABLE_UNSPEC;

	/*
	 * first try to parse table as number; values that overflow or do not
	 * fit into the unsigned int id are not treated as numbers, so they
	 * cannot silently alias a small table id
	 */
	errno = 0;
	val = strtoul(name, &e, 0);
	if (val > 0 && !*e && errno != ERANGE && val == (unsigned int) val)
		table = val;

	/* handle well known aliases */
	else if (!strcmp(name, "default"))
		table = RT_TABLE_DEFAULT;
	else if (!strcmp(name, "main"))
		table = RT_TABLE_MAIN;
	else if (!strcmp(name, "local"))
		table = RT_TABLE_LOCAL;

	/* try to look up name in /etc/iproute2/rt_tables */
	else if ((f = fopen("/etc/iproute2/rt_tables", "r")) != NULL)
	{
		while (fgets(buf, sizeof(buf) - 1, f) != NULL)
		{
			/* skip empty lines and comments */
			if ((e = strtok(buf, " \t\n")) == NULL || *e == '#')
				continue;

			/* each entry is "<number> <name>" */
			n = strtoul(e, NULL, 10);
			e = strtok(NULL, " \t\n");

			if (e && !strcmp(e, name))
			{
				table = n;
				break;
			}
		}

		fclose(f);
	}

	if (table == RT_TABLE_UNSPEC)
		return false;

	/* do not consider main table special */
	if (table == RT_TABLE_MAIN)
		table = RT_TABLE_UNSPEC;

	*id = table;
	return true;
}
1086
1087 static int system_iprule(struct iprule *rule, int cmd)
1088 {
1089 int alen = ((rule->flags & IPRULE_FAMILY) == IPRULE_INET4) ? 4 : 16;
1090
1091 struct nl_msg *msg;
1092 struct rtmsg rtm = {
1093 .rtm_family = (alen == 4) ? AF_INET : AF_INET6,
1094 .rtm_protocol = RTPROT_STATIC,
1095 .rtm_scope = RT_SCOPE_UNIVERSE,
1096 .rtm_table = RT_TABLE_UNSPEC,
1097 .rtm_type = RTN_UNSPEC,
1098 .rtm_flags = 0,
1099 };
1100
1101 if (cmd == RTM_NEWRULE) {
1102 rtm.rtm_type = RTN_UNICAST;
1103 rtm.rtm_flags |= NLM_F_REPLACE | NLM_F_EXCL;
1104 }
1105
1106 if (rule->invert)
1107 rtm.rtm_flags |= FIB_RULE_INVERT;
1108
1109 if (rule->flags & IPRULE_SRC)
1110 rtm.rtm_src_len = rule->src_mask;
1111
1112 if (rule->flags & IPRULE_DEST)
1113 rtm.rtm_dst_len = rule->dest_mask;
1114
1115 if (rule->flags & IPRULE_TOS)
1116 rtm.rtm_tos = rule->tos;
1117
1118 if (rule->flags & IPRULE_LOOKUP) {
1119 if (rule->lookup < 256)
1120 rtm.rtm_table = rule->lookup;
1121 }
1122
1123 if (rule->flags & IPRULE_ACTION)
1124 rtm.rtm_type = rule->action;
1125 else if (rule->flags & IPRULE_GOTO)
1126 rtm.rtm_type = FR_ACT_GOTO;
1127 else if (!(rule->flags & (IPRULE_LOOKUP | IPRULE_ACTION | IPRULE_GOTO)))
1128 rtm.rtm_type = FR_ACT_NOP;
1129
1130 msg = nlmsg_alloc_simple(cmd, NLM_F_REQUEST);
1131
1132 if (!msg)
1133 return -1;
1134
1135 nlmsg_append(msg, &rtm, sizeof(rtm), 0);
1136
1137 if (rule->flags & IPRULE_IN)
1138 nla_put(msg, FRA_IFNAME, strlen(rule->in_dev) + 1, rule->in_dev);
1139
1140 if (rule->flags & IPRULE_OUT)
1141 nla_put(msg, FRA_OIFNAME, strlen(rule->out_dev) + 1, rule->out_dev);
1142
1143 if (rule->flags & IPRULE_SRC)
1144 nla_put(msg, FRA_SRC, alen, &rule->src_addr);
1145
1146 if (rule->flags & IPRULE_DEST)
1147 nla_put(msg, FRA_DST, alen, &rule->dest_addr);
1148
1149 if (rule->flags & IPRULE_PRIORITY)
1150 nla_put_u32(msg, FRA_PRIORITY, rule->priority);
1151
1152 if (rule->flags & IPRULE_FWMARK)
1153 nla_put_u32(msg, FRA_FWMARK, rule->fwmark);
1154
1155 if (rule->flags & IPRULE_FWMASK)
1156 nla_put_u32(msg, FRA_FWMASK, rule->fwmask);
1157
1158 if (rule->flags & IPRULE_LOOKUP) {
1159 if (rule->lookup >= 256)
1160 nla_put_u32(msg, FRA_TABLE, rule->lookup);
1161 }
1162
1163 if (rule->flags & IPRULE_GOTO)
1164 nla_put_u32(msg, FRA_GOTO, rule->gotoid);
1165
1166 return system_rtnl_call(msg);
1167 }
1168
1169 int system_add_iprule(struct iprule *rule)
1170 {
1171 return system_iprule(rule, RTM_NEWRULE);
1172 }
1173
1174 int system_del_iprule(struct iprule *rule)
1175 {
1176 return system_iprule(rule, RTM_DELRULE);
1177 }
1178
1179 int system_flush_iprules(void)
1180 {
1181 int rv = 0;
1182 struct iprule rule;
1183
1184 system_if_clear_entries(NULL, RTM_GETRULE, AF_INET);
1185 system_if_clear_entries(NULL, RTM_GETRULE, AF_INET6);
1186
1187 memset(&rule, 0, sizeof(rule));
1188
1189
1190 rule.flags = IPRULE_INET4 | IPRULE_PRIORITY | IPRULE_LOOKUP;
1191
1192 rule.priority = 0;
1193 rule.lookup = RT_TABLE_LOCAL;
1194 rv |= system_iprule(&rule, RTM_NEWRULE);
1195
1196 rule.priority = 32766;
1197 rule.lookup = RT_TABLE_MAIN;
1198 rv |= system_iprule(&rule, RTM_NEWRULE);
1199
1200 rule.priority = 32767;
1201 rule.lookup = RT_TABLE_DEFAULT;
1202 rv |= system_iprule(&rule, RTM_NEWRULE);
1203
1204
1205 rule.flags = IPRULE_INET6 | IPRULE_PRIORITY | IPRULE_LOOKUP;
1206
1207 rule.priority = 0;
1208 rule.lookup = RT_TABLE_LOCAL;
1209 rv |= system_iprule(&rule, RTM_NEWRULE);
1210
1211 rule.priority = 32766;
1212 rule.lookup = RT_TABLE_MAIN;
1213 rv |= system_iprule(&rule, RTM_NEWRULE);
1214
1215 return rv;
1216 }
1217
/*
 * Resolve a rule action given by name or number.
 *
 * @action: one of the route type names listed below, or a number in the
 *          range 0..255 (any base understood by strtoul with base 0)
 * @id: receives the numeric action; not written on failure
 *
 * Returns true if @action could be resolved.
 */
bool system_resolve_iprule_action(const char *action, unsigned int *id)
{
	static const struct {
		const char *name;
		unsigned int type;
	} names[] = {
		{ "local",       RTN_LOCAL },
		{ "nat",         RTN_NAT },
		{ "broadcast",   RTN_BROADCAST },
		{ "anycast",     RTN_ANYCAST },
		{ "multicast",   RTN_MULTICAST },
		{ "prohibit",    RTN_PROHIBIT },
		{ "unreachable", RTN_UNREACHABLE },
		{ "blackhole",   RTN_BLACKHOLE },
		{ "xresolve",    RTN_XRESOLVE },
		{ "unicast",     RTN_UNICAST },
		{ "throw",       RTN_THROW },
	};
	unsigned long val;
	char *e;
	size_t i;

	for (i = 0; i < sizeof(names) / sizeof(names[0]); i++) {
		if (!strcmp(action, names[i].name)) {
			*id = names[i].type;
			return true;
		}
	}

	/*
	 * The range check runs on the full strtoul() result; narrowing it
	 * first would let huge values wrap into the accepted range.
	 */
	val = strtoul(action, &e, 0);
	if (!e || *e || e == action || val > 255)
		return false;

	*id = val;
	return true;
}
1254
1255 time_t system_get_rtime(void)
1256 {
1257 struct timespec ts;
1258 struct timeval tv;
1259
1260 if (syscall(__NR_clock_gettime, CLOCK_MONOTONIC, &ts) == 0)
1261 return ts.tv_sec;
1262
1263 if (gettimeofday(&tv, NULL) == 0)
1264 return tv.tv_sec;
1265
1266 return 0;
1267 }
1268
1269 #ifndef IP_DF
1270 #define IP_DF 0x4000
1271 #endif
1272
1273 static void tunnel_parm_init(struct ip_tunnel_parm *p)
1274 {
1275 memset(p, 0, sizeof(*p));
1276 p->iph.version = 4;
1277 p->iph.ihl = 5;
1278 p->iph.frag_off = htons(IP_DF);
1279 }
1280
1281 static int tunnel_ioctl(const char *name, int cmd, void *p)
1282 {
1283 struct ifreq ifr;
1284
1285 memset(&ifr, 0, sizeof(ifr));
1286 strncpy(ifr.ifr_name, name, sizeof(ifr.ifr_name));
1287 ifr.ifr_ifru.ifru_data = p;
1288 return ioctl(sock_ioctl, cmd, &ifr);
1289 }
1290
1291 int system_del_ip_tunnel(const char *name)
1292 {
1293 struct ip_tunnel_parm p;
1294
1295 tunnel_parm_init(&p);
1296 return tunnel_ioctl(name, SIOCDELTUNNEL, &p);
1297 }
1298
1299 int system_update_ipv6_mtu(struct device *dev, int mtu)
1300 {
1301 int ret = -1;
1302 char buf[64];
1303 snprintf(buf, sizeof(buf), "/proc/sys/net/ipv6/conf/%s/mtu",
1304 dev->ifname);
1305
1306 int fd = open(buf, O_RDWR);
1307 ssize_t len = read(fd, buf, sizeof(buf) - 1);
1308 if (len < 0)
1309 goto out;
1310
1311 buf[len] = 0;
1312 ret = atoi(buf);
1313
1314 if (!mtu || ret <= mtu)
1315 goto out;
1316
1317 lseek(fd, 0, SEEK_SET);
1318 if (write(fd, buf, snprintf(buf, sizeof(buf), "%i", mtu)) <= 0)
1319 ret = -1;
1320
1321 out:
1322 close(fd);
1323 return ret;
1324 }
1325
1326 static int parse_ipaddr(struct blob_attr *attr, __be32 *addr)
1327 {
1328 if (!attr)
1329 return 1;
1330
1331 return inet_pton(AF_INET, blobmsg_data(attr), (void *) addr);
1332 }
1333
1334
1335 int system_add_ip_tunnel(const char *name, struct blob_attr *attr)
1336 {
1337 struct blob_attr *tb[__TUNNEL_ATTR_MAX];
1338 struct blob_attr *cur;
1339 struct ip_tunnel_parm p;
1340 const char *base, *str;
1341 bool is_sit;
1342
1343 system_del_ip_tunnel(name);
1344
1345 tunnel_parm_init(&p);
1346
1347 blobmsg_parse(tunnel_attr_list.params, __TUNNEL_ATTR_MAX, tb,
1348 blob_data(attr), blob_len(attr));
1349
1350 if (!(cur = tb[TUNNEL_ATTR_TYPE]))
1351 return -EINVAL;
1352 str = blobmsg_data(cur);
1353 is_sit = !strcmp(str, "sit");
1354
1355 if (is_sit) {
1356 p.iph.protocol = IPPROTO_IPV6;
1357 base = "sit0";
1358 } else
1359 return -EINVAL;
1360
1361 if (!parse_ipaddr(tb[TUNNEL_ATTR_LOCAL], &p.iph.saddr))
1362 return -EINVAL;
1363
1364 if (!parse_ipaddr(tb[TUNNEL_ATTR_REMOTE], &p.iph.daddr))
1365 return -EINVAL;
1366
1367 if ((cur = tb[TUNNEL_ATTR_TTL])) {
1368 unsigned int val = blobmsg_get_u32(cur);
1369
1370 if (val > 255)
1371 return -EINVAL;
1372
1373 p.iph.ttl = val;
1374 }
1375
1376 strncpy(p.name, name, sizeof(p.name));
1377 if (tunnel_ioctl(base, SIOCADDTUNNEL, &p) < 0)
1378 return -1;
1379
1380 #ifdef SIOCADD6RD
1381 cur = tb[TUNNEL_ATTR_6RD_PREFIX];
1382 if (cur && is_sit) {
1383 unsigned int mask;
1384 struct ip_tunnel_6rd p6;
1385
1386 memset(&p6, 0, sizeof(p6));
1387
1388 if (!parse_ip_and_netmask(AF_INET6, blobmsg_data(cur),
1389 &p6.prefix, &mask) || mask > 128)
1390 return -EINVAL;
1391 p6.prefixlen = mask;
1392
1393 if ((cur = tb[TUNNEL_ATTR_6RD_RELAY_PREFIX])) {
1394 if (!parse_ip_and_netmask(AF_INET, blobmsg_data(cur),
1395 &p6.relay_prefix, &mask) || mask > 32)
1396 return -EINVAL;
1397 p6.relay_prefixlen = mask;
1398 }
1399
1400 if (tunnel_ioctl(name, SIOCADD6RD, &p6) < 0) {
1401 system_del_ip_tunnel(name);
1402 return -1;
1403 }
1404 }
1405 #endif
1406
1407 return 0;
1408 }