add a function for creating a raw event socket that does not use genl or rtnl
[project/netifd.git] / system-linux.c
1 #define _GNU_SOURCE
2
3 #include <sys/socket.h>
4 #include <sys/ioctl.h>
5 #include <sys/stat.h>
6 #include <sys/syscall.h>
7
8 #include <linux/rtnetlink.h>
9 #include <linux/sockios.h>
10 #include <linux/if_vlan.h>
11 #include <linux/if_bridge.h>
12
13 #include <unistd.h>
14 #include <string.h>
15 #include <fcntl.h>
16 #include <glob.h>
17
18 #include <netlink/msg.h>
19 #include <netlink/attr.h>
20 #include <netlink/socket.h>
21 #include <libubox/uloop.h>
22
23 #include "netifd.h"
24 #include "device.h"
25 #include "system.h"
26
27 struct event_socket {
28 struct uloop_fd uloop;
29 struct nl_sock *sock;
30 struct nl_cb *cb;
31 };
32
/* Descriptor that every ioctl() in this file is issued on; opened by system_init(). */
static int sock_ioctl = -1;

/* rtnetlink socket used for request/ack style calls; created by system_init(). */
static struct nl_sock *sock_rtnl;

/* Link event callback, defined below but referenced by system_init(). */
static int cb_rtnl_event(struct nl_msg *msg, void *arg);
37
38 static void
39 handler_nl_event(struct uloop_fd *u, unsigned int events)
40 {
41 struct event_socket *ev = container_of(u, struct event_socket, uloop);
42 nl_recvmsgs(ev->sock, ev->cb);
43 }
44
/*
 * Allocate a netlink socket and connect it to @protocol.
 *
 * Returns the connected socket, or NULL if allocation or connecting failed.
 * On a failed connect the freshly allocated socket is released again so it
 * does not leak.
 */
static struct nl_sock *
create_socket(int protocol)
{
	struct nl_sock *sock;

	sock = nl_socket_alloc();
	if (!sock)
		return NULL;

	if (nl_connect(sock, protocol)) {
		nl_socket_free(sock);
		return NULL;
	}

	return sock;
}
59
60 static bool
61 create_raw_event_socket(struct event_socket *ev, int protocol,
62 uloop_fd_handler cb)
63 {
64 ev->sock = create_socket(protocol);
65 if (!ev->sock)
66 return false;
67
68 ev->uloop.fd = nl_socket_get_fd(ev->sock);
69 ev->uloop.cb = handler_nl_event;
70 uloop_fd_add(&ev->uloop, ULOOP_READ | ULOOP_EDGE_TRIGGER);
71 return true;
72 }
73
74 static bool
75 create_event_socket(struct event_socket *ev, int protocol,
76 int (*cb)(struct nl_msg *msg, void *arg))
77 {
78 // Prepare socket for link events
79 ev->cb = nl_cb_alloc(NL_CB_DEFAULT);
80 if (!ev->cb)
81 return false;
82
83 nl_cb_set(ev->cb, NL_CB_VALID, NL_CB_CUSTOM, cb, NULL);
84
85 return create_raw_event_socket(ev, protocol, handler_nl_event);
86 }
87
88 int system_init(void)
89 {
90 static struct event_socket rtnl_event;
91
92 sock_ioctl = socket(AF_LOCAL, SOCK_DGRAM, 0);
93 fcntl(sock_ioctl, F_SETFD, fcntl(sock_ioctl, F_GETFD) | FD_CLOEXEC);
94
95 // Prepare socket for routing / address control
96 sock_rtnl = create_socket(NETLINK_ROUTE);
97 if (!sock_rtnl)
98 return -1;
99
100 if (!create_event_socket(&rtnl_event, NETLINK_ROUTE, cb_rtnl_event))
101 return -1;
102
103 // Receive network link events form kernel
104 nl_socket_add_membership(rtnl_event.sock, RTNLGRP_LINK);
105
106 return 0;
107 }
108
/*
 * Write the string @val (without its terminating NUL) to the file at @path.
 * Nothing happens if the file cannot be opened for writing; the result of
 * the write itself is not checked.
 */
static void system_set_sysctl(const char *path, const char *val)
{
	int handle = open(path, O_WRONLY);

	if (handle >= 0) {
		write(handle, val, strlen(val));
		close(handle);
	}
}
120
/*
 * Write @val to a per-device sysctl file.
 *
 * @path:   printf-style template containing one "%s" for the device name
 * @device: interface name substituted into @path
 * @val:    string written to the resulting file
 *
 * The template must be expanded with the device name; expanding it with
 * @val would address a file named after the value instead of the interface.
 */
static void system_set_dev_sysctl(const char *path, const char *device, const char *val)
{
	static char buf[256];

	snprintf(buf, sizeof(buf), path, device);
	system_set_sysctl(buf, val);
}
128
129 static void system_set_disable_ipv6(struct device *dev, const char *val)
130 {
131 system_set_dev_sysctl("/proc/sys/net/ipv6/conf/%s/disable_ipv6", dev->ifname, val);
132 }
133
134 // Evaluate netlink messages
135 static int cb_rtnl_event(struct nl_msg *msg, void *arg)
136 {
137 struct nlmsghdr *nh = nlmsg_hdr(msg);
138 struct ifinfomsg *ifi = NLMSG_DATA(nh);
139 struct nlattr *nla[__IFLA_MAX];
140
141 if (nh->nlmsg_type != RTM_DELLINK && nh->nlmsg_type != RTM_NEWLINK)
142 goto out;
143
144 nlmsg_parse(nh, sizeof(*ifi), nla, __IFLA_MAX - 1, NULL);
145 if (!nla[IFLA_IFNAME])
146 goto out;
147
148 struct device *dev = device_get(RTA_DATA(nla[IFLA_IFNAME]), false);
149 if (!dev)
150 goto out;
151
152 dev->ifindex = ifi->ifi_index;
153 device_set_present(dev, (nh->nlmsg_type == RTM_NEWLINK));
154
155 out:
156 return 0;
157 }
158
159 static int system_rtnl_call(struct nl_msg *msg)
160 {
161 int s = -(nl_send_auto_complete(sock_rtnl, msg)
162 || nl_wait_for_ack(sock_rtnl));
163 nlmsg_free(msg);
164 return s;
165 }
166
167 int system_bridge_delbr(struct device *bridge)
168 {
169 return ioctl(sock_ioctl, SIOCBRDELBR, bridge->ifname);
170 }
171
172 static int system_bridge_if(const char *bridge, struct device *dev, int cmd, void *data)
173 {
174 struct ifreq ifr;
175 if (dev)
176 ifr.ifr_ifindex = dev->ifindex;
177 else
178 ifr.ifr_data = data;
179 strncpy(ifr.ifr_name, bridge, sizeof(ifr.ifr_name));
180 return ioctl(sock_ioctl, cmd, &ifr);
181 }
182
183 int system_bridge_addif(struct device *bridge, struct device *dev)
184 {
185 system_set_disable_ipv6(dev, "1");
186 return system_bridge_if(bridge->ifname, dev, SIOCBRADDIF, NULL);
187 }
188
189 int system_bridge_delif(struct device *bridge, struct device *dev)
190 {
191 system_set_disable_ipv6(dev, "0");
192 return system_bridge_if(bridge->ifname, dev, SIOCBRDELIF, NULL);
193 }
194
/*
 * Report whether /sys/devices/virtual/net/<name>/bridge exists.
 * @buf (of @buflen bytes) is used as scratch space for the path.
 */
static bool system_is_bridge(const char *name, char *buf, int buflen)
{
	struct stat info;

	snprintf(buf, buflen, "/sys/devices/virtual/net/%s/bridge", name);
	return stat(buf, &info) >= 0;
}
205
/*
 * Find the bridge that interface @name is a member of.
 *
 * Globs /sys/devices/virtual/net/<any>/brif/<name>/bridge, reads the first
 * match as a symlink into @buf and returns a pointer (inside @buf) to the
 * last path component of the link target.
 *
 * Returns NULL if there is no match, the link cannot be read, or the target
 * contains no '/'.
 *
 * The glob result is always released, and one byte of @buf is reserved for
 * the terminator because readlink() does not NUL-terminate.
 */
static char *system_get_bridge(const char *name, char *buf, int buflen)
{
	char *path;
	ssize_t len = -1;
	glob_t gl;

	if (buflen < 1)
		return NULL;

	/* zeroed so globfree() is safe even if glob() bails out early */
	memset(&gl, 0, sizeof(gl));

	snprintf(buf, buflen, "/sys/devices/virtual/net/*/brif/%s/bridge", name);
	/* glob() reports errors as non-zero (positive) codes */
	if (glob(buf, GLOB_NOSORT, NULL, &gl) == 0 && gl.gl_pathc > 0)
		len = readlink(gl.gl_pathv[0], buf, buflen - 1);

	globfree(&gl);

	if (len < 0)
		return NULL;

	buf[len] = 0;
	path = strrchr(buf, '/');
	if (!path)
		return NULL;

	return path + 1;
}
230
231 static int system_if_resolve(struct device *dev)
232 {
233 struct ifreq ifr;
234 strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name));
235 if (!ioctl(sock_ioctl, SIOCGIFINDEX, &ifr))
236 return ifr.ifr_ifindex;
237 else
238 return 0;
239 }
240
241 static int system_if_flags(const char *ifname, unsigned add, unsigned rem)
242 {
243 struct ifreq ifr;
244 strncpy(ifr.ifr_name, ifname, sizeof(ifr.ifr_name));
245 ioctl(sock_ioctl, SIOCGIFFLAGS, &ifr);
246 ifr.ifr_flags |= add;
247 ifr.ifr_flags &= ~rem;
248 return ioctl(sock_ioctl, SIOCSIFFLAGS, &ifr);
249 }
250
/* Context shared between system_if_clear_entries() and cb_clear_event(). */
struct clear_data {
	/* request message; reused by cb_clear_event() to build delete requests */
	struct nl_msg *msg;

	/* device whose entries are being removed */
	struct device *dev;

	/* dump request type (RTM_GETADDR or RTM_GETROUTE) */
	int type;

	/* number of bytes of request payload appended to the dump request */
	int size;

	/* address family of the dump */
	int af;
};
258
259
/* True if the ifaddrmsg payload of @hdr refers to interface index @ifindex. */
static bool check_ifaddr(struct nlmsghdr *hdr, int ifindex)
{
	struct ifaddrmsg *payload = NLMSG_DATA(hdr);
	bool same = (payload->ifa_index == ifindex);

	return same;
}
266
267 static bool check_route(struct nlmsghdr *hdr, int ifindex)
268 {
269 struct nlattr *tb[__RTA_MAX];
270
271 nlmsg_parse(hdr, sizeof(struct rtmsg), tb, __RTA_MAX - 1, NULL);
272 if (!tb[RTA_OIF])
273 return false;
274
275 return *(int *)RTA_DATA(tb[RTA_OIF]) == ifindex;
276 }
277
278 static int cb_clear_event(struct nl_msg *msg, void *arg)
279 {
280 struct clear_data *clr = arg;
281 struct nlmsghdr *hdr = nlmsg_hdr(msg);
282 bool (*cb)(struct nlmsghdr *, int ifindex);
283 int type;
284
285 switch(clr->type) {
286 case RTM_GETADDR:
287 type = RTM_DELADDR;
288 if (hdr->nlmsg_type != RTM_NEWADDR)
289 return NL_SKIP;
290
291 cb = check_ifaddr;
292 break;
293 case RTM_GETROUTE:
294 type = RTM_DELROUTE;
295 if (hdr->nlmsg_type != RTM_NEWROUTE)
296 return NL_SKIP;
297
298 cb = check_route;
299 break;
300 default:
301 return NL_SKIP;
302 }
303
304 if (!cb(hdr, clr->dev->ifindex))
305 return NL_SKIP;
306
307 D(SYSTEM, "Remove %s from device %s\n",
308 type == RTM_DELADDR ? "an address" : "a route",
309 clr->dev->ifname);
310 memcpy(nlmsg_hdr(clr->msg), hdr, hdr->nlmsg_len);
311 hdr = nlmsg_hdr(clr->msg);
312 hdr->nlmsg_type = type;
313 hdr->nlmsg_flags = NLM_F_REQUEST;
314
315 if (!nl_send_auto_complete(sock_rtnl, clr->msg))
316 nl_wait_for_ack(sock_rtnl);
317
318 return NL_SKIP;
319 }
320
321 static int
322 cb_finish_event(struct nl_msg *msg, void *arg)
323 {
324 int *pending = arg;
325 *pending = 0;
326 return NL_STOP;
327 }
328
329 static int
330 error_handler(struct sockaddr_nl *nla, struct nlmsgerr *err, void *arg)
331 {
332 int *pending = arg;
333 *pending = err->error;
334 return NL_STOP;
335 }
336
337 static void
338 system_if_clear_entries(struct device *dev, int type, int af)
339 {
340 struct clear_data clr;
341 struct nl_cb *cb = nl_cb_alloc(NL_CB_DEFAULT);
342 struct rtmsg rtm = {
343 .rtm_family = af,
344 .rtm_flags = RTM_F_CLONED,
345 };
346 int flags = NLM_F_DUMP;
347 int pending = 1;
348
349 clr.af = af;
350 clr.dev = dev;
351 clr.type = type;
352 switch (type) {
353 case RTM_GETADDR:
354 clr.size = sizeof(struct rtgenmsg);
355 break;
356 case RTM_GETROUTE:
357 clr.size = sizeof(struct rtmsg);
358 break;
359 default:
360 return;
361 }
362
363 if (!cb)
364 return;
365
366 clr.msg = nlmsg_alloc_simple(type, flags);
367 if (!clr.msg)
368 goto out;
369
370 nlmsg_append(clr.msg, &rtm, clr.size, 0);
371 nl_cb_set(cb, NL_CB_VALID, NL_CB_CUSTOM, cb_clear_event, &clr);
372 nl_cb_set(cb, NL_CB_FINISH, NL_CB_CUSTOM, cb_finish_event, &pending);
373 nl_cb_err(cb, NL_CB_CUSTOM, error_handler, &pending);
374
375 nl_send_auto_complete(sock_rtnl, clr.msg);
376 while (pending > 0)
377 nl_recvmsgs(sock_rtnl, cb);
378
379 nlmsg_free(clr.msg);
380 out:
381 nl_cb_put(cb);
382 }
383
384 /*
385 * Clear bridge (membership) state and bring down device
386 */
387 void system_if_clear_state(struct device *dev)
388 {
389 static char buf[256];
390 char *bridge;
391
392 if (dev->external)
393 return;
394
395 dev->ifindex = system_if_resolve(dev);
396 if (!dev->ifindex)
397 return;
398
399 system_if_flags(dev->ifname, 0, IFF_UP);
400
401 if (system_is_bridge(dev->ifname, buf, sizeof(buf))) {
402 D(SYSTEM, "Delete existing bridge named '%s'\n", dev->ifname);
403 system_bridge_delbr(dev);
404 return;
405 }
406
407 bridge = system_get_bridge(dev->ifname, buf, sizeof(buf));
408 if (bridge) {
409 D(SYSTEM, "Remove device '%s' from bridge '%s'\n", dev->ifname, bridge);
410 system_bridge_if(bridge, dev, SIOCBRDELIF, NULL);
411 }
412
413 system_if_clear_entries(dev, RTM_GETROUTE, AF_INET);
414 system_if_clear_entries(dev, RTM_GETADDR, AF_INET);
415 system_if_clear_entries(dev, RTM_GETROUTE, AF_INET6);
416 system_if_clear_entries(dev, RTM_GETADDR, AF_INET6);
417 system_set_disable_ipv6(dev, "0");
418 }
419
/* Convert @val seconds to the unit passed to the bridge ioctls: val * 100. */
static inline unsigned long
sec_to_jiffies(int val)
{
	unsigned long secs = (unsigned long) val;

	return secs * 100;
}
425
426 int system_bridge_addbr(struct device *bridge, struct bridge_config *cfg)
427 {
428 unsigned long args[4] = {};
429
430 if (ioctl(sock_ioctl, SIOCBRADDBR, bridge->ifname) < 0)
431 return -1;
432
433 args[0] = BRCTL_SET_BRIDGE_STP_STATE;
434 args[1] = !!cfg->stp;
435 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
436
437 args[0] = BRCTL_SET_BRIDGE_FORWARD_DELAY;
438 args[1] = sec_to_jiffies(cfg->forward_delay);
439 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
440
441 system_set_dev_sysctl("/sys/devices/virtual/net/%s/bridge/multicast_snooping",
442 bridge->ifname, cfg->igmp_snoop ? "1" : "0");
443
444 if (cfg->flags & BRIDGE_OPT_AGEING_TIME) {
445 args[0] = BRCTL_SET_AGEING_TIME;
446 args[1] = sec_to_jiffies(cfg->ageing_time);
447 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
448 }
449
450 if (cfg->flags & BRIDGE_OPT_HELLO_TIME) {
451 args[0] = BRCTL_SET_BRIDGE_HELLO_TIME;
452 args[1] = sec_to_jiffies(cfg->hello_time);
453 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
454 }
455
456 if (cfg->flags & BRIDGE_OPT_MAX_AGE) {
457 args[0] = BRCTL_SET_BRIDGE_MAX_AGE;
458 args[1] = sec_to_jiffies(cfg->max_age);
459 system_bridge_if(bridge->ifname, NULL, SIOCDEVPRIVATE, &args);
460 }
461
462 return 0;
463 }
464
465 static int system_vlan(struct device *dev, int id)
466 {
467 struct vlan_ioctl_args ifr = {
468 .cmd = SET_VLAN_NAME_TYPE_CMD,
469 .u.name_type = VLAN_NAME_TYPE_RAW_PLUS_VID_NO_PAD,
470 };
471
472 ioctl(sock_ioctl, SIOCSIFVLAN, &ifr);
473
474 if (id < 0) {
475 ifr.cmd = DEL_VLAN_CMD;
476 ifr.u.VID = 0;
477 } else {
478 ifr.cmd = ADD_VLAN_CMD;
479 ifr.u.VID = id;
480 }
481 strncpy(ifr.device1, dev->ifname, sizeof(ifr.device1));
482 return ioctl(sock_ioctl, SIOCSIFVLAN, &ifr);
483 }
484
/* Create VLAN @id on @dev; returns the result of system_vlan(). */
int system_vlan_add(struct device *dev, int id)
{
	int rc = system_vlan(dev, id);

	return rc;
}
489
/* Delete the VLAN device @dev (system_vlan() with a negative id). */
int system_vlan_del(struct device *dev)
{
	int rc = system_vlan(dev, -1);

	return rc;
}
494
495 static void
496 system_if_apply_settings(struct device *dev)
497 {
498 struct ifreq ifr;
499
500 memset(&ifr, 0, sizeof(ifr));
501 strncpy(ifr.ifr_name, dev->ifname, sizeof(ifr.ifr_name));
502 if (dev->flags & DEV_OPT_MTU) {
503 ifr.ifr_mtu = dev->mtu;
504 ioctl(sock_ioctl, SIOCSIFMTU, &ifr);
505 }
506 if (dev->flags & DEV_OPT_TXQUEUELEN) {
507 ifr.ifr_qlen = dev->txqueuelen;
508 ioctl(sock_ioctl, SIOCSIFTXQLEN, &ifr);
509 }
510 if (dev->flags & DEV_OPT_MACADDR) {
511 memcpy(&ifr.ifr_hwaddr, dev->macaddr, sizeof(dev->macaddr));
512 ioctl(sock_ioctl, SIOCSIFHWADDR, &ifr);
513 }
514
515 dev->ifindex = system_if_resolve(dev);
516 }
517
518 int system_if_up(struct device *dev)
519 {
520 system_if_apply_settings(dev);
521 return system_if_flags(dev->ifname, IFF_UP, 0);
522 }
523
524 int system_if_down(struct device *dev)
525 {
526 return system_if_flags(dev->ifname, 0, IFF_UP);
527 }
528
/*
 * Update the device's "present" state from whether its interface name
 * resolves to an index.
 *
 * system_if_resolve() returns 0 when the lookup fails, so only a strictly
 * positive result means the interface exists.
 *
 * Always returns 0.
 */
int system_if_check(struct device *dev)
{
	device_set_present(dev, (system_if_resolve(dev) > 0));
	return 0;
}
534
535 int system_if_dump_stats(struct device *dev, struct blob_buf *b)
536 {
537 const char *const counters[] = {
538 "collisions", "rx_frame_errors", "tx_compressed",
539 "multicast", "rx_length_errors", "tx_dropped",
540 "rx_bytes", "rx_missed_errors", "tx_errors",
541 "rx_compressed", "rx_over_errors", "tx_fifo_errors",
542 "rx_crc_errors", "rx_packets", "tx_heartbeat_errors",
543 "rx_dropped", "tx_aborted_errors", "tx_packets",
544 "rx_errors", "tx_bytes", "tx_window_errors",
545 "rx_fifo_errors", "tx_carrier_errors",
546 };
547 char buf[64];
548 int stats_dir;
549 int i, fd, len;
550
551 snprintf(buf, sizeof(buf), "/sys/class/net/%s/statistics", dev->ifname);
552 stats_dir = open(buf, O_DIRECTORY);
553 if (stats_dir < 0)
554 return -1;
555
556 for (i = 0; i < ARRAY_SIZE(counters); i++) {
557 fd = openat(stats_dir, counters[i], O_RDONLY);
558 if (fd < 0)
559 continue;
560
561 retry:
562 len = read(fd, buf, sizeof(buf));
563 if (len < 0) {
564 if (errno == EINTR)
565 goto retry;
566 continue;
567 }
568
569 buf[len] = 0;
570 blobmsg_add_u32(b, counters[i], strtoul(buf, NULL, 0));
571 close(fd);
572 }
573
574 close(stats_dir);
575 return 0;
576 }
577
578 static int system_addr(struct device *dev, struct device_addr *addr, int cmd)
579 {
580 int alen = ((addr->flags & DEVADDR_FAMILY) == DEVADDR_INET4) ? 4 : 16;
581 struct ifaddrmsg ifa = {
582 .ifa_family = (alen == 4) ? AF_INET : AF_INET6,
583 .ifa_prefixlen = addr->mask,
584 .ifa_index = dev->ifindex,
585 };
586
587 struct nl_msg *msg;
588
589 dev = addr->device;
590 if (dev) {
591 if (!dev->ifindex)
592 return -1;
593
594 ifa.ifa_index = dev->ifindex;
595 }
596
597 msg = nlmsg_alloc_simple(cmd, 0);
598 if (!msg)
599 return -1;
600
601 nlmsg_append(msg, &ifa, sizeof(ifa), 0);
602 nla_put(msg, IFA_LOCAL, alen, &addr->addr);
603 return system_rtnl_call(msg);
604 }
605
606 int system_add_address(struct device *dev, struct device_addr *addr)
607 {
608 return system_addr(dev, addr, RTM_NEWADDR);
609 }
610
611 int system_del_address(struct device *dev, struct device_addr *addr)
612 {
613 return system_addr(dev, addr, RTM_DELADDR);
614 }
615
616 static int system_rt(struct device *dev, struct device_route *route, int cmd)
617 {
618 int alen = ((route->flags & DEVADDR_FAMILY) == DEVADDR_INET4) ? 4 : 16;
619 bool have_gw;
620 unsigned int flags = 0;
621 int ifindex = dev->ifindex;
622
623 if (alen == 4)
624 have_gw = !!route->nexthop.in.s_addr;
625 else
626 have_gw = route->nexthop.in6.s6_addr32[0] ||
627 route->nexthop.in6.s6_addr32[1] ||
628 route->nexthop.in6.s6_addr32[2] ||
629 route->nexthop.in6.s6_addr32[3];
630
631 unsigned char scope = (cmd == RTM_DELROUTE) ? RT_SCOPE_NOWHERE :
632 (have_gw) ? RT_SCOPE_UNIVERSE : RT_SCOPE_LINK;
633
634 struct rtmsg rtm = {
635 .rtm_family = (alen == 4) ? AF_INET : AF_INET6,
636 .rtm_dst_len = route->mask,
637 .rtm_table = RT_TABLE_MAIN,
638 .rtm_protocol = RTPROT_BOOT,
639 .rtm_scope = scope,
640 .rtm_type = (cmd == RTM_DELROUTE) ? 0: RTN_UNICAST,
641 };
642 struct nl_msg *msg;
643
644 if (cmd == RTM_NEWROUTE)
645 flags |= NLM_F_CREATE | NLM_F_REPLACE;
646
647 dev = route->device;
648 if (dev) {
649 if (!dev->ifindex)
650 return -1;
651
652 ifindex = dev->ifindex;
653 }
654
655 msg = nlmsg_alloc_simple(cmd, flags);
656 if (!msg)
657 return -1;
658
659 nlmsg_append(msg, &rtm, sizeof(rtm), 0);
660
661 if (route->mask)
662 nla_put(msg, RTA_DST, alen, &route->addr);
663
664 if (have_gw)
665 nla_put(msg, RTA_GATEWAY, alen, &route->nexthop);
666
667 if (route->flags & DEVADDR_DEVICE)
668 nla_put_u32(msg, RTA_OIF, ifindex);
669
670 return system_rtnl_call(msg);
671 }
672
673 int system_add_route(struct device *dev, struct device_route *route)
674 {
675 return system_rt(dev, route, RTM_NEWROUTE);
676 }
677
678 int system_del_route(struct device *dev, struct device_route *route)
679 {
680 return system_rt(dev, route, RTM_DELROUTE);
681 }
682
/*
 * Write "-1" to the IPv4 and IPv6 route flush files under /proc.
 * Files that cannot be opened are skipped. Always returns 0.
 */
int system_flush_routes(void)
{
	const char *names[] = {
		"/proc/sys/net/ipv4/route/flush",
		"/proc/sys/net/ipv6/route/flush"
	};
	int idx;

	for (idx = 0; idx < ARRAY_SIZE(names); idx++) {
		int handle = open(names[idx], O_WRONLY);

		if (handle >= 0) {
			write(handle, "-1", 2);
			close(handle);
		}
	}

	return 0;
}
701
702 time_t system_get_rtime(void)
703 {
704 struct timespec ts;
705 struct timeval tv;
706
707 if (syscall(__NR_clock_gettime, CLOCK_MONOTONIC, &ts) == 0)
708 return ts.tv_sec;
709
710 if (gettimeofday(&tv, NULL) == 0)
711 return tv.tv_sec;
712
713 return 0;
714 }