]> git.proxmox.com Git - mirror_iproute2.git/blobdiff - ip/ipvrf.c
Include bsd/string.h only in include/utils.h
[mirror_iproute2.git] / ip / ipvrf.c
index 8bd99d6251f26b3cbdb0b33fb64301dc9b4b7ac6..8a6b7f977b1423da8c1ee0df8379d90ba4716cc0 100644 (file)
@@ -21,6 +21,7 @@
 #include <stdlib.h>
 #include <unistd.h>
 #include <string.h>
+#include <dirent.h>
 #include <errno.h>
 #include <limits.h>
 
 
 #define CGRP_PROC_FILE  "/cgroup.procs"
 
+static struct link_filter vrf_filter;
+
 static void usage(void)
 {
-       fprintf(stderr, "Usage: ip vrf exec [NAME] cmd ...\n");
+       fprintf(stderr, "Usage: ip vrf show [NAME] ...\n");
+       fprintf(stderr, "       ip vrf exec [NAME] cmd ...\n");
        fprintf(stderr, "       ip vrf identify [PID]\n");
        fprintf(stderr, "       ip vrf pids [NAME]\n");
 
        exit(-1);
 }
 
+/*
+ * parse process based cgroup file looking for PATH/vrf/NAME where
+ * NAME is the name of the vrf the process is associated with
+ */
 static int vrf_identify(pid_t pid, char *name, size_t len)
 {
        char path[PATH_MAX];
@@ -55,14 +63,18 @@ static int vrf_identify(pid_t pid, char *name, size_t len)
        memset(name, 0, len);
 
        while (fgets(buf, sizeof(buf), fp)) {
-               vrf = strstr(buf, "::/vrf/");
+               /* want the controller-less cgroup */
+               if (strstr(buf, "::/") == NULL)
+                       continue;
+
+               vrf = strstr(buf, "/vrf/");
                if (vrf) {
-                       vrf += 7;  /* skip past "::/vrf/" */
+                       vrf += 5;  /* skip past "/vrf/" */
                        end = strchr(vrf, '\n');
                        if (end)
                                *end = '\0';
 
-                       strncpy(name, vrf, len - 1);
+                       strlcpy(name, vrf, len);
                        break;
                }
        }
@@ -97,13 +109,109 @@ static int ipvrf_identify(int argc, char **argv)
        return rc;
 }
 
-static int ipvrf_pids(int argc, char **argv)
+/* read PATH/vrf/NAME/cgroup.procs file */
+static void read_cgroup_pids(const char *base_path, char *name)
 {
        char path[PATH_MAX];
        char buf[4096];
+       FILE *fp;
+
+       if (snprintf(path, sizeof(path), "%s/vrf/%s%s",
+                    base_path, name, CGRP_PROC_FILE) >= sizeof(path))
+               return;
+
+       fp = fopen(path, "r");
+       if (!fp)
+               return; /* no cgroup file, nothing to show */
+
+       /* dump contents (pids) of cgroup.procs */
+       while (fgets(buf, sizeof(buf), fp)) {
+               char *nl, comm[32];
+
+               nl = strchr(buf, '\n');
+               if (nl)
+                       *nl = '\0';
+
+               if (get_command_name(buf, comm, sizeof(comm)))
+                       strcpy(comm, "<terminated?>");
+
+               printf("%5s  %s\n", buf, comm);
+       }
+
+       fclose(fp);
+}
+
+/* recurse path looking for PATH[/NETNS]/vrf/NAME */
+static int recurse_dir(char *base_path, char *name, const char *netns)
+{
+       char path[PATH_MAX];
+       struct dirent *de;
+       struct stat fstat;
+       int rc;
+       DIR *d;
+
+       d = opendir(base_path);
+       if (!d)
+               return -1;
+
+       while ((de = readdir(d)) != NULL) {
+               if (!strcmp(de->d_name, ".") || !strcmp(de->d_name, ".."))
+                       continue;
+
+               if (!strcmp(de->d_name, "vrf")) {
+                       const char *pdir = strrchr(base_path, '/');
+
+                       /* found a 'vrf' directory. if it is for the given
+                        * namespace then dump the cgroup pids
+                        */
+                       if (*netns == '\0' ||
+                           (pdir && !strcmp(pdir+1, netns)))
+                               read_cgroup_pids(base_path, name);
+
+                       continue;
+               }
+
+               /* is this a subdir that needs to be walked */
+               if (snprintf(path, sizeof(path), "%s/%s",
+                            base_path, de->d_name) >= sizeof(path))
+                       continue;
+
+               if (lstat(path, &fstat) < 0)
+                       continue;
+
+               if (S_ISDIR(fstat.st_mode)) {
+                       rc = recurse_dir(path, name, netns);
+                       if (rc != 0)
+                               goto out;
+               }
+       }
+
+       rc = 0;
+out:
+       closedir(d);
+
+       return rc;
+}
+
+static int ipvrf_get_netns(char *netns, int len)
+{
+       if (netns_identify_pid("self", netns, len-3)) {
+               fprintf(stderr, "Failed to get name of network namespace: %s\n",
+                       strerror(errno));
+               return -1;
+       }
+
+       if (*netns != '\0')
+               strcat(netns, "-ns");
+
+       return 0;
+}
+
+static int ipvrf_pids(int argc, char **argv)
+{
        char *mnt, *vrf;
-       int fd, rc = -1;
-       ssize_t n;
+       char netns[256];
+       int ret = -1;
 
        if (argc != 1) {
                fprintf(stderr, "Invalid arguments\n");
@@ -111,34 +219,24 @@ static int ipvrf_pids(int argc, char **argv)
        }
 
        vrf = argv[0];
+       if (!name_is_vrf(vrf)) {
+               fprintf(stderr, "Invalid VRF name\n");
+               return -1;
+       }
 
        mnt = find_cgroup2_mount();
        if (!mnt)
                return -1;
 
-       snprintf(path, sizeof(path), "%s/vrf/%s%s", mnt, vrf, CGRP_PROC_FILE);
-       free(mnt);
-       fd = open(path, O_RDONLY);
-       if (fd < 0)
-               return 0; /* no cgroup file, nothing to show */
+       if (ipvrf_get_netns(netns, sizeof(netns)) < 0)
+               goto out;
 
-       while (1) {
-               n = read(fd, buf, sizeof(buf) - 1);
-               if (n < 0) {
-                       fprintf(stderr,
-                               "Failed to read cgroups file: %s\n",
-                               strerror(errno));
-                       break;
-               } else if (n == 0) {
-                       rc = 0;
-                       break;
-               }
-               printf("%s", buf);
-       }
+       ret = recurse_dir(mnt, vrf, netns);
 
-       close(fd);
+out:
+       free(mnt);
 
-       return rc;
+       return ret;
 }
 
 /* load BPF program to set sk_bound_dev_if for sockets */
@@ -203,9 +301,59 @@ out:
        return rc;
 }
 
+/* get base path for controller-less cgroup for a process.
+ * path returned does not include /vrf/NAME if it exists
+ */
+static int vrf_path(char *vpath, size_t len)
+{
+       char path[PATH_MAX];
+       char buf[4096];
+       char *vrf;
+       FILE *fp;
+
+       snprintf(path, sizeof(path), "/proc/%d/cgroup", getpid());
+       fp = fopen(path, "r");
+       if (!fp)
+               return -1;
+
+       vpath[0] = '\0';
+
+       while (fgets(buf, sizeof(buf), fp)) {
+               char *start, *nl;
+
+               start = strstr(buf, "::/");
+               if (!start)
+                       continue;
+
+               /* advance past '::' */
+               start += 2;
+
+               nl = strchr(start, '\n');
+               if (nl)
+                       *nl = '\0';
+
+               vrf = strstr(start, "/vrf");
+               if (vrf)
+                       *vrf = '\0';
+
+               strlcpy(vpath, start, len);
+
+               /* if vrf path is just / then return nothing */
+               if (!strcmp(vpath, "/"))
+                       vpath[0] = '\0';
+
+               break;
+       }
+
+       fclose(fp);
+
+       return 0;
+}
+
 static int vrf_switch(const char *name)
 {
        char path[PATH_MAX], *mnt, pid[16];
+       char vpath[PATH_MAX], netns[256];
        int ifindex = 0;
        int rc = -1, len, fd = -1;
 
@@ -221,11 +369,37 @@ static int vrf_switch(const char *name)
        if (!mnt)
                return -1;
 
+       /* -1 on length to add '/' to the end */
+       if (ipvrf_get_netns(netns, sizeof(netns) - 1) < 0)
+               goto out;
+
+       if (vrf_path(vpath, sizeof(vpath)) < 0) {
+               fprintf(stderr, "Failed to get base cgroup path: %s\n",
+                       strerror(errno));
+               goto out;
+       }
+
+       /* if path already ends in netns then don't add it again */
+       if (*netns != '\0') {
+               char *pdir = strrchr(vpath, '/');
+
+               if (!pdir)
+                       pdir = vpath;
+               else
+                       pdir++;
+
+               if (strcmp(pdir, netns) == 0)
+                       *pdir = '\0';
+
+               strcat(netns, "/");
+       }
+
        /* path to cgroup; make sure buffer has room to cat "/cgroup.procs"
         * to the end of the path
         */
-       len = snprintf(path, sizeof(path) - sizeof(CGRP_PROC_FILE), "%s/vrf/%s",
-                      mnt, ifindex ? name : "");
+       len = snprintf(path, sizeof(path) - sizeof(CGRP_PROC_FILE),
+                      "%s%s/%svrf/%s",
+                      mnt, vpath, netns, ifindex ? name : "");
        if (len > sizeof(path) - sizeof(CGRP_PROC_FILE)) {
                fprintf(stderr, "Invalid path to cgroup2 mount\n");
                goto out;
@@ -253,13 +427,16 @@ static int vrf_switch(const char *name)
        snprintf(pid, sizeof(pid), "%d", getpid());
        if (write(fd, pid, strlen(pid)) < 0) {
                fprintf(stderr, "Failed to join cgroup\n");
-               goto out;
+               goto out2;
        }
 
        rc = 0;
+out2:
+       close(fd);
 out:
        free(mnt);
-       close(fd);
+
+       drop_cap();
 
        return rc;
 }
@@ -295,13 +472,148 @@ void vrf_reset(void)
        vrf_switch("default");
 }
 
-int do_ipvrf(int argc, char **argv)
+static int ipvrf_filter_req(struct nlmsghdr *nlh, int reqlen)
+{
+       struct rtattr *linkinfo;
+       int err;
+
+       if (vrf_filter.kind) {
+               linkinfo = addattr_nest(nlh, reqlen, IFLA_LINKINFO);
+
+               err = addattr_l(nlh, reqlen, IFLA_INFO_KIND, vrf_filter.kind,
+                               strlen(vrf_filter.kind));
+               if (err)
+                       return err;
+
+               addattr_nest_end(nlh, linkinfo);
+       }
+
+       return 0;
+}
+
+/* input arg is linkinfo */
+static __u32 vrf_table_linkinfo(struct rtattr *li[])
+{
+       struct rtattr *attr[IFLA_VRF_MAX + 1];
+
+       if (li[IFLA_INFO_DATA]) {
+               parse_rtattr_nested(attr, IFLA_VRF_MAX, li[IFLA_INFO_DATA]);
+
+               if (attr[IFLA_VRF_TABLE])
+                       return rta_getattr_u32(attr[IFLA_VRF_TABLE]);
+       }
+
+       return 0;
+}
+
+static int ipvrf_print(struct nlmsghdr *n)
 {
-       if (argc == 0) {
-               fprintf(stderr, "No command given. Try \"ip vrf help\".\n");
-               exit(-1);
+       struct ifinfomsg *ifi = NLMSG_DATA(n);
+       struct rtattr *tb[IFLA_MAX+1];
+       struct rtattr *li[IFLA_INFO_MAX+1];
+       int len = n->nlmsg_len;
+       const char *name;
+       __u32 tb_id;
+
+       len -= NLMSG_LENGTH(sizeof(*ifi));
+       if (len < 0)
+               return 0;
+
+       if (vrf_filter.ifindex && vrf_filter.ifindex != ifi->ifi_index)
+               return 0;
+
+       parse_rtattr(tb, IFLA_MAX, IFLA_RTA(ifi), len);
+
+       /* kernel does not support filter by master device */
+       if (tb[IFLA_MASTER]) {
+               int master = *(int *)RTA_DATA(tb[IFLA_MASTER]);
+
+               if (vrf_filter.master && master != vrf_filter.master)
+                       return 0;
        }
 
+       if (!tb[IFLA_IFNAME]) {
+               fprintf(stderr,
+                       "BUG: device with ifindex %d has nil ifname\n",
+                       ifi->ifi_index);
+               return 0;
+       }
+       name = rta_getattr_str(tb[IFLA_IFNAME]);
+
+       /* missing LINKINFO means not VRF. e.g., kernel does not
+        * support filtering on kind, so userspace needs to handle
+        */
+       if (!tb[IFLA_LINKINFO])
+               return 0;
+
+       parse_rtattr_nested(li, IFLA_INFO_MAX, tb[IFLA_LINKINFO]);
+
+       if (!li[IFLA_INFO_KIND])
+               return 0;
+
+       if (strcmp(RTA_DATA(li[IFLA_INFO_KIND]), "vrf"))
+               return 0;
+
+       tb_id = vrf_table_linkinfo(li);
+       if (!tb_id) {
+               fprintf(stderr,
+                       "BUG: VRF %s is missing table id\n", name);
+               return 0;
+       }
+
+       printf("%-16s %5u", name, tb_id);
+
+       printf("\n");
+       return 1;
+}
+
+static int ipvrf_show(int argc, char **argv)
+{
+       struct nlmsg_chain linfo = { NULL, NULL};
+       int rc = 0;
+
+       vrf_filter.kind = "vrf";
+
+       if (argc > 1)
+               usage();
+
+       if (argc == 1) {
+               __u32 tb_id;
+
+               tb_id = ipvrf_get_table(argv[0]);
+               if (!tb_id) {
+                       fprintf(stderr, "Invalid VRF\n");
+                       return 1;
+               }
+               printf("%s %u\n", argv[0], tb_id);
+               return 0;
+       }
+
+       if (ip_linkaddr_list(0, ipvrf_filter_req, &linfo, NULL) == 0) {
+               struct nlmsg_list *l;
+               unsigned nvrf = 0;
+               int n;
+
+               n = printf("%-16s  %5s\n", "Name", "Table");
+               printf("%.*s\n", n-1, "-----------------------");
+               for (l = linfo.head; l; l = l->next)
+                       nvrf += ipvrf_print(&l->h);
+
+               if (!nvrf)
+                       printf("No VRF has been configured\n");
+       } else
+               rc = 1;
+
+       free_nlmsg_chain(&linfo);
+
+       return rc;
+}
+
+int do_ipvrf(int argc, char **argv)
+{
+       if (argc == 0)
+               return ipvrf_show(0, NULL);
+
        if (matches(*argv, "identify") == 0)
                return ipvrf_identify(argc-1, argv+1);
 
@@ -311,6 +623,11 @@ int do_ipvrf(int argc, char **argv)
        if (matches(*argv, "exec") == 0)
                return ipvrf_exec(argc-1, argv+1);
 
+       if (matches(*argv, "show") == 0 ||
+           matches(*argv, "lst") == 0 ||
+           matches(*argv, "list") == 0)
+               return ipvrf_show(argc-1, argv+1);
+
        if (matches(*argv, "help") == 0)
                usage();