src/basic/namespace-util.c

   1 /* SPDX-License-Identifier: LGPL-2.1-or-later */
   2
   3 #include <fcntl.h>
   4 #include <sys/ioctl.h>
   5 #include <sys/mount.h>
   6
   7 #include "fd-util.h"
   8 #include "missing_fs.h"
   9 #include "missing_magic.h"
  10 #include "namespace-util.h"
  11 #include "process-util.h"
  12 #include "stat-util.h"
  13 #include "user-util.h"
  14
  15 int namespace_open(pid_t pid, int *pidns_fd, int *mntns_fd, int *netns_fd, int *userns_fd, int *root_fd) {
  16         _cleanup_close_ int pidnsfd = -1, mntnsfd = -1, netnsfd = -1, usernsfd = -1;
  17         int rfd = -1;
  18
  19         assert(pid >= 0);
  20
  21         if (mntns_fd) {
  22                 const char *mntns;
  23
  24                 mntns = procfs_file_alloca(pid, "ns/mnt");
  25                 mntnsfd = open(mntns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
  26                 if (mntnsfd < 0)
  27                         return -errno;
  28         }
  29
  30         if (pidns_fd) {
  31                 const char *pidns;
  32
  33                 pidns = procfs_file_alloca(pid, "ns/pid");
  34                 pidnsfd = open(pidns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
  35                 if (pidnsfd < 0)
  36                         return -errno;
  37         }
  38
  39         if (netns_fd) {
  40                 const char *netns;
  41
  42                 netns = procfs_file_alloca(pid, "ns/net");
  43                 netnsfd = open(netns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
  44                 if (netnsfd < 0)
  45                         return -errno;
  46         }
  47
  48         if (userns_fd) {
  49                 const char *userns;
  50
  51                 userns = procfs_file_alloca(pid, "ns/user");
  52                 usernsfd = open(userns, O_RDONLY|O_NOCTTY|O_CLOEXEC);
  53                 if (usernsfd < 0 && errno != ENOENT)
  54                         return -errno;
  55         }
  56
  57         if (root_fd) {
  58                 const char *root;
  59
  60                 root = procfs_file_alloca(pid, "root");
  61                 rfd = open(root, O_RDONLY|O_NOCTTY|O_CLOEXEC|O_DIRECTORY);
  62                 if (rfd < 0)
  63                         return -errno;
  64         }
  65
  66         if (pidns_fd)
  67                 *pidns_fd = TAKE_FD(pidnsfd);
  68
  69         if (mntns_fd)
  70                 *mntns_fd = TAKE_FD(mntnsfd);
  71
  72         if (netns_fd)
  73                 *netns_fd = TAKE_FD(netnsfd);
  74
  75         if (userns_fd)
  76                 *userns_fd = TAKE_FD(usernsfd);
  77
  78         if (root_fd)
  79                 *root_fd = TAKE_FD(rfd);
  80
  81         return 0;
  82 }
  83
  84 int namespace_enter(int pidns_fd, int mntns_fd, int netns_fd, int userns_fd, int root_fd) {
  85         if (userns_fd >= 0) {
  86                 /* Can't setns to your own userns, since then you could
  87                  * escalate from non-root to root in your own namespace, so
  88                  * check if namespaces equal before attempting to enter. */
  89                 _cleanup_free_ char *userns_fd_path = NULL;
  90                 int r;
  91                 if (asprintf(&userns_fd_path, "/proc/self/fd/%d", userns_fd) < 0)
  92                         return -ENOMEM;
  93
  94                 r = files_same(userns_fd_path, "/proc/self/ns/user", 0);
  95                 if (r < 0)
  96                         return r;
  97                 if (r)
  98                         userns_fd = -1;
  99         }
 100
 101         if (pidns_fd >= 0)
 102                 if (setns(pidns_fd, CLONE_NEWPID) < 0)
 103                         return -errno;
 104
 105         if (mntns_fd >= 0)
 106                 if (setns(mntns_fd, CLONE_NEWNS) < 0)
 107                         return -errno;
 108
 109         if (netns_fd >= 0)
 110                 if (setns(netns_fd, CLONE_NEWNET) < 0)
 111                         return -errno;
 112
 113         if (userns_fd >= 0)
 114                 if (setns(userns_fd, CLONE_NEWUSER) < 0)
 115                         return -errno;
 116
 117         if (root_fd >= 0) {
 118                 if (fchdir(root_fd) < 0)
 119                         return -errno;
 120
 121                 if (chroot(".") < 0)
 122                         return -errno;
 123         }
 124
 125         return reset_uid_gid();
 126 }
 127
 128 int fd_is_network_ns(int fd) {
 129         struct statfs s;
 130         int r;
 131
 132         /* Checks whether the specified file descriptor refers to a network namespace. On old kernels there's no nice
 133          * way to detect that, hence on those we'll return a recognizable error (EUCLEAN), so that callers can handle
 134          * this somewhat nicely.
 135          *
 136          * This function returns > 0 if the fd definitely refers to a network namespace, 0 if it definitely does not
 137          * refer to a network namespace, -EUCLEAN if we can't determine, and other negative error codes on error. */
 138
 139         if (fstatfs(fd, &s) < 0)
 140                 return -errno;
 141
 142         if (!is_fs_type(&s, NSFS_MAGIC)) {
 143                 /* On really old kernels, there was no "nsfs", and network namespace sockets belonged to procfs
 144                  * instead. Handle that in a somewhat smart way. */
 145
 146                 if (is_fs_type(&s, PROC_SUPER_MAGIC)) {
 147                         struct statfs t;
 148
 149                         /* OK, so it is procfs. Let's see if our own network namespace is procfs, too. If so, then the
 150                          * passed fd might refer to a network namespace, but we can't know for sure. In that case,
 151                          * return a recognizable error. */
 152
 153                         if (statfs("/proc/self/ns/net", &t) < 0)
 154                                 return -errno;
 155
 156                         if (s.f_type == t.f_type)
 157                                 return -EUCLEAN; /* It's possible, we simply don't know */
 158                 }
 159
 160                 return 0; /* No! */
 161         }
 162
 163         r = ioctl(fd, NS_GET_NSTYPE);
 164         if (r < 0) {
 165                 if (errno == ENOTTY) /* Old kernels didn't know this ioctl, let's also return a recognizable error in that case */
 166                         return -EUCLEAN;
 167
 168                 return -errno;
 169         }
 170
 171         return r == CLONE_NEWNET;
 172 }
 173
 174 int detach_mount_namespace(void) {
 175
 176         /* Detaches the mount namespace, disabling propagation from our namespace to the host */
 177
 178         if (unshare(CLONE_NEWNS) < 0)
 179                 return -errno;
 180
 181         if (mount(NULL, "/", NULL, MS_SLAVE | MS_REC, NULL) < 0)
 182                 return -errno;
 183
 184         return 0;
 185 }