]> git.ipfire.org Git - thirdparty/systemd.git/blob - src/basic/virt.c
Merge pull request #7388 from keszybz/doc-tweak
[thirdparty/systemd.git] / src / basic / virt.c
1 /***
2 This file is part of systemd.
3
4 Copyright 2011 Lennart Poettering
5
6 systemd is free software; you can redistribute it and/or modify it
7 under the terms of the GNU Lesser General Public License as published by
8 the Free Software Foundation; either version 2.1 of the License, or
9 (at your option) any later version.
10
11 systemd is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
15
16 You should have received a copy of the GNU Lesser General Public License
17 along with systemd; If not, see <http://www.gnu.org/licenses/>.
18 ***/
19
#if defined(__i386__) || defined(__x86_64__)
#include <cpuid.h>
#endif
#include <errno.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
25
26 #include "alloc-util.h"
27 #include "dirent-util.h"
28 #include "env-util.h"
29 #include "fd-util.h"
30 #include "fileio.h"
31 #include "macro.h"
32 #include "process-util.h"
33 #include "stat-util.h"
34 #include "string-table.h"
35 #include "string-util.h"
36 #include "virt.h"
37
38 static int detect_vm_cpuid(void) {
39
40 /* CPUID is an x86 specific interface. */
41 #if defined(__i386__) || defined(__x86_64__)
42
43 static const struct {
44 const char *cpuid;
45 int id;
46 } cpuid_vendor_table[] = {
47 { "XenVMMXenVMM", VIRTUALIZATION_XEN },
48 { "KVMKVMKVM", VIRTUALIZATION_KVM },
49 { "TCGTCGTCGTCG", VIRTUALIZATION_QEMU },
50 /* http://kb.vmware.com/selfservice/microsites/search.do?language=en_US&cmd=displayKC&externalId=1009458 */
51 { "VMwareVMware", VIRTUALIZATION_VMWARE },
52 /* https://docs.microsoft.com/en-us/virtualization/hyper-v-on-windows/reference/tlfs */
53 { "Microsoft Hv", VIRTUALIZATION_MICROSOFT },
54 /* https://wiki.freebsd.org/bhyve */
55 { "bhyve bhyve ", VIRTUALIZATION_BHYVE },
56 };
57
58 uint32_t eax, ecx;
59 bool hypervisor;
60
61 /* http://lwn.net/Articles/301888/ */
62
63 #if defined (__i386__)
64 #define REG_a "eax"
65 #define REG_b "ebx"
66 #elif defined (__amd64__)
67 #define REG_a "rax"
68 #define REG_b "rbx"
69 #endif
70
71 /* First detect whether there is a hypervisor */
72 eax = 1;
73 __asm__ __volatile__ (
74 /* ebx/rbx is being used for PIC! */
75 " push %%"REG_b" \n\t"
76 " cpuid \n\t"
77 " pop %%"REG_b" \n\t"
78
79 : "=a" (eax), "=c" (ecx)
80 : "0" (eax)
81 );
82
83 hypervisor = !!(ecx & 0x80000000U);
84
85 if (hypervisor) {
86 union {
87 uint32_t sig32[3];
88 char text[13];
89 } sig = {};
90 unsigned j;
91
92 /* There is a hypervisor, see what it is */
93 eax = 0x40000000U;
94 __asm__ __volatile__ (
95 /* ebx/rbx is being used for PIC! */
96 " push %%"REG_b" \n\t"
97 " cpuid \n\t"
98 " mov %%ebx, %1 \n\t"
99 " pop %%"REG_b" \n\t"
100
101 : "=a" (eax), "=r" (sig.sig32[0]), "=c" (sig.sig32[1]), "=d" (sig.sig32[2])
102 : "0" (eax)
103 );
104
105 log_debug("Virtualization found, CPUID=%s", sig.text);
106
107 for (j = 0; j < ELEMENTSOF(cpuid_vendor_table); j ++)
108 if (streq(sig.text, cpuid_vendor_table[j].cpuid))
109 return cpuid_vendor_table[j].id;
110
111 return VIRTUALIZATION_VM_OTHER;
112 }
113 #endif
114 log_debug("No virtualization found in CPUID");
115
116 return VIRTUALIZATION_NONE;
117 }
118
119 static int detect_vm_device_tree(void) {
120 #if defined(__arm__) || defined(__aarch64__) || defined(__powerpc__) || defined(__powerpc64__)
121 _cleanup_free_ char *hvtype = NULL;
122 int r;
123
124 r = read_one_line_file("/proc/device-tree/hypervisor/compatible", &hvtype);
125 if (r == -ENOENT) {
126 _cleanup_closedir_ DIR *dir = NULL;
127 struct dirent *dent;
128
129 dir = opendir("/proc/device-tree");
130 if (!dir) {
131 if (errno == ENOENT) {
132 log_debug_errno(errno, "/proc/device-tree: %m");
133 return VIRTUALIZATION_NONE;
134 }
135 return -errno;
136 }
137
138 FOREACH_DIRENT(dent, dir, return -errno)
139 if (strstr(dent->d_name, "fw-cfg")) {
140 log_debug("Virtualization QEMU: \"fw-cfg\" present in /proc/device-tree/%s", dent->d_name);
141 return VIRTUALIZATION_QEMU;
142 }
143
144 log_debug("No virtualization found in /proc/device-tree/*");
145 return VIRTUALIZATION_NONE;
146 } else if (r < 0)
147 return r;
148
149 log_debug("Virtualization %s found in /proc/device-tree/hypervisor/compatible", hvtype);
150 if (streq(hvtype, "linux,kvm"))
151 return VIRTUALIZATION_KVM;
152 else if (strstr(hvtype, "xen"))
153 return VIRTUALIZATION_XEN;
154 else
155 return VIRTUALIZATION_VM_OTHER;
156 #else
157 log_debug("This platform does not support /proc/device-tree");
158 return VIRTUALIZATION_NONE;
159 #endif
160 }
161
162 static int detect_vm_dmi(void) {
163 #if defined(__i386__) || defined(__x86_64__) || defined(__arm__) || defined(__aarch64__)
164
165 static const char *const dmi_vendors[] = {
166 "/sys/class/dmi/id/product_name", /* Test this before sys_vendor to detect KVM over QEMU */
167 "/sys/class/dmi/id/sys_vendor",
168 "/sys/class/dmi/id/board_vendor",
169 "/sys/class/dmi/id/bios_vendor"
170 };
171
172 static const struct {
173 const char *vendor;
174 int id;
175 } dmi_vendor_table[] = {
176 { "KVM", VIRTUALIZATION_KVM },
177 { "QEMU", VIRTUALIZATION_QEMU },
178 /* http://kb.vmware.com/selfservice/microsites/search.do?language=en_US&cmd=displayKC&externalId=1009458 */
179 { "VMware", VIRTUALIZATION_VMWARE },
180 { "VMW", VIRTUALIZATION_VMWARE },
181 { "innotek GmbH", VIRTUALIZATION_ORACLE },
182 { "Xen", VIRTUALIZATION_XEN },
183 { "Bochs", VIRTUALIZATION_BOCHS },
184 { "Parallels", VIRTUALIZATION_PARALLELS },
185 /* https://wiki.freebsd.org/bhyve */
186 { "BHYVE", VIRTUALIZATION_BHYVE },
187 };
188 unsigned i;
189 int r;
190
191 for (i = 0; i < ELEMENTSOF(dmi_vendors); i++) {
192 _cleanup_free_ char *s = NULL;
193 unsigned j;
194
195 r = read_one_line_file(dmi_vendors[i], &s);
196 if (r < 0) {
197 if (r == -ENOENT)
198 continue;
199
200 return r;
201 }
202
203
204
205 for (j = 0; j < ELEMENTSOF(dmi_vendor_table); j++)
206 if (startswith(s, dmi_vendor_table[j].vendor)) {
207 log_debug("Virtualization %s found in DMI (%s)", s, dmi_vendors[i]);
208 return dmi_vendor_table[j].id;
209 }
210 }
211 #endif
212
213 log_debug("No virtualization found in DMI");
214
215 return VIRTUALIZATION_NONE;
216 }
217
218 static int detect_vm_xen(void) {
219
220 /* Check for Dom0 will be executed later in detect_vm_xen_dom0
221 Thats why we dont check the content of /proc/xen/capabilities here. */
222 if (access("/proc/xen/capabilities", F_OK) < 0) {
223 log_debug("Virtualization XEN not found, /proc/xen/capabilities does not exist");
224 return VIRTUALIZATION_NONE;
225 }
226
227 log_debug("Virtualization XEN found (/proc/xen/capabilities exists)");
228 return VIRTUALIZATION_XEN;
229 }
230
231 static bool detect_vm_xen_dom0(void) {
232 _cleanup_free_ char *domcap = NULL;
233 char *cap, *i;
234 int r;
235
236 r = read_one_line_file("/proc/xen/capabilities", &domcap);
237 if (r == -ENOENT) {
238 log_debug("Virtualization XEN not found, /proc/xen/capabilities does not exist");
239 return false;
240 }
241 if (r < 0)
242 return r;
243
244 i = domcap;
245 while ((cap = strsep(&i, ",")))
246 if (streq(cap, "control_d"))
247 break;
248 if (!cap) {
249 log_debug("Virtualization XEN DomU found (/proc/xen/capabilites)");
250 return false;
251 }
252
253 log_debug("Virtualization XEN Dom0 ignored (/proc/xen/capabilities)");
254 return true;
255 }
256
257 static int detect_vm_hypervisor(void) {
258 _cleanup_free_ char *hvtype = NULL;
259 int r;
260
261 r = read_one_line_file("/sys/hypervisor/type", &hvtype);
262 if (r == -ENOENT)
263 return VIRTUALIZATION_NONE;
264 if (r < 0)
265 return r;
266
267 log_debug("Virtualization %s found in /sys/hypervisor/type", hvtype);
268
269 if (streq(hvtype, "xen"))
270 return VIRTUALIZATION_XEN;
271 else
272 return VIRTUALIZATION_VM_OTHER;
273 }
274
275 static int detect_vm_uml(void) {
276 _cleanup_free_ char *cpuinfo_contents = NULL;
277 int r;
278
279 /* Detect User-Mode Linux by reading /proc/cpuinfo */
280 r = read_full_file("/proc/cpuinfo", &cpuinfo_contents, NULL);
281 if (r < 0)
282 return r;
283
284 if (strstr(cpuinfo_contents, "\nvendor_id\t: User Mode Linux\n")) {
285 log_debug("UML virtualization found in /proc/cpuinfo");
286 return VIRTUALIZATION_UML;
287 }
288
289 log_debug("No virtualization found in /proc/cpuinfo.");
290 return VIRTUALIZATION_NONE;
291 }
292
293 static int detect_vm_zvm(void) {
294
295 #if defined(__s390__)
296 _cleanup_free_ char *t = NULL;
297 int r;
298
299 r = get_proc_field("/proc/sysinfo", "VM00 Control Program", WHITESPACE, &t);
300 if (r == -ENOENT)
301 return VIRTUALIZATION_NONE;
302 if (r < 0)
303 return r;
304
305 log_debug("Virtualization %s found in /proc/sysinfo", t);
306 if (streq(t, "z/VM"))
307 return VIRTUALIZATION_ZVM;
308 else
309 return VIRTUALIZATION_KVM;
310 #else
311 log_debug("This platform does not support /proc/sysinfo");
312 return VIRTUALIZATION_NONE;
313 #endif
314 }
315
316 /* Returns a short identifier for the various VM implementations */
317 int detect_vm(void) {
318 static thread_local int cached_found = _VIRTUALIZATION_INVALID;
319 int r, dmi;
320 bool other = false;
321
322 if (cached_found >= 0)
323 return cached_found;
324
325 /* We have to use the correct order here:
326 *
327 * -> First try to detect Oracle Virtualbox, even if it uses KVM.
328 * -> Second try to detect from cpuid, this will report KVM for
329 * whatever software is used even if info in dmi is overwritten.
330 * -> Third try to detect from dmi. */
331
332 dmi = detect_vm_dmi();
333 if (dmi == VIRTUALIZATION_ORACLE) {
334 r = dmi;
335 goto finish;
336 }
337
338 r = detect_vm_cpuid();
339 if (r < 0)
340 return r;
341 if (r != VIRTUALIZATION_NONE) {
342 if (r == VIRTUALIZATION_VM_OTHER)
343 other = true;
344 else
345 goto finish;
346 }
347
348 r = dmi;
349 if (r < 0)
350 return r;
351 if (r != VIRTUALIZATION_NONE) {
352 if (r == VIRTUALIZATION_VM_OTHER)
353 other = true;
354 else
355 goto finish;
356 }
357
358 /* x86 xen will most likely be detected by cpuid. If not (most likely
359 * because we're not an x86 guest), then we should try the xen capabilities
360 * file next. If that's not found, then we check for the high-level
361 * hypervisor sysfs file:
362 *
363 * https://bugs.freedesktop.org/show_bug.cgi?id=77271 */
364
365 r = detect_vm_xen();
366 if (r < 0)
367 return r;
368 if (r != VIRTUALIZATION_NONE) {
369 if (r == VIRTUALIZATION_VM_OTHER)
370 other = true;
371 else
372 goto finish;
373 }
374
375 r = detect_vm_hypervisor();
376 if (r < 0)
377 return r;
378 if (r != VIRTUALIZATION_NONE) {
379 if (r == VIRTUALIZATION_VM_OTHER)
380 other = true;
381 else
382 goto finish;
383 }
384
385 r = detect_vm_device_tree();
386 if (r < 0)
387 return r;
388 if (r != VIRTUALIZATION_NONE) {
389 if (r == VIRTUALIZATION_VM_OTHER)
390 other = true;
391 else
392 goto finish;
393 }
394
395 r = detect_vm_uml();
396 if (r < 0)
397 return r;
398 if (r != VIRTUALIZATION_NONE) {
399 if (r == VIRTUALIZATION_VM_OTHER)
400 other = true;
401 else
402 goto finish;
403 }
404
405 r = detect_vm_zvm();
406 if (r < 0)
407 return r;
408
409 finish:
410 /* x86 xen Dom0 is detected as XEN in hypervisor and maybe others.
411 * In order to detect the Dom0 as not virtualization we need to
412 * double-check it */
413 if (r == VIRTUALIZATION_XEN && detect_vm_xen_dom0())
414 r = VIRTUALIZATION_NONE;
415 else if (r == VIRTUALIZATION_NONE && other)
416 r = VIRTUALIZATION_VM_OTHER;
417
418 cached_found = r;
419 log_debug("Found VM virtualization %s", virtualization_to_string(r));
420 return r;
421 }
422
423 int detect_container(void) {
424
425 static const struct {
426 const char *value;
427 int id;
428 } value_table[] = {
429 { "lxc", VIRTUALIZATION_LXC },
430 { "lxc-libvirt", VIRTUALIZATION_LXC_LIBVIRT },
431 { "systemd-nspawn", VIRTUALIZATION_SYSTEMD_NSPAWN },
432 { "docker", VIRTUALIZATION_DOCKER },
433 { "rkt", VIRTUALIZATION_RKT },
434 };
435
436 static thread_local int cached_found = _VIRTUALIZATION_INVALID;
437 _cleanup_free_ char *m = NULL;
438 const char *e = NULL;
439 unsigned j;
440 int r;
441
442 if (cached_found >= 0)
443 return cached_found;
444
445 /* /proc/vz exists in container and outside of the container, /proc/bc only outside of the container. */
446 if (access("/proc/vz", F_OK) >= 0 &&
447 access("/proc/bc", F_OK) < 0) {
448 r = VIRTUALIZATION_OPENVZ;
449 goto finish;
450 }
451
452 if (getpid_cached() == 1) {
453 /* If we are PID 1 we can just check our own environment variable, and that's authoritative. */
454
455 e = getenv("container");
456 if (isempty(e)) {
457 r = VIRTUALIZATION_NONE;
458 goto finish;
459 }
460
461 goto translate_name;
462 }
463
464 /* Otherwise, PID 1 might have dropped this information into a file in /run. This is better than accessing
465 * /proc/1/environ, since we don't need CAP_SYS_PTRACE for that. */
466 r = read_one_line_file("/run/systemd/container", &m);
467 if (r >= 0) {
468 e = m;
469 goto translate_name;
470 }
471 if (r != -ENOENT)
472 return log_debug_errno(r, "Failed to read /run/systemd/container: %m");
473
474 /* Fallback for cases where PID 1 was not systemd (for example, cases where init=/bin/sh is used. */
475 r = getenv_for_pid(1, "container", &m);
476 if (r > 0) {
477 e = m;
478 goto translate_name;
479 }
480 if (r < 0) /* This only works if we have CAP_SYS_PTRACE, hence let's better ignore failures here */
481 log_debug_errno(r, "Failed to read $container of PID 1, ignoring: %m");
482
483 /* Interestingly /proc/1/sched actually shows the host's PID for what we see as PID 1. Hence, if the PID shown
484 * there is not 1, we know we are in a PID namespace. and hence a container. */
485 r = read_one_line_file("/proc/1/sched", &m);
486 if (r >= 0) {
487 const char *t;
488
489 t = strrchr(m, '(');
490 if (!t)
491 return -EIO;
492
493 if (!startswith(t, "(1,")) {
494 r = VIRTUALIZATION_CONTAINER_OTHER;
495 goto finish;
496 }
497 } else if (r != -ENOENT)
498 return r;
499
500 /* If that didn't work, give up, assume no container manager. */
501 r = VIRTUALIZATION_NONE;
502 goto finish;
503
504 translate_name:
505 for (j = 0; j < ELEMENTSOF(value_table); j++)
506 if (streq(e, value_table[j].value)) {
507 r = value_table[j].id;
508 goto finish;
509 }
510
511 r = VIRTUALIZATION_CONTAINER_OTHER;
512
513 finish:
514 log_debug("Found container virtualization %s.", virtualization_to_string(r));
515 cached_found = r;
516 return r;
517 }
518
/* Detects container virtualization first and VM virtualization second.
 *
 * Whatever detect_container() returns is passed on unless it is 0, in which case the result of
 * detect_vm() is returned instead. */
int detect_virtualization(void) {
        int container;

        container = detect_container();
        if (container != 0)
                return container;

        return detect_vm();
}
528
529 static int userns_has_mapping(const char *name) {
530 _cleanup_fclose_ FILE *f = NULL;
531 _cleanup_free_ char *buf = NULL;
532 size_t n_allocated = 0;
533 ssize_t n;
534 uint32_t a, b, c;
535 int r;
536
537 f = fopen(name, "re");
538 if (!f) {
539 log_debug_errno(errno, "Failed to open %s: %m", name);
540 return errno == ENOENT ? false : -errno;
541 }
542
543 n = getline(&buf, &n_allocated, f);
544 if (n < 0) {
545 if (feof(f)) {
546 log_debug("%s is empty, we're in an uninitialized user namespace", name);
547 return true;
548 }
549
550 return log_debug_errno(errno, "Failed to read %s: %m", name);
551 }
552
553 r = sscanf(buf, "%"PRIu32" %"PRIu32" %"PRIu32, &a, &b, &c);
554 if (r < 3)
555 return log_debug_errno(errno, "Failed to parse %s: %m", name);
556
557 if (a == 0 && b == 0 && c == UINT32_MAX) {
558 /* The kernel calls mappings_overlap() and does not allow overlaps */
559 log_debug("%s has a full 1:1 mapping", name);
560 return false;
561 }
562
563 /* Anything else implies that we are in a user namespace */
564 log_debug("Mapping found in %s, we're in a user namespace", name);
565 return true;
566 }
567
568 int running_in_userns(void) {
569 _cleanup_free_ char *line = NULL;
570 int r;
571
572 r = userns_has_mapping("/proc/self/uid_map");
573 if (r != 0)
574 return r;
575
576 r = userns_has_mapping("/proc/self/gid_map");
577 if (r != 0)
578 return r;
579
580 /* "setgroups" file was added in kernel v3.18-rc6-15-g9cc46516dd. It is also
581 * possible to compile a kernel without CONFIG_USER_NS, in which case "setgroups"
582 * also does not exist. We cannot distinguish those two cases, so assume that
583 * we're running on a stripped-down recent kernel, rather than on an old one,
584 * and if the file is not found, return false.
585 */
586 r = read_one_line_file("/proc/self/setgroups", &line);
587 if (r < 0) {
588 log_debug_errno(r, "/proc/self/setgroups: %m");
589 return r == -ENOENT ? false : r;
590 }
591
592 truncate_nl(line);
593 r = streq(line, "deny");
594 /* See user_namespaces(7) for a description of this "setgroups" contents. */
595 log_debug("/proc/self/setgroups contains \"%s\", %s user namespace", line, r ? "in" : "not in");
596 return r;
597 }
598
/* Checks whether we are running in a chroot() environment, by comparing our root directory with
 * the root directory of PID 1.
 *
 * Returns > 0 if the two differ, 0 if they are the same or if $SYSTEMD_IGNORE_CHROOT is set to
 * true, and a negative errno-style error if the comparison fails. */
int running_in_chroot(void) {
        int same;

        if (getenv_bool("SYSTEMD_IGNORE_CHROOT") > 0)
                return 0;

        same = files_same("/proc/1/root", "/", 0);
        if (same < 0)
                return same;

        return !same;
}
611
612 static const char *const virtualization_table[_VIRTUALIZATION_MAX] = {
613 [VIRTUALIZATION_NONE] = "none",
614 [VIRTUALIZATION_KVM] = "kvm",
615 [VIRTUALIZATION_QEMU] = "qemu",
616 [VIRTUALIZATION_BOCHS] = "bochs",
617 [VIRTUALIZATION_XEN] = "xen",
618 [VIRTUALIZATION_UML] = "uml",
619 [VIRTUALIZATION_VMWARE] = "vmware",
620 [VIRTUALIZATION_ORACLE] = "oracle",
621 [VIRTUALIZATION_MICROSOFT] = "microsoft",
622 [VIRTUALIZATION_ZVM] = "zvm",
623 [VIRTUALIZATION_PARALLELS] = "parallels",
624 [VIRTUALIZATION_BHYVE] = "bhyve",
625 [VIRTUALIZATION_VM_OTHER] = "vm-other",
626
627 [VIRTUALIZATION_SYSTEMD_NSPAWN] = "systemd-nspawn",
628 [VIRTUALIZATION_LXC_LIBVIRT] = "lxc-libvirt",
629 [VIRTUALIZATION_LXC] = "lxc",
630 [VIRTUALIZATION_OPENVZ] = "openvz",
631 [VIRTUALIZATION_DOCKER] = "docker",
632 [VIRTUALIZATION_RKT] = "rkt",
633 [VIRTUALIZATION_CONTAINER_OTHER] = "container-other",
634 };
635
636 DEFINE_STRING_TABLE_LOOKUP(virtualization, int);