]> git.ipfire.org Git - thirdparty/man-pages.git/blame - man2/unshare.2
sched_setattr.2: tfix
[thirdparty/man-pages.git] / man2 / unshare.2
CommitLineData
f50f6cb5 1.\" Copyright (C) 2006, Janak Desai <janak@us.ibm.com>
f919b6e4 2.\" and Copyright (C) 2006, 2012 Michael Kerrisk <mtk.manpages@gmail.com>
2297bf0e 3.\"
b55e2bb3 4.\" %%%LICENSE_START(GPL_NOVERSION_ONELINE)
5cc01e9c 5.\" Licensed under the GPL
b55e2bb3 6.\" %%%LICENSE_END
5cc01e9c 7.\"
d44c4bf3 8.\" Patch Justification:
c13182ef
MK
9.\" unshare system call is needed to implement, using PAM,
10.\" per-security_context and/or per-user namespace to provide
11.\" polyinstantiated directories. Using unshare and bind mounts, a
12.\" PAM module can create private namespace with appropriate
13.\" directories (based on user's security context) bind mounted on
14.\" public directories such as /tmp, thus providing an instance of
15.\" /tmp that is based on user's security context. Without the
16.\" unshare system call, namespace separation can only be achieved
17.\" by clone, which would require porting and maintaining all commands
18.\" such as login, and su, that establish a user session.
d44c4bf3 19.\"
e8426ca2 20.TH UNSHARE 2 2020-04-11 "Linux" "Linux Programmer's Manual"
5cc01e9c
MK
21.SH NAME
22unshare \- disassociate parts of the process execution context
23.SH SYNOPSIS
24.nf
4f71ba5d 25.B #define _GNU_SOURCE
5cc01e9c 26.B #include <sched.h>
68e4db0a 27.PP
5cc01e9c
MK
28.BI "int unshare(int " flags );
29.fi
30.SH DESCRIPTION
c13182ef 31.BR unshare ()
15784e0a 32allows a process (or thread) to disassociate parts of its execution
f0d0f68d 33context that are currently being shared with other processes (or threads).
732e54dd 34Part of the execution context, such as the mount namespace, is shared
c13182ef 35implicitly when a new process is created using
5cc01e9c
MK
36.BR fork (2)
37or
c13182ef 38.BR vfork (2),
5cc01e9c 39while other parts, such as virtual memory, may be
15784e0a 40shared by explicit request when creating a process or thread using
5cc01e9c 41.BR clone (2).
efeece04 42.PP
c13182ef 43The main use of
5cc01e9c
MK
44.BR unshare ()
45is to allow a process to control its
46shared execution context without creating a new process.
efeece04 47.PP
c13182ef
MK
48The
49.I flags
50argument is a bit mask that specifies which parts of
51the execution context should be unshared.
5cc01e9c
MK
52This argument is specified by ORing together zero or more
53of the following constants:
54.TP
55.B CLONE_FILES
56Reverse the effect of the
57.BR clone (2)
58.B CLONE_FILES
59flag.
c13182ef 60Unshare the file descriptor table, so that the calling process
5cc01e9c
MK
61no longer shares its file descriptors with any other process.
62.TP
63.B CLONE_FS
64Reverse the effect of the
65.BR clone (2)
c13182ef 66.B CLONE_FS
5cc01e9c 67flag.
9ee4a2b6 68Unshare filesystem attributes, so that the calling process
f7b8bdbe
MK
69no longer shares its root directory
70.RB ( chroot (2)),
71current directory
72.RB ( chdir (2)),
73or umask
74.RB ( umask (2))
75attributes with any other process.
5cc01e9c 76.TP
216131bd
MK
77.BR CLONE_NEWCGROUP " (since Linux 4.6)"
78This flag has the same effect as the
79.BR clone (2)
80.B CLONE_NEWCGROUP
81flag.
82Unshare the cgroup namespace.
83Use of
84.BR CLONE_NEWCGROUP
85requires the
86.BR CAP_SYS_ADMIN
87capability.
88.TP
6881dc47 89.BR CLONE_NEWIPC " (since Linux 2.6.19)"
25539b1b
MK
90This flag has the same effect as the
91.BR clone (2)
92.B CLONE_NEWIPC
93flag.
1024e8ff 94Unshare the IPC namespace,
25539b1b 95so that the calling process has a private copy of the
1024e8ff 96IPC namespace which is not shared with any other process.
25539b1b
MK
97Specifying this flag automatically implies
98.BR CLONE_SYSVSEM
99as well.
100Use of
101.BR CLONE_NEWIPC
102requires the
103.BR CAP_SYS_ADMIN
104capability.
105.TP
6881dc47 106.BR CLONE_NEWNET " (since Linux 2.6.24)"
b3bc5386
MK
107This flag has the same effect as the
108.BR clone (2)
109.B CLONE_NEWNET
110flag.
111Unshare the network namespace,
61f22790
LAG
112so that the calling process is moved into a
113new network namespace which is not shared
114with any previously existing process.
6f2b4a65 115Use of
b3bc5386
MK
116.BR CLONE_NEWNET
117requires the
118.BR CAP_SYS_ADMIN
119capability.
120.TP
5cc01e9c
MK
121.B CLONE_NEWNS
122.\" These flag names are inconsistent:
c13182ef 123.\" CLONE_NEWNS does the same thing in clone(), but CLONE_VM,
5cc01e9c
MK
124.\" CLONE_FS, and CLONE_FILES reverse the action of the clone()
125.\" flags of the same name.
c8e4c1bd 126This flag has the same effect as the
5cc01e9c
MK
127.BR clone (2)
128.B CLONE_NEWNS
129flag.
732e54dd 130Unshare the mount namespace,
4df2eb09 131so that the calling process has a private copy of
5cc01e9c
MK
132its namespace which is not shared with any other process.
133Specifying this flag automatically implies
134.B CLONE_FS
135as well.
486d4e9b
MK
136Use of
137.BR CLONE_NEWNS
138requires the
139.BR CAP_SYS_ADMIN
140capability.
e203673a
MK
141For further information, see
142.BR mount_namespaces (7).
a948ae52 143.TP
8f141c5e
MK
144.BR CLONE_NEWPID " (since Linux 3.8)"
145This flag has the same effect as the
146.BR clone (2)
147.B CLONE_NEWPID
148flag.
149Unshare the PID namespace,
37ee2d61 150so that the calling process has a new PID namespace for its children
8f141c5e 151which is not shared with any previously existing process.
2193656a
MK
152The calling process is
153.I not
154moved into the new namespace.
155The first child created by the calling process will have
156the process ID 1 and will assume the role of
157.BR init (1)
158in the new namespace.
3c881e7c
MK
159.BR CLONE_NEWPID
160automatically implies
161.BR CLONE_THREAD
162as well.
8f141c5e
MK
163Use of
164.BR CLONE_NEWPID
165requires the
166.BR CAP_SYS_ADMIN
167capability.
5c8d010b
MK
168For further information, see
169.BR pid_namespaces (7).
8f141c5e 170.TP
e5a5efc8
MK
171.BR CLONE_NEWTIME " (since Linux 5.6)"
172Unshare the time namespace,
173so that the calling process has a new time namespace for its children
174which is not shared with any previously existing process.
175The calling process is
176.I not
177moved into the new namespace.
178Use of
179.BR CLONE_NEWTIME
180requires the
181.BR CAP_SYS_ADMIN
182capability.
183For further information, see
184.BR time_namespaces (7).
185.TP
c2cd5a7f
MK
186.BR CLONE_NEWUSER " (since Linux 3.8)"
187This flag has the same effect as the
188.BR clone (2)
189.B CLONE_NEWUSER
190flag.
191Unshare the user namespace,
192so that the calling process is moved into a new user namespace
193which is not shared with any previously existing process.
5afd65d1 194As with the child process created by
36ec1f75
MK
195.BR clone (2)
196with the
197.B CLONE_NEWUSER
198flag, the caller obtains a full set of capabilities in the new namespace.
88f48716
MK
199.IP
200.BR CLONE_NEWUSER
201requires that the calling process is not threaded; specifying
202.BR CLONE_NEWUSER
203automatically implies
4c3d7431 204.BR CLONE_THREAD .
6bab36f8 205Since Linux 3.9,
4c3d7431
MK
206.\" commit e66eded8309ebf679d3d3c1f5820d1f2ca332c71
207.\" https://lwn.net/Articles/543273/
6bab36f8
MK
208.BR CLONE_NEWUSER
209also automatically implies
210.BR CLONE_FS .
37ee2d61 211.BR CLONE_NEWUSER
88f48716 212requires that the user ID and group ID
6f6808f9 213of the calling process are mapped to user IDs and group IDs in the
37ee2d61 214user namespace of the calling process at the time of the call.
efeece04 215.IP
f647dc5e 216For further information on user namespaces, see
333446b9 217.BR user_namespaces (7).
c2cd5a7f 218.TP
667f4c78 219.BR CLONE_NEWUTS " (since Linux 2.6.19)"
78449461
MK
220This flag has the same effect as the
221.BR clone (2)
222.B CLONE_NEWUTS
223flag.
224Unshare the UTS namespace,
225so that the calling process has a private copy of the
226UTS namespace which is not shared with any other process.
227Use of
228.BR CLONE_NEWUTS
229requires the
230.BR CAP_SYS_ADMIN
231capability.
232.TP
a948ae52 233.BR CLONE_SYSVSEM " (since Linux 2.6.26)"
29015225 234.\" commit 9edff4ab1f8d82675277a04e359d0ed8bf14a7b7
a948ae52
MK
235This flag reverses the effect of the
236.BR clone (2)
237.B CLONE_SYSVSEM
238flag.
0d829b76
MK
239Unshare System\ V semaphore adjustment
240.RI ( semadj )
241values,
242so that the calling process has a new empty
243.I semadj
244list that is not shared with any other process.
245If this is the last process that has a reference to the process's current
246.I semadj
247list, then the adjustments in that list are applied
248to the corresponding semaphores, as described in
249.BR semop (2).
eb359a09 250.\" CLONE_NEWNS If CLONE_SIGHAND is set and signals are also being shared
5cc01e9c 251.\" (i.e., current->signal->count > 1), force CLONE_THREAD.
3d5f4595 252.PP
4dd85833
MK
253In addition,
254.BR CLONE_THREAD ,
255.BR CLONE_SIGHAND ,
256and
257.BR CLONE_VM
258can be specified in
259.I flags
260if the caller is single threaded (i.e., it is not sharing
261its address space with another process or thread).
262In this case, these flags have no effect.
130fbed6
MK
263(Note also that specifying
264.BR CLONE_THREAD
265automatically implies
266.BR CLONE_VM ,
267and specifying
268.BR CLONE_VM
269automatically implies
270.BR CLONE_SIGHAND .)
f231195f
MK
271.\" As at 3.9, the following forced implications also apply,
272.\" although the relevant flags are not yet implemented.
273.\" If CLONE_THREAD is set force CLONE_VM.
274.\" If CLONE_VM is set, force CLONE_SIGHAND.
275.\"
4dd85833
MK
276If the process is multithreaded, then
277the use of these flags results in an error.
278.\" See kernel/fork.c::check_unshare_flags()
279.PP
c13182ef 280If
5cc01e9c
MK
281.I flags
282is specified as zero, then
283.BR unshare ()
284is a no-op;
285no changes are made to the calling process's execution context.
286.SH RETURN VALUE
c13182ef
MK
287On success, zero is returned.
288On failure, \-1 is returned and
289.I errno
5cc01e9c
MK
290is set to indicate the error.
291.SH ERRORS
292.TP
eab64696
MK
293.B EINVAL
294An invalid bit was specified in
295.IR flags .
296.TP
4dd85833
MK
297.B EINVAL
298.BR CLONE_THREAD ,
299.BR CLONE_SIGHAND ,
300or
301.BR CLONE_VM
302was specified in
303.IR flags ,
304and the caller is multithreaded.
305.TP
1f1c28e0
MK
306.B EINVAL
307.BR CLONE_NEWIPC
308was specified in
309.IR flags ,
310but the kernel was not configured with the
311.B CONFIG_SYSVIPC
312and
313.BR CONFIG_IPC_NS
314options.
315.TP
316.B EINVAL
317.BR CLONE_NEWNET
318was specified in
319.IR flags ,
320but the kernel was not configured with the
321.B CONFIG_NET_NS
322option.
323.TP
324.B EINVAL
325.BR CLONE_NEWPID
326was specified in
327.IR flags ,
328but the kernel was not configured with the
329.B CONFIG_PID_NS
330option.
331.TP
332.B EINVAL
333.BR CLONE_NEWUSER
334was specified in
335.IR flags ,
336but the kernel was not configured with the
337.B CONFIG_USER_NS
338option.
339.TP
340.B EINVAL
341.BR CLONE_NEWUTS
342was specified in
343.IR flags ,
344but the kernel was not configured with the
345.B CONFIG_UTS_NS
346option.
347.TP
7827e176
TA
348.B EINVAL
349.BR CLONE_NEWPID
350was specified in
e20f826d
MK
351.IR flags ,
352but the process has previously called
353.BR unshare ()
354with the
355.BR CLONE_NEWPID
356flag.
7827e176 357.TP
eab64696
MK
358.B ENOMEM
359Cannot allocate sufficient memory to copy parts of the caller's
360context that need to be unshared.
361.TP
b20e22ae
MK
362.BR ENOSPC " (since Linux 3.7)"
363.\" commit f2302505775fd13ba93f034206f1e2a587017929
364.B CLONE_NEWPID
365was specified in \fIflags\fP,
366but the limit on the nesting depth of PID namespaces
367would have been exceeded; see
368.BR pid_namespaces (7).
369.TP
b5742ecc
MK
370.BR ENOSPC " (since Linux 4.9; beforehand " EUSERS )
371.B CLONE_NEWUSER
372was specified in
373.IR flags ,
374and the call would cause the limit on the number of
375nested user namespaces to be exceeded.
376See
377.BR user_namespaces (7).
efeece04 378.IP
b5742ecc
MK
379From Linux 3.11 to Linux 4.8, the error diagnosed in this case was
380.BR EUSERS .
381.TP
2f7a331e
MK
382.BR ENOSPC " (since Linux 4.9)"
383One of the values in
384.I flags
385specified the creation of a new user namespace,
386but doing so would have caused the limit defined by the corresponding file in
387.IR /proc/sys/user
388to be exceeded.
389For further details, see
390.BR namespaces (7).
391.TP
5cc01e9c 392.B EPERM
486d4e9b 393The calling process did not have the required privileges for this operation.
365d292a
MK
394.TP
395.B EPERM
396.BR CLONE_NEWUSER
397was specified in
398.IR flags ,
399but either the effective user ID or the effective group ID of the caller
400does not have a mapping in the parent namespace (see
f58fb24f 401.BR user_namespaces (7)).
cdd25f2e 402.TP
40a47a16
MK
403.BR EPERM " (since Linux 3.9)"
404.\" commit 3151527ee007b73a0ebd296010f1c0454a919c7d
12f74390
AM
405.B CLONE_NEWUSER
406was specified in
40a47a16
MK
407.I flags
408and the caller is in a chroot environment
409.\" FIXME What is the rationale for this restriction?
410(i.e., the caller's root directory does not match the root directory
411of the mount namespace in which it resides).
412.TP
b320d728 413.BR EUSERS " (from Linux 3.11 to Linux 4.8)"
cdd25f2e
MK
414.B CLONE_NEWUSER
415was specified in
416.IR flags ,
b5742ecc
MK
417and the limit on the number of nested user namespaces would be exceeded.
418See the discussion of the
419.BR ENOSPC
420error above.
ff457ccb 421.SH VERSIONS
5cc01e9c
MK
422The
423.BR unshare ()
424system call was added to Linux in kernel 2.6.16.
2dd578fd
MK
425.SH CONFORMING TO
426The
427.BR unshare ()
8382f16d 428system call is Linux-specific.
ff457ccb 429.SH NOTES
c13182ef 430Not all of the process attributes that can be shared when
5cc01e9c
MK
431a new process is created using
432.BR clone (2)
433can be unshared using
434.BR unshare ().
3c4e652d 435In particular, as at kernel 3.8,
f26fe082 436.\" FIXME all of the following needs to be reviewed for the current kernel
c13182ef 437.BR unshare ()
5cc01e9c
MK
438does not implement flags that reverse the effects of
439.BR CLONE_SIGHAND ,
3d5f4595 440.\" However, we can do unshare(CLONE_SIGHAND) if CLONE_SIGHAND
5cc01e9c
MK
441.\" was not specified when doing clone(); i.e., unsharing
442.\" signal handlers is permitted if we are not actually
443.\" sharing signal handlers. mtk
3d5f4595
MK
444.BR CLONE_THREAD ,
445or
3d5f4595 446.BR CLONE_VM .
3c4e652d 447.\" However, we can do unshare(CLONE_VM) if CLONE_VM
3d5f4595
MK
448.\" was not specified when doing clone(); i.e., unsharing
449.\" virtual memory is permitted if we are not actually
450.\" sharing virtual memory. mtk
5cc01e9c
MK
451Such functionality may be added in the future, if required.
452.\"
453.\"9) Future Work
454.\"--------------
455.\"The current implementation of unshare does not allow unsharing of
456.\"signals and signal handlers. Signals are complex to begin with and
457.\"to unshare signals and/or signal handlers of a currently running
458.\"process is even more complex. If in the future there is a specific
459.\"need to allow unsharing of signals and/or signal handlers, it can
460.\"be incrementally added to unshare without affecting legacy
461.\"applications using unshare.
462.\"
f919b6e4
MK
463.SH EXAMPLE
464The program below provides a simple implementation of the
465.BR unshare (1)
466command, which unshares one or more namespaces and executes the
08e54e51 467command supplied in its command-line arguments.
f919b6e4
MK
468Here's an example of the use of this program,
469running a shell in a new mount namespace,
470and verifying that the original shell and the
471new shell are in separate mount namespaces:
e646a1ba 472.PP
f919b6e4 473.in +4n
e646a1ba 474.EX
f919b6e4
MK
475$ \fBreadlink /proc/$$/ns/mnt\fP
476mnt:[4026531840]
477$ \fBsudo ./unshare -m /bin/bash\fP
f919b6e4
MK
478# \fBreadlink /proc/$$/ns/mnt\fP
479mnt:[4026532325]
b8302363 480.EE
f919b6e4 481.in
efeece04 482.PP
f919b6e4
MK
483The differing output of the two
484.BR readlink (1)
485commands shows that the two shells are in different mount namespaces.
486.SS Program source
487\&
e7d0bb47 488.EX
f5d401dd 489/* unshare.c
f919b6e4
MK
490
491 A simple implementation of the unshare(1) command: unshare
492 namespaces and execute a command.
493*/
494#define _GNU_SOURCE
495#include <sched.h>
496#include <unistd.h>
497#include <stdlib.h>
498#include <stdio.h>
499
500/* A simple error\-handling function: print an error message based
501 on the value in \(aqerrno\(aq and terminate the calling process */
502
d1a71985 503#define errExit(msg) do { perror(msg); exit(EXIT_FAILURE); \e
f919b6e4
MK
504 } while (0)
505
506static void
507usage(char *pname)
508{
d1a71985
MK
509 fprintf(stderr, "Usage: %s [options] program [arg...]\en", pname);
510 fprintf(stderr, "Options can be:\en");
beb5a76e 511 fprintf(stderr, " \-C unshare cgroup namespace\en");
d1a71985
MK
512 fprintf(stderr, " \-i unshare IPC namespace\en");
513 fprintf(stderr, " \-m unshare mount namespace\en");
514 fprintf(stderr, " \-n unshare network namespace\en");
515 fprintf(stderr, " \-p unshare PID namespace\en");
beb5a76e 516 fprintf(stderr, " \-t unshare time namespace\en");
d1a71985
MK
517 fprintf(stderr, " \-u unshare UTS namespace\en");
518 fprintf(stderr, " \-U unshare user namespace\en");
f919b6e4
MK
519 exit(EXIT_FAILURE);
520}
521
522int
523main(int argc, char *argv[])
524{
525 int flags, opt;
526
527 flags = 0;
528
beb5a76e 529 while ((opt = getopt(argc, argv, "CimnptuU")) != \-1) {
f919b6e4 530 switch (opt) {
beb5a76e 531 case \(aqC\(aq: flags |= CLONE_NEWCGROUP; break;
f919b6e4
MK
532 case \(aqi\(aq: flags |= CLONE_NEWIPC; break;
533 case \(aqm\(aq: flags |= CLONE_NEWNS; break;
534 case \(aqn\(aq: flags |= CLONE_NEWNET; break;
535 case \(aqp\(aq: flags |= CLONE_NEWPID; break;
beb5a76e 536 case \(aqt\(aq: flags |= CLONE_NEWTIME; break;
f919b6e4
MK
537 case \(aqu\(aq: flags |= CLONE_NEWUTS; break;
538 case \(aqU\(aq: flags |= CLONE_NEWUSER; break;
539 default: usage(argv[0]);
540 }
541 }
542
543 if (optind >= argc)
544 usage(argv[0]);
545
546 if (unshare(flags) == \-1)
547 errExit("unshare");
548
f5d401dd 549 execvp(argv[optind], &argv[optind]);
f919b6e4
MK
550 errExit("execvp");
551}
e7d0bb47 552.EE
5cc01e9c 553.SH SEE ALSO
e939d607 554.BR unshare (1),
c13182ef
MK
555.BR clone (2),
556.BR fork (2),
19a98048 557.BR kcmp (2),
47b0eb1e 558.BR setns (2),
3d02560d 559.BR vfork (2),
41096af1 560.BR namespaces (7)
efeece04 561.PP
5bbb004d 562.I Documentation/userspace-api/unshare.rst
173fe7e7 563in the Linux kernel source tree
5bbb004d
ES
564.\" commit f504d47be5e8fa7ecf2bf660b18b42e6960c0eb2
565(or
566.I Documentation/unshare.txt
567before Linux 4.12)