1 /* SPDX-License-Identifier: LGPL-2.1+ */
7 #include <sys/capability.h>
11 #include "alloc-util.h"
12 #include "capability-util.h"
16 #include "missing_prctl.h"
17 #include "parse-util.h"
18 #include "user-util.h"
/* have_effective_cap(): looks up the CAP_EFFECTIVE flag of capability 'value' in the cap_t handle
 * 'cap' by means of cap_get_flag(); the flag value is written to 'fv'. 'cap' is declared with
 * _cleanup_cap_free_, i.e. it is released automatically when it goes out of scope.
 *
 * NOTE(review): this listing is incomplete. The initialisation of 'cap' (presumably from
 * cap_get_proc(), to be confirmed), the declaration of 'fv' and all return statements are not
 * visible, so the return convention is not documented here. */
21 int have_effective_cap(int value
) {
22 _cleanup_cap_free_ cap_t cap
;
29 if (cap_get_flag(cap
, value
, CAP_EFFECTIVE
, &fv
) < 0)
/* cap_last_cap(): determines an unsigned long 'p' describing the last capability known to the
 * running kernel.
 *
 * Visible strategy:
 *   1. Read one line from /proc/sys/kernel/cap_last_cap and parse it with safe_atolu(). Values
 *      above 63 are treated specially because capability masks are kept in uint64_t.
 *   2. Fallback: start at MIN(CAP_LAST_CAP, 63) and probe with prctl(PR_CAPBSET_READ, p). If the
 *      starting value is rejected, step downwards until a probe succeeds; otherwise step upwards
 *      until probing p+1 fails.
 *
 * The thread_local statics 'saved' and 'valid' presumably cache the result per thread; the lines
 * that read and write them are not visible in this listing, confirm against the full source.
 *
 * NOTE(review): this listing is incomplete (declarations of 'r' and 'p', the error branches and the
 * return statement are missing). */
35 unsigned long cap_last_cap(void) {
36 static thread_local
unsigned long saved
;
37 static thread_local
bool valid
= false;
38 _cleanup_free_
char *content
= NULL
;
45 /* available since linux-3.2 */
46 r
= read_one_line_file("/proc/sys/kernel/cap_last_cap", &content
);
48 r
= safe_atolu(content
, &p
);
51 if (p
> 63) /* Safety for the future: if one day the kernel learns more than 64 caps,
52 * then we are in trouble (since we, as much userspace and kernel space
53 * store capability masks in uint64_t types). Let's hence protect
54 * ourselves against that and always cap at 63 for now. */
63 /* fall back to syscall-probing for pre linux-3.2 */
64 p
= MIN((unsigned long) CAP_LAST_CAP
, 63U);
66 if (prctl(PR_CAPBSET_READ
, p
) < 0) {
68 /* Hmm, look downwards, until we find one that works */
69 for (p
--; p
> 0; p
--)
70 if (prctl(PR_CAPBSET_READ
, p
) >= 0)
75 /* Hmm, look upwards, until we find one that doesn't work */
77 if (prctl(PR_CAPBSET_READ
, p
+1) < 0)
/* capability_update_inherited_set(): for every bit i that is set in the 64-bit mask 'set', calls
 * cap_set_flag(caps, CAP_INHERITABLE, 1, &v, CAP_SET), i.e. marks that capability as inheritable
 * in the caller-supplied 'caps' object. The visible lines only modify 'caps'; they do not apply
 * anything to the running process.
 *
 * NOTE(review): the loop condition here is 'i < cap_last_cap()', while capability_bounding_set_drop()
 * and capability_quintet_enforce() in this file iterate with 'i <= cap_last_cap()'. If
 * cap_last_cap() yields the index of the highest capability, that capability is never processed
 * here. Confirm which bound is intended and align the loops.
 *
 * NOTE(review): this listing is incomplete (declarations of 'i' and 'v', the assignment to 'v' and
 * the return statements are missing), so the error convention is not documented here. */
87 int capability_update_inherited_set(cap_t caps
, uint64_t set
) {
90 /* Add capabilities in the set to the inherited caps. Do not apply
93 for (i
= 0; i
< cap_last_cap(); i
++) {
95 if (set
& (UINT64_C(1) << i
)) {
100 /* Make the capability inheritable. */
101 if (cap_set_flag(caps
, CAP_INHERITABLE
, 1, &v
, CAP_SET
) < 0)
/* capability_ambient_set_apply(): raises the capabilities selected by the 64-bit mask 'set' in the
 * ambient set of the calling process.
 *
 * Visible steps:
 *   - fetch the current process capabilities with cap_get_proc(), add 'set' to the inheritable
 *     flags through capability_update_inherited_set() and install the result with cap_set_proc();
 *   - for every bit i set in 'set', call prctl(PR_CAP_AMBIENT, PR_CAP_AMBIENT_RAISE, i, 0, 0).
 *
 * 'also_inherit' presumably decides whether the first step runs at all; the conditional itself is
 * not visible in this listing, confirm against the full source.
 *
 * NOTE(review): the loop condition is 'i < cap_last_cap()', while capability_bounding_set_drop()
 * and capability_quintet_enforce() in this file use 'i <= cap_last_cap()'. If cap_last_cap()
 * yields the index of the highest capability, that capability can never be raised here. Confirm
 * which bound is intended.
 *
 * NOTE(review): this listing is incomplete (declarations of 'i' and 'r', error branches and return
 * statements are missing). */
109 int capability_ambient_set_apply(uint64_t set
, bool also_inherit
) {
110 _cleanup_cap_free_ cap_t caps
= NULL
;
114 /* Add the capabilities to the ambient set. */
117 caps
= cap_get_proc();
121 r
= capability_update_inherited_set(caps
, set
);
125 if (cap_set_proc(caps
) < 0)
129 for (i
= 0; i
< cap_last_cap(); i
++) {
131 if (set
& (UINT64_C(1) << i
)) {
133 /* Add the capability to the ambient set. */
134 if (prctl(PR_CAP_AMBIENT
, PR_CAP_AMBIENT_RAISE
, i
, 0, 0) < 0)
/* capability_bounding_set_drop(): removes capabilities from the bounding set of the calling
 * process, sparing those whose bit is set in the 64-bit mask 'keep'.
 *
 * Visible steps:
 *   - snapshot the process capabilities into 'before_cap' and query whether CAP_SETPCAP is in the
 *     effective set;
 *   - build 'temp_cap' (a copy of 'before_cap' with CAP_SETPCAP raised in the effective set) and
 *     install it; a failure of that cap_set_proc() is only logged at debug level and ignored;
 *   - duplicate 'before_cap' into 'after_cap', then walk i = 0 .. cap_last_cap() inclusive. Bits
 *     present in 'keep' are tested first; for the others prctl(PR_CAPBSET_DROP, i) is issued and,
 *     if that fails, prctl(PR_CAPBSET_READ, i) is consulted. The capability is also cleared from
 *     the inheritable flags of 'after_cap', and the permitted and effective flags are cleared as
 *     well (per the in-code comment, when the change shall apply right now, presumably governed
 *     by 'right_now'; the conditional is not visible);
 *   - install 'after_cap'; on failure, cap_compare(before_cap, after_cap) is used to tell whether
 *     anything actually changed.
 *
 * NOTE(review): this listing is incomplete (declarations of 'i', 'v', 'fv' and 'r', several
 * conditionals, all error branches and return statements are missing). */
142 int capability_bounding_set_drop(uint64_t keep
, bool right_now
) {
143 _cleanup_cap_free_ cap_t before_cap
= NULL
, after_cap
= NULL
;
148 /* If we are run as PID 1 we will lack CAP_SETPCAP by default
149 * in the effective set (yes, the kernel drops that when
150 * executing init!), so get it back temporarily so that we can
151 * call PR_CAPBSET_DROP. */
153 before_cap
= cap_get_proc();
157 if (cap_get_flag(before_cap
, CAP_SETPCAP
, CAP_EFFECTIVE
, &fv
) < 0)
161 _cleanup_cap_free_ cap_t temp_cap
= NULL
;
162 static const cap_value_t v
= CAP_SETPCAP
;
164 temp_cap
= cap_dup(before_cap
);
168 if (cap_set_flag(temp_cap
, CAP_EFFECTIVE
, 1, &v
, CAP_SET
) < 0)
171 if (cap_set_proc(temp_cap
) < 0)
172 log_debug_errno(errno
, "Can't acquire effective CAP_SETPCAP bit, ignoring: %m");
174 /* If we didn't manage to acquire the CAP_SETPCAP bit, we continue anyway, after all this just means
175 * we'll fail later, when we actually intend to drop some capabilities. */
178 after_cap
= cap_dup(before_cap
);
182 for (i
= 0; i
<= cap_last_cap(); i
++) {
185 if ((keep
& (UINT64_C(1) << i
)))
188 /* Drop it from the bounding set */
189 if (prctl(PR_CAPBSET_DROP
, i
) < 0) {
192 /* If dropping the capability failed, let's see if we didn't have it in the first place. If so,
193 * continue anyway, as dropping a capability we didn't have in the first place doesn't really
195 if (prctl(PR_CAPBSET_READ
, i
) != 0)
200 /* Also drop it from the inheritable set, so
201 * that anything we exec() loses the
202 * capability for good. */
203 if (cap_set_flag(after_cap
, CAP_INHERITABLE
, 1, &v
, CAP_CLEAR
) < 0) {
208 /* If we shall apply this right now drop it
209 * also from our own capability sets. */
211 if (cap_set_flag(after_cap
, CAP_PERMITTED
, 1, &v
, CAP_CLEAR
) < 0 ||
212 cap_set_flag(after_cap
, CAP_EFFECTIVE
, 1, &v
, CAP_CLEAR
) < 0) {
222 if (cap_set_proc(after_cap
) < 0) {
223 /* If there are no actual changes anyway then let's ignore this error. */
224 if (cap_compare(before_cap
, after_cap
) != 0)
/* drop_from_file(): masks the 64-bit capability value stored in the file 'fn' with 'keep'.
 *
 * The file is read as a single line and parsed with sscanf("%u %u") into 'lo' and 'hi', which are
 * combined as lo | (hi << 32) to form 'current'. 'after' is current & keep; the two values are
 * compared (presumably to return early when nothing changes; the branch body is not visible).
 * Otherwise 'after' is split back into two 32-bit halves and written to 'fn' with
 * write_string_filef(..., WRITE_STRING_FILE_CREATE, "%u %u", lo, hi), whose result is returned.
 *
 * The assert_cc() lines check at compile time that 'lo' and 'hi' have the size of 'unsigned', which
 * the "%u" conversions rely on.
 *
 * NOTE(review): this listing is incomplete (declarations of 'lo', 'hi', 'r' and 'k' and the error
 * handling after read_one_line_file() and sscanf() are missing). */
231 static int drop_from_file(const char *fn
, uint64_t keep
) {
232 _cleanup_free_
char *p
= NULL
;
233 uint64_t current
, after
;
237 r
= read_one_line_file(fn
, &p
);
241 assert_cc(sizeof(hi
) == sizeof(unsigned));
242 assert_cc(sizeof(lo
) == sizeof(unsigned));
244 k
= sscanf(p
, "%u %u", &lo
, &hi
);
248 current
= (uint64_t) lo
| ((uint64_t) hi
<< 32ULL);
249 after
= current
& keep
;
251 if (current
== after
)
254 lo
= (unsigned) (after
& 0xFFFFFFFFULL
);
255 hi
= (unsigned) ((after
>> 32ULL) & 0xFFFFFFFFULL
);
257 return write_string_filef(fn
, WRITE_STRING_FILE_CREATE
, "%u %u", lo
, hi
);
/* capability_bounding_set_drop_usermode(): applies the mask 'keep' via drop_from_file() to
 * /proc/sys/kernel/usermodehelper/inheritable first and /proc/sys/kernel/usermodehelper/bset
 * second.
 *
 * NOTE(review): this listing is incomplete (the declaration of 'r', the checks on each result and
 * the return statements are missing), so the error convention is not documented here. */
260 int capability_bounding_set_drop_usermode(uint64_t keep
) {
263 r
= drop_from_file("/proc/sys/kernel/usermodehelper/inheritable", keep
);
267 r
= drop_from_file("/proc/sys/kernel/usermodehelper/bset", keep
);
/* drop_privileges(): switches the calling process to user 'uid' and group 'gid' while retaining
 * the capabilities selected by the 64-bit mask 'keep_capabilities'.
 *
 * Visible sequence (each failure is logged with log_error_errno() and that value is returned):
 *   1. setresgid(gid, gid, gid), then maybe_setgroups(0, NULL) to drop the auxiliary groups;
 *   2. prctl(PR_SET_KEEPCAPS, 1), setresuid(uid, uid, uid), prctl(PR_SET_KEEPCAPS, 0);
 *   3. capability_bounding_set_drop(keep_capabilities, true);
 *   4. if 'keep_capabilities' is non-zero: collect the kept capabilities in the array 'bits'
 *      (sized u64log2(keep_capabilities) + 1), raise them in the effective and permitted flags
 *      of 'd' and install 'd' with cap_set_proc(). The two assert() calls sanity-check that the
 *      loop index covered exactly the bits present in the mask.
 *
 * NOTE(review): this listing is incomplete (declarations of 'r', 'i' and 'j', the initialisation of
 * 'd', the body that fills 'bits', the 'if (r < 0)' guards and the final return are missing). */
274 int drop_privileges(uid_t uid
, gid_t gid
, uint64_t keep_capabilities
) {
277 /* Unfortunately we cannot leave privilege dropping to PID 1 here, since we want to run as user but
278 * want to keep some capabilities. Since file capabilities have been introduced this cannot be done
279 * across exec() anymore, unless our binary has the capability configured in the file system, which
280 * we want to avoid. */
282 if (setresgid(gid
, gid
, gid
) < 0)
283 return log_error_errno(errno
, "Failed to change group ID: %m");
285 r
= maybe_setgroups(0, NULL
);
287 return log_error_errno(r
, "Failed to drop auxiliary groups list: %m");
289 /* Ensure we keep the permitted caps across the setresuid(). Note that we do this even if we actually
290 * don't want to keep any capabilities, since we want to be able to drop them from the bounding set
291 * too, and we can only do that if we have capabilities. */
292 if (prctl(PR_SET_KEEPCAPS
, 1) < 0)
293 return log_error_errno(errno
, "Failed to enable keep capabilities flag: %m");
295 if (setresuid(uid
, uid
, uid
) < 0)
296 return log_error_errno(errno
, "Failed to change user ID: %m");
298 if (prctl(PR_SET_KEEPCAPS
, 0) < 0)
299 return log_error_errno(errno
, "Failed to disable keep capabilities flag: %m");
301 /* Drop all caps from the bounding set (as well as the inheritable/permitted/effective sets), except
302 * the ones we want to keep */
303 r
= capability_bounding_set_drop(keep_capabilities
, true);
305 return log_error_errno(r
, "Failed to drop capabilities: %m");
307 /* Now upgrade the permitted caps we still kept to effective caps */
308 if (keep_capabilities
!= 0) {
309 cap_value_t bits
[u64log2(keep_capabilities
) + 1];
310 _cleanup_cap_free_ cap_t d
= NULL
;
317 for (i
= 0; i
< ELEMENTSOF(bits
); i
++)
318 if (keep_capabilities
& (1ULL << i
))
321 /* use enough bits */
322 assert(i
== 64 || (keep_capabilities
>> i
) == 0);
323 /* don't use too many bits */
324 assert(keep_capabilities
& (UINT64_C(1) << (i
- 1)));
326 if (cap_set_flag(d
, CAP_EFFECTIVE
, j
, bits
, CAP_SET
) < 0 ||
327 cap_set_flag(d
, CAP_PERMITTED
, j
, bits
, CAP_SET
) < 0)
328 return log_error_errno(errno
, "Failed to enable capabilities bits: %m");
330 if (cap_set_proc(d
) < 0)
331 return log_error_errno(errno
, "Failed to increase capabilities: %m");
/* drop_capability(): removes the single capability 'cv' from the calling process. The current
 * capabilities are fetched with cap_get_proc(), 'cv' is cleared from the inheritable, permitted and
 * effective flags (in that order, stopping at the first cap_set_flag() failure), and the result is
 * installed with cap_set_proc(). 'tmp_cap' is released automatically via _cleanup_cap_free_.
 *
 * NOTE(review): this listing is incomplete (the NULL check after cap_get_proc(), the error
 * branches and the return statements are missing), so the error convention is not documented
 * here. */
337 int drop_capability(cap_value_t cv
) {
338 _cleanup_cap_free_ cap_t tmp_cap
= NULL
;
340 tmp_cap
= cap_get_proc();
344 if ((cap_set_flag(tmp_cap
, CAP_INHERITABLE
, 1, &cv
, CAP_CLEAR
) < 0) ||
345 (cap_set_flag(tmp_cap
, CAP_PERMITTED
, 1, &cv
, CAP_CLEAR
) < 0) ||
346 (cap_set_flag(tmp_cap
, CAP_EFFECTIVE
, 1, &cv
, CAP_CLEAR
) < 0))
349 if (cap_set_proc(tmp_cap
) < 0)
/* ambient_capabilities_supported(): probes whether the kernel understands ambient capabilities by
 * issuing prctl(PR_CAP_AMBIENT, PR_CAP_AMBIENT_IS_SET, CAP_KILL, 0, 0). The probe counts as
 * "supported" when the call succeeds, or when it fails with an errno other than EINVAL, EOPNOTSUPP
 * or ENOSYS. The outcome is stored in the static 'cache', which starts out as -1.
 *
 * Presumably a non-negative 'cache' short-circuits later calls; the check and the return statement
 * are not visible in this listing, confirm against the full source. */
355 bool ambient_capabilities_supported(void) {
356 static int cache
= -1;
361 /* If PR_CAP_AMBIENT returns something valid, or an unexpected error code we assume that ambient caps are
364 cache
= prctl(PR_CAP_AMBIENT
, PR_CAP_AMBIENT_IS_SET
, CAP_KILL
, 0, 0) >= 0 ||
365 !IN_SET(errno
, EINVAL
, EOPNOTSUPP
, ENOSYS
);
/* capability_quintet_enforce(): applies the capability sets described by '*q' (fields 'ambient',
 * 'inheritable', 'permitted', 'effective' and 'bounding') to the calling process. A field equal to
 * (uint64_t) -1 is treated as "not specified" and its stage is skipped.
 *
 * Visible stages, in order:
 *   1. ambient: for each i = 0 .. cap_last_cap() inclusive whose bit is set in q->ambient, make
 *      sure the capability is set in both the inheritable and permitted flags of 'c', install 'c'
 *      with cap_set_proc(), then call capability_ambient_set_apply(q->ambient, false);
 *   2. inheritable / permitted / effective: for each i = 0 .. cap_last_cap() inclusive, compare
 *      the current flag in 'c' with the requested bit and update it through cap_set_flag() when
 *      they differ. Per the in-code comment, EINVAL from cap_get_flag() means libcap does not know
 *      that capability and it is ignored;
 *   3. if q->bounding is specified, 'modified' becomes a copy of 'c' with CAP_SETPCAP raised in
 *      the permitted and effective flags, so the bounding set can still be changed; then
 *      cap_set_proc(modified ?: c) installs the caps for the first time;
 *   4. capability_bounding_set_drop(q->bounding, false);
 *   5. a final cap_set_proc(c) installs the version without the temporary CAP_SETPCAP bit.
 *
 * NOTE(review): this listing is incomplete. The initialisation of 'c', the declarations of 'i' and
 * 'r', the updates of 'changed', all error branches and the end of the function are not visible,
 * so the return convention is not documented here. */
370 int capability_quintet_enforce(const CapabilityQuintet
*q
) {
371 _cleanup_cap_free_ cap_t c
= NULL
, modified
= NULL
;
374 if (q
->ambient
!= (uint64_t) -1) {
376 bool changed
= false;
382 /* In order to raise the ambient caps set we first need to raise the matching inheritable + permitted
384 for (i
= 0; i
<= cap_last_cap(); i
++) {
385 uint64_t m
= UINT64_C(1) << i
;
386 cap_value_t cv
= (cap_value_t
) i
;
387 cap_flag_value_t old_value_inheritable
, old_value_permitted
;
389 if ((q
->ambient
& m
) == 0)
392 if (cap_get_flag(c
, cv
, CAP_INHERITABLE
, &old_value_inheritable
) < 0)
394 if (cap_get_flag(c
, cv
, CAP_PERMITTED
, &old_value_permitted
) < 0)
397 if (old_value_inheritable
== CAP_SET
&& old_value_permitted
== CAP_SET
)
400 if (cap_set_flag(c
, CAP_INHERITABLE
, 1, &cv
, CAP_SET
) < 0)
402 if (cap_set_flag(c
, CAP_PERMITTED
, 1, &cv
, CAP_SET
) < 0)
409 if (cap_set_proc(c
) < 0)
412 r
= capability_ambient_set_apply(q
->ambient
, false);
417 if (q
->inheritable
!= (uint64_t) -1 || q
->permitted
!= (uint64_t) -1 || q
->effective
!= (uint64_t) -1) {
418 bool changed
= false;
427 for (i
= 0; i
<= cap_last_cap(); i
++) {
428 uint64_t m
= UINT64_C(1) << i
;
429 cap_value_t cv
= (cap_value_t
) i
;
431 if (q
->inheritable
!= (uint64_t) -1) {
432 cap_flag_value_t old_value
, new_value
;
434 if (cap_get_flag(c
, cv
, CAP_INHERITABLE
, &old_value
) < 0) {
435 if (errno
== EINVAL
) /* If the kernel knows more caps than this
436 * version of libcap, then this will return
437 * EINVAL. In that case, simply ignore it,
438 * pretend it doesn't exist. */
444 new_value
= (q
->inheritable
& m
) ? CAP_SET
: CAP_CLEAR
;
446 if (old_value
!= new_value
) {
449 if (cap_set_flag(c
, CAP_INHERITABLE
, 1, &cv
, new_value
) < 0)
454 if (q
->permitted
!= (uint64_t) -1) {
455 cap_flag_value_t old_value
, new_value
;
457 if (cap_get_flag(c
, cv
, CAP_PERMITTED
, &old_value
) < 0) {
464 new_value
= (q
->permitted
& m
) ? CAP_SET
: CAP_CLEAR
;
466 if (old_value
!= new_value
) {
469 if (cap_set_flag(c
, CAP_PERMITTED
, 1, &cv
, new_value
) < 0)
474 if (q
->effective
!= (uint64_t) -1) {
475 cap_flag_value_t old_value
, new_value
;
477 if (cap_get_flag(c
, cv
, CAP_EFFECTIVE
, &old_value
) < 0) {
484 new_value
= (q
->effective
& m
) ? CAP_SET
: CAP_CLEAR
;
486 if (old_value
!= new_value
) {
489 if (cap_set_flag(c
, CAP_EFFECTIVE
, 1, &cv
, new_value
) < 0)
496 /* In order to change the bounding caps, we need to keep CAP_SETPCAP for a bit
497 * longer. Let's add it to our list hence for now. */
498 if (q
->bounding
!= (uint64_t) -1) {
499 cap_value_t cv
= CAP_SETPCAP
;
501 modified
= cap_dup(c
);
505 if (cap_set_flag(modified
, CAP_PERMITTED
, 1, &cv
, CAP_SET
) < 0)
507 if (cap_set_flag(modified
, CAP_EFFECTIVE
, 1, &cv
, CAP_SET
) < 0)
510 if (cap_compare(modified
, c
) == 0) {
511 /* No change? then drop this nonsense again */
517 /* Now, let's enforce the caps for the first time. Note that this is where we acquire
518 * caps in any of the sets we currently don't have. We have to do this before
519 * dropping the bounding caps below, since at that point we can never acquire new
520 * caps in inherited/permitted/effective anymore, but only lose them. */
521 if (cap_set_proc(modified
?: c
) < 0)
526 if (q
->bounding
!= (uint64_t) -1) {
527 r
= capability_bounding_set_drop(q
->bounding
, false);
532 /* If needed, let's now set the caps again, this time in the final version, which differs from what
533 * we have already set only in the CAP_SETPCAP bit, which we needed for dropping the bounding
534 * bits. This call only undoes bits and doesn't acquire any which means the bounding caps don't
537 if (cap_set_proc(c
) < 0)