2 This file is part of systemd.
4 Copyright 2016 Lennart Poettering
6 systemd is free software; you can redistribute it and/or modify it
7 under the terms of the GNU Lesser General Public License as published by
8 the Free Software Foundation; either version 2.1 of the License, or
9 (at your option) any later version.
11 systemd is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public License
17 along with systemd; If not, see <http://www.gnu.org/licenses/>.
22 #include <sys/eventfd.h>
26 #include <sys/types.h>
29 #include "alloc-util.h"
34 #include "process-util.h"
35 #include "raw-clone.h"
36 #include "seccomp-util.h"
38 #include "string-util.h"
42 static void test_seccomp_arch_to_string(void) {
46 a
= seccomp_arch_native();
48 name
= seccomp_arch_to_string(a
);
50 assert_se(seccomp_arch_from_string(name
, &b
) >= 0);
54 static void test_architecture_table(void) {
77 assert_se(seccomp_arch_from_string(n
, &c
) >= 0);
78 n2
= seccomp_arch_to_string(c
);
79 log_info("seccomp-arch: %s → 0x%"PRIx32
" → %s", n
, c
, n2
);
80 assert_se(streq_ptr(n
, n2
));
84 static void test_syscall_filter_set_find(void) {
85 assert_se(!syscall_filter_set_find(NULL
));
86 assert_se(!syscall_filter_set_find(""));
87 assert_se(!syscall_filter_set_find("quux"));
88 assert_se(!syscall_filter_set_find("@quux"));
90 assert_se(syscall_filter_set_find("@clock") == syscall_filter_sets
+ SYSCALL_FILTER_SET_CLOCK
);
91 assert_se(syscall_filter_set_find("@default") == syscall_filter_sets
+ SYSCALL_FILTER_SET_DEFAULT
);
92 assert_se(syscall_filter_set_find("@raw-io") == syscall_filter_sets
+ SYSCALL_FILTER_SET_RAW_IO
);
95 static void test_filter_sets(void) {
99 if (!is_seccomp_available())
104 for (i
= 0; i
< _SYSCALL_FILTER_SET_MAX
; i
++) {
107 log_info("Testing %s", syscall_filter_sets
[i
].name
);
112 if (pid
== 0) { /* Child? */
115 if (i
== SYSCALL_FILTER_SET_DEFAULT
) /* if we look at the default set, whitelist instead of blacklist */
116 r
= seccomp_load_syscall_filter_set(SCMP_ACT_ERRNO(EUCLEAN
), syscall_filter_sets
+ i
, SCMP_ACT_ALLOW
);
118 r
= seccomp_load_syscall_filter_set(SCMP_ACT_ALLOW
, syscall_filter_sets
+ i
, SCMP_ACT_ERRNO(EUCLEAN
));
122 /* Test the syscall filter with one random system call */
123 fd
= eventfd(0, EFD_NONBLOCK
|EFD_CLOEXEC
);
124 if (IN_SET(i
, SYSCALL_FILTER_SET_IO_EVENT
, SYSCALL_FILTER_SET_DEFAULT
))
125 assert_se(fd
< 0 && errno
== EUCLEAN
);
134 assert_se(wait_for_terminate_and_warn(syscall_filter_sets
[i
].name
, pid
, true) == EXIT_SUCCESS
);
138 static void test_restrict_namespace(void) {
139 _cleanup_free_
char *s
= NULL
;
143 assert_se(namespace_flag_to_string(0) == NULL
);
144 assert_se(streq(namespace_flag_to_string(CLONE_NEWNS
), "mnt"));
145 assert_se(namespace_flag_to_string(CLONE_NEWNS
|CLONE_NEWIPC
) == NULL
);
146 assert_se(streq(namespace_flag_to_string(CLONE_NEWCGROUP
), "cgroup"));
148 assert_se(namespace_flag_from_string("mnt") == CLONE_NEWNS
);
149 assert_se(namespace_flag_from_string(NULL
) == 0);
150 assert_se(namespace_flag_from_string("") == 0);
151 assert_se(namespace_flag_from_string("uts") == CLONE_NEWUTS
);
152 assert_se(namespace_flag_from_string(namespace_flag_to_string(CLONE_NEWUTS
)) == CLONE_NEWUTS
);
153 assert_se(streq(namespace_flag_to_string(namespace_flag_from_string("ipc")), "ipc"));
155 assert_se(namespace_flag_from_string_many(NULL
, &ul
) == 0 && ul
== 0);
156 assert_se(namespace_flag_from_string_many("", &ul
) == 0 && ul
== 0);
157 assert_se(namespace_flag_from_string_many("mnt uts ipc", &ul
) == 0 && ul
== (CLONE_NEWNS
|CLONE_NEWUTS
|CLONE_NEWIPC
));
159 assert_se(namespace_flag_to_string_many(NAMESPACE_FLAGS_ALL
, &s
) == 0);
160 assert_se(streq(s
, "cgroup ipc net mnt pid user uts"));
161 assert_se(namespace_flag_from_string_many(s
, &ul
) == 0 && ul
== NAMESPACE_FLAGS_ALL
);
163 #if SECCOMP_RESTRICT_NAMESPACES_BROKEN == 0
165 if (!is_seccomp_available())
175 assert_se(seccomp_restrict_namespaces(CLONE_NEWNS
|CLONE_NEWNET
) >= 0);
177 assert_se(unshare(CLONE_NEWNS
) == 0);
178 assert_se(unshare(CLONE_NEWNET
) == 0);
179 assert_se(unshare(CLONE_NEWUTS
) == -1);
180 assert_se(errno
== EPERM
);
181 assert_se(unshare(CLONE_NEWIPC
) == -1);
182 assert_se(errno
== EPERM
);
183 assert_se(unshare(CLONE_NEWNET
|CLONE_NEWUTS
) == -1);
184 assert_se(errno
== EPERM
);
186 /* We use fd 0 (stdin) here, which will of course fail with EINVAL on setns() -- unless our seccomp
187 * filter matches the call, in which case it triggers first and makes it return EPERM instead. */
188 assert_se(setns(0, CLONE_NEWNS
) == -1);
189 assert_se(errno
== EINVAL
);
190 assert_se(setns(0, CLONE_NEWNET
) == -1);
191 assert_se(errno
== EINVAL
);
192 assert_se(setns(0, CLONE_NEWUTS
) == -1);
193 assert_se(errno
== EPERM
);
194 assert_se(setns(0, CLONE_NEWIPC
) == -1);
195 assert_se(errno
== EPERM
);
196 assert_se(setns(0, CLONE_NEWNET
|CLONE_NEWUTS
) == -1);
197 assert_se(errno
== EPERM
);
198 assert_se(setns(0, 0) == -1);
199 assert_se(errno
== EPERM
);
201 pid
= raw_clone(CLONE_NEWNS
);
205 pid
= raw_clone(CLONE_NEWNET
);
209 pid
= raw_clone(CLONE_NEWUTS
);
211 assert_se(errno
== EPERM
);
212 pid
= raw_clone(CLONE_NEWIPC
);
214 assert_se(errno
== EPERM
);
215 pid
= raw_clone(CLONE_NEWNET
|CLONE_NEWUTS
);
217 assert_se(errno
== EPERM
);
222 assert_se(wait_for_terminate_and_warn("nsseccomp", pid
, true) == EXIT_SUCCESS
);
226 static void test_protect_sysctl(void) {
229 if (!is_seccomp_available())
234 if (detect_container() > 0) /* in containers _sysctl() is likely missing anyway */
241 assert_se(syscall(__NR__sysctl
, NULL
) < 0);
242 assert_se(errno
== EFAULT
);
244 assert_se(seccomp_protect_sysctl() >= 0);
246 assert_se(syscall(__NR__sysctl
, 0, 0, 0) < 0);
247 assert_se(errno
== EPERM
);
252 assert_se(wait_for_terminate_and_warn("sysctlseccomp", pid
, true) == EXIT_SUCCESS
);
255 static void test_restrict_address_families(void) {
258 if (!is_seccomp_available())
270 fd
= socket(AF_INET
, SOCK_DGRAM
, 0);
274 fd
= socket(AF_UNIX
, SOCK_DGRAM
, 0);
278 fd
= socket(AF_NETLINK
, SOCK_DGRAM
, 0);
282 assert_se(s
= set_new(NULL
));
283 assert_se(set_put(s
, INT_TO_PTR(AF_UNIX
)) >= 0);
285 assert_se(seccomp_restrict_address_families(s
, false) >= 0);
287 fd
= socket(AF_INET
, SOCK_DGRAM
, 0);
291 fd
= socket(AF_UNIX
, SOCK_DGRAM
, 0);
292 #if SECCOMP_RESTRICT_ADDRESS_FAMILIES_BROKEN
297 assert_se(errno
== EAFNOSUPPORT
);
300 fd
= socket(AF_NETLINK
, SOCK_DGRAM
, 0);
306 assert_se(set_put(s
, INT_TO_PTR(AF_INET
)) >= 0);
308 assert_se(seccomp_restrict_address_families(s
, true) >= 0);
310 fd
= socket(AF_INET
, SOCK_DGRAM
, 0);
314 fd
= socket(AF_UNIX
, SOCK_DGRAM
, 0);
315 #if SECCOMP_RESTRICT_ADDRESS_FAMILIES_BROKEN
320 assert_se(errno
== EAFNOSUPPORT
);
323 fd
= socket(AF_NETLINK
, SOCK_DGRAM
, 0);
324 #if SECCOMP_RESTRICT_ADDRESS_FAMILIES_BROKEN
329 assert_se(errno
== EAFNOSUPPORT
);
335 assert_se(wait_for_terminate_and_warn("socketseccomp", pid
, true) == EXIT_SUCCESS
);
338 static void test_restrict_realtime(void) {
341 if (!is_seccomp_available())
346 if (detect_container() > 0) /* in containers RT privs are likely missing anyway */
353 assert_se(sched_setscheduler(0, SCHED_FIFO
, &(struct sched_param
) { .sched_priority
= 1 }) >= 0);
354 assert_se(sched_setscheduler(0, SCHED_RR
, &(struct sched_param
) { .sched_priority
= 1 }) >= 0);
355 assert_se(sched_setscheduler(0, SCHED_IDLE
, &(struct sched_param
) { .sched_priority
= 0 }) >= 0);
356 assert_se(sched_setscheduler(0, SCHED_BATCH
, &(struct sched_param
) { .sched_priority
= 0 }) >= 0);
357 assert_se(sched_setscheduler(0, SCHED_OTHER
, &(struct sched_param
) {}) >= 0);
359 assert_se(seccomp_restrict_realtime() >= 0);
361 assert_se(sched_setscheduler(0, SCHED_IDLE
, &(struct sched_param
) { .sched_priority
= 0 }) >= 0);
362 assert_se(sched_setscheduler(0, SCHED_BATCH
, &(struct sched_param
) { .sched_priority
= 0 }) >= 0);
363 assert_se(sched_setscheduler(0, SCHED_OTHER
, &(struct sched_param
) {}) >= 0);
365 assert_se(sched_setscheduler(0, SCHED_FIFO
, &(struct sched_param
) { .sched_priority
= 1 }) < 0);
366 assert_se(errno
== EPERM
);
367 assert_se(sched_setscheduler(0, SCHED_RR
, &(struct sched_param
) { .sched_priority
= 1 }) < 0);
368 assert_se(errno
== EPERM
);
373 assert_se(wait_for_terminate_and_warn("realtimeseccomp", pid
, true) == EXIT_SUCCESS
);
376 static void test_memory_deny_write_execute_mmap(void) {
379 if (!is_seccomp_available())
390 p
= mmap(NULL
, page_size(), PROT_WRITE
|PROT_EXEC
, MAP_PRIVATE
|MAP_ANONYMOUS
, -1,0);
391 assert_se(p
!= MAP_FAILED
);
392 assert_se(munmap(p
, page_size()) >= 0);
394 p
= mmap(NULL
, page_size(), PROT_WRITE
|PROT_READ
, MAP_PRIVATE
|MAP_ANONYMOUS
, -1,0);
395 assert_se(p
!= MAP_FAILED
);
396 assert_se(munmap(p
, page_size()) >= 0);
398 assert_se(seccomp_memory_deny_write_execute() >= 0);
400 p
= mmap(NULL
, page_size(), PROT_WRITE
|PROT_EXEC
, MAP_PRIVATE
|MAP_ANONYMOUS
, -1,0);
401 #if defined(__x86_64__) || defined(__i386__) || defined(__powerpc64__)
402 assert_se(p
== MAP_FAILED
);
403 assert_se(errno
== EPERM
);
404 #else /* unknown architectures */
405 assert_se(p
!= MAP_FAILED
);
406 assert_se(munmap(p
, page_size()) >= 0);
409 p
= mmap(NULL
, page_size(), PROT_WRITE
|PROT_READ
, MAP_PRIVATE
|MAP_ANONYMOUS
, -1,0);
410 assert_se(p
!= MAP_FAILED
);
411 assert_se(munmap(p
, page_size()) >= 0);
416 assert_se(wait_for_terminate_and_warn("memoryseccomp-mmap", pid
, true) == EXIT_SUCCESS
);
419 static void test_memory_deny_write_execute_shmat(void) {
423 if (!is_seccomp_available())
428 shmid
= shmget(IPC_PRIVATE
, page_size(), 0);
429 assert_se(shmid
>= 0);
437 p
= shmat(shmid
, NULL
, 0);
438 assert_se(p
!= MAP_FAILED
);
439 assert_se(shmdt(p
) == 0);
441 p
= shmat(shmid
, NULL
, SHM_EXEC
);
442 assert_se(p
!= MAP_FAILED
);
443 assert_se(shmdt(p
) == 0);
445 assert_se(seccomp_memory_deny_write_execute() >= 0);
447 p
= shmat(shmid
, NULL
, SHM_EXEC
);
448 #if defined(__x86_64__)
449 assert_se(p
== MAP_FAILED
);
450 assert_se(errno
== EPERM
);
451 #else /* __i386__, __powerpc64__, and "unknown" architectures */
452 assert_se(p
!= MAP_FAILED
);
453 assert_se(shmdt(p
) == 0);
456 p
= shmat(shmid
, NULL
, 0);
457 assert_se(p
!= MAP_FAILED
);
458 assert_se(shmdt(p
) == 0);
463 assert_se(wait_for_terminate_and_warn("memoryseccomp-shmat", pid
, true) == EXIT_SUCCESS
);
466 static void test_restrict_archs(void) {
469 if (!is_seccomp_available())
478 _cleanup_set_free_ Set
*s
= NULL
;
480 assert_se(access("/", F_OK
) >= 0);
482 assert_se(s
= set_new(NULL
));
485 assert_se(set_put(s
, UINT32_TO_PTR(SCMP_ARCH_X86
+1)) >= 0);
487 assert_se(seccomp_restrict_archs(s
) >= 0);
489 assert_se(access("/", F_OK
) >= 0);
490 assert_se(seccomp_restrict_archs(NULL
) >= 0);
492 assert_se(access("/", F_OK
) >= 0);
497 assert_se(wait_for_terminate_and_warn("archseccomp", pid
, true) == EXIT_SUCCESS
);
500 static void test_load_syscall_filter_set_raw(void) {
503 if (!is_seccomp_available())
512 _cleanup_set_free_ Set
*s
= NULL
;
514 assert_se(access("/", F_OK
) >= 0);
515 assert_se(poll(NULL
, 0, 0) == 0);
517 assert_se(seccomp_load_syscall_filter_set_raw(SCMP_ACT_ALLOW
, NULL
, SCMP_ACT_KILL
) >= 0);
518 assert_se(access("/", F_OK
) >= 0);
519 assert_se(poll(NULL
, 0, 0) == 0);
521 assert_se(s
= set_new(NULL
));
522 assert_se(set_put(s
, UINT32_TO_PTR(__NR_access
+ 1)) >= 0);
524 assert_se(seccomp_load_syscall_filter_set_raw(SCMP_ACT_ALLOW
, s
, SCMP_ACT_ERRNO(EUCLEAN
)) >= 0);
526 assert_se(access("/", F_OK
) < 0);
527 assert_se(errno
== EUCLEAN
);
529 assert_se(poll(NULL
, 0, 0) == 0);
533 assert_se(s
= set_new(NULL
));
534 assert_se(set_put(s
, UINT32_TO_PTR(__NR_poll
+ 1)) >= 0);
536 assert_se(seccomp_load_syscall_filter_set_raw(SCMP_ACT_ALLOW
, s
, SCMP_ACT_ERRNO(EUNATCH
)) >= 0);
538 assert_se(access("/", F_OK
) < 0);
539 assert_se(errno
== EUCLEAN
);
541 assert_se(poll(NULL
, 0, 0) < 0);
542 assert_se(errno
== EUNATCH
);
547 assert_se(wait_for_terminate_and_warn("syscallrawseccomp", pid
, true) == EXIT_SUCCESS
);
550 int main(int argc
, char *argv
[]) {
552 log_set_max_level(LOG_DEBUG
);
554 test_seccomp_arch_to_string();
555 test_architecture_table();
556 test_syscall_filter_set_find();
558 test_restrict_namespace();
559 test_protect_sysctl();
560 test_restrict_address_families();
561 test_restrict_realtime();
562 test_memory_deny_write_execute_mmap();
563 test_memory_deny_write_execute_shmat();
564 test_restrict_archs();
565 test_load_syscall_filter_set_raw();