2017-11-18 17:09:20 +01:00
|
|
|
/* SPDX-License-Identifier: LGPL-2.1+ */
|
2014-02-13 00:24:00 +01:00
|
|
|
#pragma once
|
|
|
|
|
2014-12-12 02:35:39 +01:00
|
|
|
#include <seccomp.h>
|
2016-10-21 21:48:10 +02:00
|
|
|
#include <stdbool.h>
|
2015-12-03 21:13:37 +01:00
|
|
|
#include <stdint.h>
|
2014-02-13 00:24:00 +01:00
|
|
|
|
seccomp: rework seccomp code, to improve compat with some archs
This substantially reworks the seccomp code, to ensure better
compatibility with some architectures, including i386.
So far we relied on libseccomp's internal handling of the multiple
syscall ABIs supported on Linux. This is problematic however, as it does
not define clear semantics if an ABI is not able to support specific
seccomp rules we install.
This rework hence changes a couple of things:
- We no longer use seccomp_rule_add(), but only
seccomp_rule_add_exact(), and fail the installation of a filter if the
architecture doesn't support it.
- We no longer rely on adding multiple syscall architectures to a single filter,
but instead install a separate filter for each syscall architecture
supported. This way, we can install a strict filter for x86-64, while
permitting a less strict filter for i386.
- All high-level filter additions are now moved from execute.c to
seccomp-util.c, so that we can test them independently of the service
execution logic.
- Tests have been added for all types of our seccomp filters.
- SystemCallFilter= and SystemCallArchitectures= are now implemented in
independent filters and installation logic, as they semantically are
very much independent of each other.
Fixes: #4575
2016-12-27 15:28:25 +01:00
|
|
|
#include "set.h"
|
|
|
|
|
2014-02-13 00:24:00 +01:00
|
|
|
/* Takes a 32-bit value and returns a constant string; defined in another translation unit.
 * NOTE(review): judging by the name, `c` is a seccomp architecture identifier and the
 * result is its textual name; the result for an unknown value (NULL?) is not visible
 * here — confirm against the definition. */
const char* seccomp_arch_to_string(uint32_t c);
|
|
|
|
/* Takes a string `n` and an output pointer `ret`; returns an int status.
 * NOTE(review): presumably the inverse of seccomp_arch_to_string(), storing the parsed
 * architecture in *ret and returning 0 on success or a negative errno-style value on
 * failure — confirm against the definition. */
int seccomp_arch_from_string(const char *n, uint32_t *ret);
|
2014-02-18 22:14:00 +01:00
|
|
|
|
seccomp: rework seccomp code, to improve compat with some archs
This substantially reworks the seccomp code, to ensure better
compatibility with some architectures, including i386.
So far we relied on libseccomp's internal handling of the multiple
syscall ABIs supported on Linux. This is problematic however, as it does
not define clear semantics if an ABI is not able to support specific
seccomp rules we install.
This rework hence changes a couple of things:
- We no longer use seccomp_rule_add(), but only
seccomp_rule_add_exact(), and fail the installation of a filter if the
architecture doesn't support it.
- We no longer rely on adding multiple syscall architectures to a single filter,
but instead install a separate filter for each syscall architecture
supported. This way, we can install a strict filter for x86-64, while
permitting a less strict filter for i386.
- All high-level filter additions are now moved from execute.c to
seccomp-util.c, so that we can test them independently of the service
execution logic.
- Tests have been added for all types of our seccomp filters.
- SystemCallFilter= and SystemCallArchitectures= are now implemented in
independent filters and installation logic, as they semantically are
very much independent of each other.
Fixes: #4575
2016-12-27 15:28:25 +01:00
|
|
|
/* Takes an output filter context pointer, an architecture value and a default action;
 * returns an int status.
 * NOTE(review): presumably allocates a libseccomp filter context that covers only `arch`
 * and hands it back through *ret; ownership and error conventions are not visible in
 * this header — confirm against the definition. */
int seccomp_init_for_arch(scmp_filter_ctx *ret, uint32_t arch, uint32_t default_action);
|
2016-06-01 11:56:01 +02:00
|
|
|
|
2016-08-22 21:40:58 +02:00
|
|
|
/* Takes no arguments and returns a bool.
 * NOTE(review): by its name, reports whether seccomp filtering can be used on the running
 * system; how this is probed (and whether the answer is cached) is not visible here. */
bool is_seccomp_available(void);
|
|
|
|
|
2016-10-21 21:50:05 +02:00
|
|
|
/* Describes one named set of system calls. All three members are pointers to constant
 * C strings.
 * NOTE(review): `name` is presumably the set identifier that syscall_filter_set_find()
 * matches on, `help` a human-readable description, and `value` the encoded list of
 * members; the encoding of `value` is not visible in this header — confirm against the
 * table definition. */
typedef struct SyscallFilterSet {
        const char *name;
        const char *help;
        const char *value;
} SyscallFilterSet;
|
|
|
|
|
|
|
|
/* Identifiers for the predefined syscall filter sets. Values are assigned implicitly,
 * starting at 0 for SYSCALL_FILTER_SET_DEFAULT and increasing by one per entry, so
 * _SYSCALL_FILTER_SET_MAX equals the number of sets.
 * NOTE(review): presumably these are the indexes into syscall_filter_sets[] — confirm
 * against the table definition. */
enum {
        /* Please leave DEFAULT first, but sort the rest alphabetically */
        SYSCALL_FILTER_SET_DEFAULT,
        SYSCALL_FILTER_SET_AIO,
        SYSCALL_FILTER_SET_BASIC_IO,
        SYSCALL_FILTER_SET_CHOWN,
        SYSCALL_FILTER_SET_CLOCK,
        SYSCALL_FILTER_SET_CPU_EMULATION,
        SYSCALL_FILTER_SET_DEBUG,
        SYSCALL_FILTER_SET_FILE_SYSTEM,
        SYSCALL_FILTER_SET_IO_EVENT,
        SYSCALL_FILTER_SET_IPC,
        SYSCALL_FILTER_SET_KEYRING,
        SYSCALL_FILTER_SET_MEMLOCK,
        SYSCALL_FILTER_SET_MODULE,
        SYSCALL_FILTER_SET_MOUNT,
        SYSCALL_FILTER_SET_NETWORK_IO,
        SYSCALL_FILTER_SET_OBSOLETE,
        SYSCALL_FILTER_SET_PRIVILEGED,
        SYSCALL_FILTER_SET_PROCESS,
        SYSCALL_FILTER_SET_RAW_IO,
        SYSCALL_FILTER_SET_REBOOT,
        SYSCALL_FILTER_SET_RESOURCES,
        SYSCALL_FILTER_SET_SETUID,
        SYSCALL_FILTER_SET_SIGNAL,
        SYSCALL_FILTER_SET_SWAP,
        SYSCALL_FILTER_SET_SYNC,
        SYSCALL_FILTER_SET_SYSTEM_SERVICE,
        SYSCALL_FILTER_SET_TIMER,
        _SYSCALL_FILTER_SET_MAX
};
|
|
|
|
|
|
|
|
/* Read-only table of SyscallFilterSet entries, defined in another translation unit. The
 * array bound is not stated in this declaration.
 * NOTE(review): presumably holds _SYSCALL_FILTER_SET_MAX entries indexed by the
 * SYSCALL_FILTER_SET_* constants — confirm against the definition. */
extern const SyscallFilterSet syscall_filter_sets[];
|
|
|
|
|
|
|
|
/* Takes a name string and returns a pointer to a constant SyscallFilterSet.
 * NOTE(review): presumably looks the name up in syscall_filter_sets[] and returns NULL
 * when nothing matches — confirm against the definition. */
const SyscallFilterSet *syscall_filter_set_find(const char *name);
|
|
|
|
|
2017-11-11 13:35:49 +01:00
|
|
|
/* Takes a Hashmap, a bool and a SyscallFilterSet; returns an int status.
 * NOTE(review): presumably adds the members of `set` to `s` when `b` is true and removes
 * them otherwise; the key/value layout of the hashmap is not visible here — confirm
 * against the definition. */
int seccomp_filter_set_add(Hashmap *s, bool b, const SyscallFilterSet *set);
|
2017-08-09 16:09:04 +02:00
|
|
|
|
2018-09-24 16:59:12 +02:00
|
|
|
/* Takes a filter context, a name, an action value, a string vector `exclude` and a
 * `log_missing` flag; returns an int status.
 * NOTE(review): presumably adds a rule with `action` for the syscall (or syscall set)
 * called `name`, skipping anything listed in `exclude`, with `log_missing` controlling
 * whether unknown names are logged — confirm against the definition. */
int seccomp_add_syscall_filter_item(scmp_filter_ctx *ctx, const char *name, uint32_t action, char **exclude, bool log_missing);
|
2017-09-10 19:10:29 +02:00
|
|
|
|
2018-09-24 16:59:12 +02:00
|
|
|
/* Takes a default action, a SyscallFilterSet, an action for that set and a `log_missing`
 * flag; returns an int status.
 * NOTE(review): presumably builds and loads a filter that applies `action` to the
 * members of `set` and `default_action` to everything else — confirm against the
 * definition. */
int seccomp_load_syscall_filter_set(uint32_t default_action, const SyscallFilterSet *set, uint32_t action, bool log_missing);
|
|
|
|
/* Same parameter list as seccomp_load_syscall_filter_set(), except that the set is passed
 * as a Hashmap rather than a SyscallFilterSet.
 * NOTE(review): what the hashmap keys and values encode is not visible in this header —
 * confirm against the definition. */
int seccomp_load_syscall_filter_set_raw(uint32_t default_action, Hashmap* set, uint32_t action, bool log_missing);
|
2016-11-02 03:25:19 +01:00
|
|
|
|
2018-02-26 12:51:35 +01:00
|
|
|
/* Bit flags accepted by seccomp_parse_syscall_filter_full() and
 * seccomp_parse_syscall_filter(). Each constant occupies a distinct bit, so values can
 * be combined with bitwise OR.
 * NOTE(review): the per-flag notes below are inferred from the names only — confirm
 * against the parser implementation. */
typedef enum SeccompParseFlags {
        SECCOMP_PARSE_INVERT     = 1 << 0, /* presumably: the entry is negated */
        SECCOMP_PARSE_WHITELIST  = 1 << 1, /* presumably: the filter is an allow list */
        SECCOMP_PARSE_LOG        = 1 << 2, /* presumably: log problems while parsing */
        SECCOMP_PARSE_PERMISSIVE = 1 << 3, /* presumably: tolerate unknown entries */
} SeccompParseFlags;
|
|
|
|
|
|
|
|
/* Takes a name, an errno number, a Hashmap, a set of SeccompParseFlags and a
 * unit/filename/line triple; returns an int status. The inline wrapper
 * seccomp_parse_syscall_filter() calls this with NULL, NULL, 0 for the last three
 * arguments.
 * NOTE(review): presumably parses one filter entry `name` into `filter`, with
 * `unit`/`filename`/`line` used only to give log messages a source location — confirm
 * against the definition. */
int seccomp_parse_syscall_filter_full(
                const char *name, int errno_num, Hashmap *filter, SeccompParseFlags flags,
                const char *unit, const char *filename, unsigned line);
|
|
|
|
|
|
|
|
/* Convenience wrapper around seccomp_parse_syscall_filter_full(): forwards `name`,
 * `errno_num`, `filter` and `flags` unchanged, passes NULL for the unit and filename and
 * 0 for the line number, and returns the callee's result as-is. */
static inline int seccomp_parse_syscall_filter(const char *name, int errno_num, Hashmap *filter, SeccompParseFlags flags) {
        return seccomp_parse_syscall_filter_full(name, errno_num, filter, flags, NULL, NULL, 0);
}
|
|
|
|
|
seccomp: rework seccomp code, to improve compat with some archs
This substantially reworks the seccomp code, to ensure better
compatibility with some architectures, including i386.
So far we relied on libseccomp's internal handling of the multiple
syscall ABIs supported on Linux. This is problematic however, as it does
not define clear semantics if an ABI is not able to support specific
seccomp rules we install.
This rework hence changes a couple of things:
- We no longer use seccomp_rule_add(), but only
seccomp_rule_add_exact(), and fail the installation of a filter if the
architecture doesn't support it.
- We no longer rely on adding multiple syscall architectures to a single filter,
but instead install a separate filter for each syscall architecture
supported. This way, we can install a strict filter for x86-64, while
permitting a less strict filter for i386.
- All high-level filter additions are now moved from execute.c to
seccomp-util.c, so that we can test them independently of the service
execution logic.
- Tests have been added for all types of our seccomp filters.
- SystemCallFilter= and SystemCallArchitectures= are now implemented in
independent filters and installation logic, as they semantically are
very much independent of each other.
Fixes: #4575
2016-12-27 15:28:25 +01:00
|
|
|
/* Takes a Set of architectures and returns an int status.
 * NOTE(review): presumably installs a filter that blocks system calls made through any
 * architecture not contained in `archs`; how architectures are stored in the Set is not
 * visible here — confirm against the definition. */
int seccomp_restrict_archs(Set *archs);
|
2016-11-02 03:25:19 +01:00
|
|
|
/* Takes an unsigned long `retain` and returns an int status.
 * NOTE(review): presumably `retain` is a mask of namespace flags that stay permitted
 * while all other namespace operations are blocked — confirm against the definition. */
int seccomp_restrict_namespaces(unsigned long retain);
|
seccomp: rework seccomp code, to improve compat with some archs
This substantially reworks the seccomp code, to ensure better
compatibility with some architectures, including i386.
So far we relied on libseccomp's internal handling of the multiple
syscall ABIs supported on Linux. This is problematic however, as it does
not define clear semantics if an ABI is not able to support specific
seccomp rules we install.
This rework hence changes a couple of things:
- We no longer use seccomp_rule_add(), but only
seccomp_rule_add_exact(), and fail the installation of a filter if the
architecture doesn't support it.
- We no longer rely on adding multiple syscall architectures to a single filter,
but instead install a separate filter for each syscall architecture
supported. This way, we can install a strict filter for x86-64, while
permitting a less strict filter for i386.
- All high-level filter additions are now moved from execute.c to
seccomp-util.c, so that we can test them independently of the service
execution logic.
- Tests have been added for all types of our seccomp filters.
- SystemCallFilter= and SystemCallArchitectures= are now implemented in
independent filters and installation logic, as they semantically are
very much independent of each other.
Fixes: #4575
2016-12-27 15:28:25 +01:00
|
|
|
/* Takes no arguments and returns an int status.
 * NOTE(review): presumably installs a filter that blocks the sysctl system call —
 * confirm against the definition. */
int seccomp_protect_sysctl(void);
|
|
|
|
/* Takes a Set of address families and a `whitelist` flag; returns an int status.
 * NOTE(review): presumably `whitelist` selects whether the listed families are the only
 * ones allowed (true) or the ones to block (false) — confirm against the definition. */
int seccomp_restrict_address_families(Set *address_families, bool whitelist);
|
|
|
|
/* Takes no arguments and returns an int status.
 * NOTE(review): presumably installs a filter that prevents switching to realtime
 * scheduling policies — confirm against the definition. */
int seccomp_restrict_realtime(void);
|
|
|
|
/* Takes no arguments and returns an int status.
 * NOTE(review): presumably installs a filter that rejects memory mappings which are both
 * writable and executable — confirm against the definition. */
int seccomp_memory_deny_write_execute(void);
|
2017-07-04 14:48:18 +02:00
|
|
|
/* Takes an unsigned long `personality` and returns an int status.
 * NOTE(review): presumably installs a filter that only lets the personality system call
 * select the given value — confirm against the definition. */
int seccomp_lock_personality(unsigned long personality);
|
seccomp: rework seccomp code, to improve compat with some archs
This substantially reworks the seccomp code, to ensure better
compatibility with some architectures, including i386.
So far we relied on libseccomp's internal handling of the multiple
syscall ABIs supported on Linux. This is problematic however, as it does
not define clear semantics if an ABI is not able to support specific
seccomp rules we install.
This rework hence changes a couple of things:
- We no longer use seccomp_rule_add(), but only
seccomp_rule_add_exact(), and fail the installation of a filter if the
architecture doesn't support it.
- We no longer rely on adding multiple syscall architectures to a single filter,
but instead install a separate filter for each syscall architecture
supported. This way, we can install a strict filter for x86-64, while
permitting a less strict filter for i386.
- All high-level filter additions are now moved from execute.c to
seccomp-util.c, so that we can test them independently of the service
execution logic.
- Tests have been added for all types of our seccomp filters.
- SystemCallFilter= and SystemCallArchitectures= are now implemented in
independent filters and installation logic, as they semantically are
very much independent of each other.
Fixes: #4575
2016-12-27 15:28:25 +01:00
|
|
|
|
|
|
|
/* Read-only array of 32-bit architecture values, defined in another translation unit.
 * SECCOMP_FOREACH_LOCAL_ARCH() walks it until it reaches an element equal to
 * (uint32_t) -1, so the array is expected to end with that sentinel. */
extern const uint32_t seccomp_local_archs[];
|
|
|
|
|
|
|
|
/* Loop header that iterates over seccomp_local_archs[]: `arch` is assigned element 0
 * before the first iteration and the next element after each pass, and the loop ends
 * when the current element equals (uint32_t) -1. On exit `arch` holds that sentinel.
 *
 * `arch` must be an assignable lvalue and is evaluated more than once. The initializer
 * is a GNU statement expression, so it both assigns `arch` and yields 0 as the starting
 * value of the loop-local counter `_i`. */
#define SECCOMP_FOREACH_LOCAL_ARCH(arch)                                \
        for (unsigned _i = ({ (arch) = seccomp_local_archs[0]; 0; });   \
             seccomp_local_archs[_i] != (uint32_t) -1;                  \
             (arch) = seccomp_local_archs[++_i])
|
|
|
|
|
|
|
|
/* Invokes the project macro DEFINE_TRIVIAL_CLEANUP_FUNC with the type scmp_filter_ctx and
 * the function seccomp_release.
 * NOTE(review): the macro is defined elsewhere; presumably it generates a cleanup helper
 * that calls seccomp_release() on a scmp_filter_ctx variable when it goes out of scope —
 * confirm the generated name and its NULL handling in the macro definition. */
DEFINE_TRIVIAL_CLEANUP_FUNC(scmp_filter_ctx, seccomp_release);
|
2017-08-02 06:46:45 +02:00
|
|
|
|
|
|
|
/* Takes a string vector `l` and an output pointer to a Set; returns an int status.
 * NOTE(review): presumably parses each string in `l` as an architecture name and returns
 * the collected set through *archs; who owns the resulting Set is not visible here —
 * confirm against the definition. */
int parse_syscall_archs(char **l, Set **archs);
|