blob: 6eaa8ea82bcf029d97c0c0ed328e7c7b9c69476c [file] [log] [blame]
Dylan Reid837c74a2016-01-22 17:25:21 -08001/* Copyright 2016 The Chromium OS Authors. All rights reserved.
2 * Use of this source code is governed by a BSD-style license that can be
3 * found in the LICENSE file.
4 */
5
Luis Hector Chavez479b95f2016-06-06 08:01:05 -07006#ifndef LIBCONTAINER_LIBCONTAINER_H_
7#define LIBCONTAINER_LIBCONTAINER_H_
Dylan Reid837c74a2016-01-22 17:25:21 -08008
Dylan Reid2bd9ea92016-04-07 20:57:47 -07009#include <stddef.h>
Luis Hector Chavezff5978f2017-06-27 12:52:58 -070010#include <stdint.h>
Luis Hector Chavezda352462018-01-30 09:10:00 -080011#include <sys/resource.h>
Dylan Reid0bb592b2016-11-09 13:34:11 -080012#include <sys/types.h>
Dylan Reid837c74a2016-01-22 17:25:21 -080013
Luis Hector Chavezdac0f662017-09-14 14:41:27 -070014#include <brillo/brillo_export.h>
Luis Hector Chaveze03926a2017-09-28 17:28:49 -070015#include <libminijail.h>
Luis Hector Chavezdac0f662017-09-14 14:41:27 -070016
Dylan Reid837c74a2016-01-22 17:25:21 -080017#ifdef __cplusplus
18extern "C" {
19#endif
20
21struct container_config;
22
23/* Create a container config. */
Luis Hector Chavez1e1fd9d2017-09-15 08:45:33 -070024BRILLO_EXPORT struct container_config* container_config_create(void);
Dylan Reid837c74a2016-01-22 17:25:21 -080025
26/* Destroy a config create with container_config_create. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070027BRILLO_EXPORT void container_config_destroy(struct container_config* c);
Dylan Reid837c74a2016-01-22 17:25:21 -080028
Mike Frysingerb22acdf2017-01-08 02:02:35 -050029/* config_root - Path to the root of the container itself. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070030BRILLO_EXPORT int container_config_config_root(struct container_config* c,
31 const char* config_root);
Mike Frysingerb22acdf2017-01-08 02:02:35 -050032
33/* Get the configured container root path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070034BRILLO_EXPORT const char* container_config_get_config_root(
35 const struct container_config* c);
Mike Frysingerb22acdf2017-01-08 02:02:35 -050036
Dylan Reid837c74a2016-01-22 17:25:21 -080037/* rootfs - Path to the root of the container's filesystem. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070038BRILLO_EXPORT int container_config_rootfs(struct container_config* c,
39 const char* rootfs);
Dylan Reid837c74a2016-01-22 17:25:21 -080040
Dylan Reid11456722016-05-02 11:24:50 -070041/* Get the configured rootfs path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070042BRILLO_EXPORT const char* container_config_get_rootfs(
43 const struct container_config* c);
Dylan Reid11456722016-05-02 11:24:50 -070044
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070045/* rootfs_mount_flags - Flags that will be passed to the mount() call when
46 * mounting the root of the container's filesystem. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070047BRILLO_EXPORT void container_config_rootfs_mount_flags(
48 struct container_config* c, unsigned long flags);
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070049
50/* Get the configured rootfs mount() flags. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070051BRILLO_EXPORT unsigned long container_config_get_rootfs_mount_flags(
52 const struct container_config* c);
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070053
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070054/* runfs - Path to where the container filesystem has been mounted. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070055BRILLO_EXPORT int container_config_premounted_runfs(struct container_config* c,
56 const char* runfs);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070057
58/* Get the pre-mounted runfs path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070059BRILLO_EXPORT const char* container_config_get_premounted_runfs(
60 const struct container_config* c);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070061
62/* The pid of the program will be written here. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070063BRILLO_EXPORT int container_config_pid_file(struct container_config* c,
64 const char* path);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070065
66/* Get the pid file path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070067BRILLO_EXPORT const char* container_config_get_pid_file(
68 const struct container_config* c);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070069
Dylan Reid837c74a2016-01-22 17:25:21 -080070/* The program to run and args, e.g. "/sbin/init", "--second-stage". */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070071BRILLO_EXPORT int container_config_program_argv(struct container_config* c,
72 const char** argv,
73 size_t num_args);
Dylan Reid837c74a2016-01-22 17:25:21 -080074
Dylan Reid11456722016-05-02 11:24:50 -070075/* Get the number of command line args for the program to be run. */
Luis Hector Chavezdac0f662017-09-14 14:41:27 -070076BRILLO_EXPORT size_t
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070077container_config_get_num_program_args(const struct container_config* c);
Dylan Reid11456722016-05-02 11:24:50 -070078
79/* Get the program argument at the given index. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070080BRILLO_EXPORT const char* container_config_get_program_arg(
81 const struct container_config* c, size_t index);
Dylan Reid11456722016-05-02 11:24:50 -070082
Dylan Reid1874feb2016-06-22 17:53:50 -070083/* Sets/Gets the uid the container will run as. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070084BRILLO_EXPORT void container_config_uid(struct container_config* c, uid_t uid);
85BRILLO_EXPORT uid_t container_config_get_uid(const struct container_config* c);
Dylan Reid1874feb2016-06-22 17:53:50 -070086
Dylan Reid837c74a2016-01-22 17:25:21 -080087/* Mapping of UIDs in the container, e.g. "0 100000 1024" */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070088BRILLO_EXPORT int container_config_uid_map(struct container_config* c,
89 const char* uid_map);
Dylan Reid837c74a2016-01-22 17:25:21 -080090
Dylan Reid1874feb2016-06-22 17:53:50 -070091/* Sets/Gets the gid the container will run as. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070092BRILLO_EXPORT void container_config_gid(struct container_config* c, gid_t gid);
93BRILLO_EXPORT gid_t container_config_get_gid(const struct container_config* c);
Dylan Reid1874feb2016-06-22 17:53:50 -070094
Dylan Reid837c74a2016-01-22 17:25:21 -080095/* Mapping of GIDs in the container, e.g. "0 100000 1024" */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070096BRILLO_EXPORT int container_config_gid_map(struct container_config* c,
97 const char* gid_map);
Dylan Reid837c74a2016-01-22 17:25:21 -080098
Risanfd41aee2018-08-15 14:03:38 +090099/* Sets the additional gids the container will run as. */
100BRILLO_EXPORT void container_config_additional_gids(struct container_config* c,
101 const gid_t* gids,
102 size_t num_gids);
103
Dylan Reid837c74a2016-01-22 17:25:21 -0800104/* Alt-Syscall table to use or NULL if none. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700105BRILLO_EXPORT int container_config_alt_syscall_table(
106 struct container_config* c, const char* alt_syscall_table);
Dylan Reid837c74a2016-01-22 17:25:21 -0800107
Dylan Reid93fa4602017-06-06 13:39:31 -0700108/* Add a runtime limit for the contained process. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700109BRILLO_EXPORT int container_config_add_rlimit(struct container_config* c,
110 int type,
Luis Hector Chavezda352462018-01-30 09:10:00 -0800111 rlim_t cur,
112 rlim_t max);
Dylan Reid93fa4602017-06-06 13:39:31 -0700113
Dylan Reid837c74a2016-01-22 17:25:21 -0800114/*
115 * Add a filesystem to mount in the new VFS namespace.
116 *
117 * c - The container config in which to add the mount.
118 * source - Mount source, e.g. "tmpfs" or "/data".
119 * destination - Mount point in the container, e.g. "/dev".
120 * type - Mount type, e.g. "tmpfs", "selinuxfs", or "devpts".
121 * data - Mount data for extra options, e.g. "newinstance" or "ptmxmode=0000".
Mike Frysinger05e594e2017-01-10 02:11:08 -0500122 * verity - dm-verity options (if used).
Mike Frysinger412dbd22017-01-06 01:50:34 -0500123 * flags - Mount flags as defined in mount(2).
Dylan Reid837c74a2016-01-22 17:25:21 -0800124 * uid - uid to chown mount point to if created.
125 * gid - gid to chown mount point to if created.
126 * mode - Permissions of mount point if created.
127 * mount_in_ns - True if mount should happen in the process' vfs namespace.
128 * create - If true, create mount destination if it doesn't exist.
Mike Frysinger412dbd22017-01-06 01:50:34 -0500129 * loopback - If true, set up a loopback device and mount that.
Dylan Reid837c74a2016-01-22 17:25:21 -0800130 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700131BRILLO_EXPORT int container_config_add_mount(struct container_config* c,
132 const char* name,
133 const char* source,
134 const char* destination,
135 const char* type,
136 const char* data,
137 const char* verity,
138 int flags,
139 int uid,
140 int gid,
141 int mode,
142 int mount_in_ns,
143 int create,
144 int loopback);
Dylan Reid837c74a2016-01-22 17:25:21 -0800145
146/*
Dylan Reid4843d6b2017-03-31 18:14:30 -0700147 * Add a device cgroup permission.
148 *
149 * c - The container config in which to add the mount.
150 * allow - If true allow access to the specified r/w/m.
151 * type - 'c', 'b', or 'a' for char, block, or all respectively.
152 * major - Major device number.
153 * minor - Minor device number.
154 * read - If true set reading of device to |allow|.
155 * write - If true set writing of device to |allow|.
156 * modify - If true set modifying of device to |allow|.
157 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700158BRILLO_EXPORT int container_config_add_cgroup_device(struct container_config* c,
159 int allow,
160 char type,
161 int major,
162 int minor,
163 int read,
164 int write,
165 int modify);
Dylan Reid4843d6b2017-03-31 18:14:30 -0700166
167/*
Dylan Reid837c74a2016-01-22 17:25:21 -0800168 * Add a device node to create.
169 *
170 * c - The container config in which to add the mount.
171 * type - 'c' or 'b' for char or block respectively.
172 * path - Where to mknod, "/dev/zero".
173 * fs_permissions - Permissions to set on the node.
174 * major - Major device number.
175 * minor - Minor device number.
Stephen Barber7bae6642017-11-30 10:47:12 -0800176 * copy_major - Overwrite major with the major of the existing device node. If
177 * this is true major will be copied from an existing node. The |major| param
178 * should be set to -1 in this case.
Dylan Reid355d5e42016-04-29 16:53:31 -0700179 * copy_minor - Overwrite minor with the minor of the existing device node. If
180 * this is true minor will be copied from an existing node. The |minor| param
181 * should be set to -1 in this case.
Dylan Reid837c74a2016-01-22 17:25:21 -0800182 * uid - User to own the device.
183 * gid - Group to own the device.
184 * read_allowed - If true allow reading from the device via "devices" cgroup.
185 * write_allowed - If true allow writing to the device via "devices" cgroup.
186 * modify_allowed - If true allow creation of the device via "devices" cgroup.
187 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700188BRILLO_EXPORT int container_config_add_device(struct container_config* c,
189 char type,
190 const char* path,
191 int fs_permissions,
192 int major,
193 int minor,
Stephen Barber7bae6642017-11-30 10:47:12 -0800194 int copy_major,
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700195 int copy_minor,
196 int uid,
197 int gid,
198 int read_allowed,
199 int write_allowed,
200 int modify_allowed);
Dylan Reid837c74a2016-01-22 17:25:21 -0800201
Chinyue Chenfac909e2016-06-24 14:17:42 +0800202/* Set the CPU shares cgroup param for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700203BRILLO_EXPORT int container_config_set_cpu_shares(struct container_config* c,
204 int shares);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800205
206/* Set the CFS CPU cgroup params for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700207BRILLO_EXPORT int container_config_set_cpu_cfs_params(
208 struct container_config* c, int quota, int period);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800209
210/* Set the RT CPU cgroup params for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700211BRILLO_EXPORT int container_config_set_cpu_rt_params(struct container_config* c,
212 int rt_runtime,
213 int rt_period);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800214
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700215BRILLO_EXPORT int container_config_get_cpu_shares(struct container_config* c);
216BRILLO_EXPORT int container_config_get_cpu_quota(struct container_config* c);
217BRILLO_EXPORT int container_config_get_cpu_period(struct container_config* c);
218BRILLO_EXPORT int container_config_get_cpu_rt_runtime(
219 struct container_config* c);
220BRILLO_EXPORT int container_config_get_cpu_rt_period(
221 struct container_config* c);
Chinyue Chen4f3fd682016-07-01 14:11:42 +0800222
Dylan Reid9e724af2016-07-21 09:58:07 -0700223/*
224 * Configure the owner of cgroups created for the container.
225 *
226 * This is needed so the container's cgroup namespace rootdir is accessible
227 * inside the container.
228 *
229 * cgroup_parent - Parent directory under which to create the cgroup.
230 * cgroup_owner - The uid that should own the cgroups that are created.
Dmitry Torokhov14eef722016-09-27 16:40:37 -0700231 * cgroup_group - The gid that should own the cgroups that are created.
Dylan Reid9e724af2016-07-21 09:58:07 -0700232 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700233BRILLO_EXPORT int container_config_set_cgroup_parent(struct container_config* c,
234 const char* parent,
235 uid_t cgroup_owner,
236 gid_t cgroup_group);
Dylan Reid9e724af2016-07-21 09:58:07 -0700237
238/* Get the parent cgroup directory from the config. Here for UT only. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700239BRILLO_EXPORT const char* container_config_get_cgroup_parent(
240 struct container_config* c);
Dylan Reid9e724af2016-07-21 09:58:07 -0700241
Stephen Barber771653f2017-10-04 23:48:57 -0700242/* Set namespaces to be used by the container. */
243BRILLO_EXPORT int container_config_namespaces(
244 struct container_config* c, const char** namespaces, size_t num_ns);
245
246/* Get the number of namespaces to enter. */
247BRILLO_EXPORT size_t
248container_config_get_num_namespaces(const struct container_config* c);
249
250/* Get the namespace at the given index. */
251BRILLO_EXPORT bool container_config_has_namespace(
252 const struct container_config* c, const char* ns);
Keshav Santhanam1b6bf672016-08-10 18:35:12 -0700253
Dylan Reidc4335842016-11-11 10:24:52 -0800254/*
255 * Configures the container so that any FDs open in the parent process are still
256 * visible to the child. Useful for apps that need stdin/stdout/stderr. Use
257 * with caution to avoid leaking other FDs into the namespaced app.
258 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700259BRILLO_EXPORT void container_config_keep_fds_open(struct container_config* c);
Dylan Reidc4335842016-11-11 10:24:52 -0800260
Luis Hector Chavezff5978f2017-06-27 12:52:58 -0700261/*
262 * Sets the capability mask of the container to |capmask|. If |ambient| is 1 it
263 * will additionally set the ambient capability set.
264 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700265BRILLO_EXPORT void container_config_set_capmask(struct container_config* c,
266 uint64_t capmask,
267 int ambient);
Luis Hector Chavezff5978f2017-06-27 12:52:58 -0700268
Luis Hector Chavezcd44ba72017-06-30 13:01:38 -0700269/*
270 * Skips settings the securebits in |securebits_skip_mask| when restricting
271 * capabilities. This is only used when container_config_set_capmask() is used.
272 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700273BRILLO_EXPORT void container_config_set_securebits_skip_mask(
274 struct container_config* c, uint64_t securebits_skip_mask);
Luis Hector Chavezcd44ba72017-06-30 13:01:38 -0700275
Luis Hector Chavezdac65c32017-07-21 10:30:23 -0700276/*
277 * Sets whether the container's entry point should run as init. An init process
278 * is responsible for setting up certain paths within the container (such as
279 * /proc) and performing explicit reaping of zombie processes. The container
280 * will also be torn down if the init process is killed.
281 * The default is true.
282 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700283BRILLO_EXPORT void container_config_set_run_as_init(struct container_config* c,
284 int run_as_init);
Luis Hector Chavezdac65c32017-07-21 10:30:23 -0700285
Luis Hector Chavez15e8e672017-07-20 15:13:27 -0700286/*
287 * Sets the SELinux context under which the container will run.
288 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700289BRILLO_EXPORT int container_config_set_selinux_context(
290 struct container_config* c, const char* context);
Luis Hector Chavez15e8e672017-07-20 15:13:27 -0700291
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700292/*
293 * Sets a pre-execve hook that is run in the child process just before the
294 * container invokes execve(2). If this is used to run a pre-start hook which
295 * should run in the caller's context, a synchronization mechanism (such as a
296 * pair of pipes or sending messages through a unix domain pipe) should be used
297 * to ensure this hook blocks until the pre-start hook finishes running. The
298 * file descriptors used to synchronize this can be passed using
299 * container_config_inherit_fds().
300 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700301BRILLO_EXPORT void container_config_set_pre_execve_hook(
302 struct container_config* c, int (*hook)(void*), void* payload);
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700303
304/*
Luis Hector Chaveze03926a2017-09-28 17:28:49 -0700305 * Adds a hook that will be run, execve(2)-style. This new process will be run
306 * outside the container in the original namespace. Any parameters that are
307 * equal to the magic value "$PID" will be replaced with the container's PID. If
308 * |pstdin_fd|, |pstdout_fd|, or |pstderr_fd| are set to non-null values, they
309 * will contain valid file descriptors that can be used to communicate with the
310 * process.
311 */
312BRILLO_EXPORT int container_config_add_hook(struct container_config* c,
313 minijail_hook_event_t event,
314 const char* filename,
315 const char** argv,
316 size_t num_args,
317 int* pstdin_fd,
318 int* pstdtout_fd,
319 int* pstderr_fd);
320
321/*
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700322 * Sets the set of file descriptors to inherit.
323 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700324BRILLO_EXPORT int container_config_inherit_fds(struct container_config* c,
Luis Hector Chaveza5e87cb2018-05-21 07:21:22 -0700325 const int* inherited_fds,
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700326 size_t inherited_fd_count);
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700327
Dylan Reid837c74a2016-01-22 17:25:21 -0800328/* Container manipulation. */
329struct container;
330
331/*
332 * Create a container based on the given config.
333 *
334 * name - Name of the directory holding the container config files.
335 * rundir - Where to build the temporary rootfs.
Dylan Reid837c74a2016-01-22 17:25:21 -0800336 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700337BRILLO_EXPORT struct container* container_new(const char* name,
338 const char* rundir);
Dylan Reid837c74a2016-01-22 17:25:21 -0800339
340/* Destroy a container created with container_new. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700341BRILLO_EXPORT void container_destroy(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800342
Dylan Reide040c6b2016-05-02 18:49:02 -0700343/* Start the container. Returns 0 on success.
344 * c - The container to run.
345 * config - Details of how the container should be run.
346 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700347BRILLO_EXPORT int container_start(struct container* c,
348 const struct container_config* config);
Dylan Reid837c74a2016-01-22 17:25:21 -0800349
350/* Get the path to the root of the container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700351BRILLO_EXPORT const char* container_root(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800352
353/* Get the pid of the init process in the container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700354BRILLO_EXPORT int container_pid(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800355
356/* Wait for the container to exit. Returns 0 on success. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700357BRILLO_EXPORT int container_wait(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800358
359/* Kill the container's init process, then wait for it to exit. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700360BRILLO_EXPORT int container_kill(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800361
yusukesbbc37a72017-11-21 09:51:54 -0800362/* Dumps the container config. The returned string has to be passed to free()
yusukes32622542018-01-05 18:59:52 -0800363 when it is no longer needed.
364 c - The config to dump.
365 sort_vectors - When not 0, the function sorts the list of mount points,
366 devices, and cgroups before dumping to make it easier to
367 compare two dumps side by side.
368*/
369BRILLO_EXPORT char* container_config_dump(struct container_config* c,
370 int sort_vectors);
yusukesbbc37a72017-11-21 09:51:54 -0800371
Dylan Reid837c74a2016-01-22 17:25:21 -0800372#ifdef __cplusplus
373}; /* extern "C" */
374#endif
375
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700376#endif /* LIBCONTAINER_LIBCONTAINER_H_ */