blob: fc94bebae0d05da5fde1d31df97341e9b634e471 [file] [log] [blame]
Dylan Reid837c74a2016-01-22 17:25:21 -08001/* Copyright 2016 The Chromium OS Authors. All rights reserved.
2 * Use of this source code is governed by a BSD-style license that can be
3 * found in the LICENSE file.
4 */
5
Luis Hector Chavez479b95f2016-06-06 08:01:05 -07006#ifndef LIBCONTAINER_LIBCONTAINER_H_
7#define LIBCONTAINER_LIBCONTAINER_H_
Dylan Reid837c74a2016-01-22 17:25:21 -08008
#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>
#include <sys/resource.h>
#include <sys/types.h>

#include <brillo/brillo_export.h>
#include <libminijail.h>
Luis Hector Chavezdac0f662017-09-14 14:41:27 -070016
Dylan Reid837c74a2016-01-22 17:25:21 -080017#ifdef __cplusplus
18extern "C" {
19#endif
20
21struct container_config;
22
23/* Create a container config. */
Luis Hector Chavez1e1fd9d2017-09-15 08:45:33 -070024BRILLO_EXPORT struct container_config* container_config_create(void);
Dylan Reid837c74a2016-01-22 17:25:21 -080025
/* Destroy a config created with container_config_create. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070027BRILLO_EXPORT void container_config_destroy(struct container_config* c);
Dylan Reid837c74a2016-01-22 17:25:21 -080028
Mike Frysingerb22acdf2017-01-08 02:02:35 -050029/* config_root - Path to the root of the container itself. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070030BRILLO_EXPORT int container_config_config_root(struct container_config* c,
31 const char* config_root);
Mike Frysingerb22acdf2017-01-08 02:02:35 -050032
33/* Get the configured container root path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070034BRILLO_EXPORT const char* container_config_get_config_root(
35 const struct container_config* c);
Mike Frysingerb22acdf2017-01-08 02:02:35 -050036
Dylan Reid837c74a2016-01-22 17:25:21 -080037/* rootfs - Path to the root of the container's filesystem. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070038BRILLO_EXPORT int container_config_rootfs(struct container_config* c,
39 const char* rootfs);
Dylan Reid837c74a2016-01-22 17:25:21 -080040
Dylan Reid11456722016-05-02 11:24:50 -070041/* Get the configured rootfs path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070042BRILLO_EXPORT const char* container_config_get_rootfs(
43 const struct container_config* c);
Dylan Reid11456722016-05-02 11:24:50 -070044
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070045/* rootfs_mount_flags - Flags that will be passed to the mount() call when
46 * mounting the root of the container's filesystem. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070047BRILLO_EXPORT void container_config_rootfs_mount_flags(
48 struct container_config* c, unsigned long flags);
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070049
50/* Get the configured rootfs mount() flags. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070051BRILLO_EXPORT unsigned long container_config_get_rootfs_mount_flags(
52 const struct container_config* c);
Luis Hector Chavezc240e7e2016-09-22 10:33:03 -070053
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070054/* runfs - Path to where the container filesystem has been mounted. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070055BRILLO_EXPORT int container_config_premounted_runfs(struct container_config* c,
56 const char* runfs);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070057
58/* Get the pre-mounted runfs path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070059BRILLO_EXPORT const char* container_config_get_premounted_runfs(
60 const struct container_config* c);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070061
62/* The pid of the program will be written here. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070063BRILLO_EXPORT int container_config_pid_file(struct container_config* c,
64 const char* path);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070065
66/* Get the pid file path. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070067BRILLO_EXPORT const char* container_config_get_pid_file(
68 const struct container_config* c);
Keshav Santhanam0e4c3282016-07-14 10:25:16 -070069
Dylan Reid837c74a2016-01-22 17:25:21 -080070/* The program to run and args, e.g. "/sbin/init", "--second-stage". */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070071BRILLO_EXPORT int container_config_program_argv(struct container_config* c,
72 const char** argv,
73 size_t num_args);
Dylan Reid837c74a2016-01-22 17:25:21 -080074
Dylan Reid11456722016-05-02 11:24:50 -070075/* Get the number of command line args for the program to be run. */
Luis Hector Chavezdac0f662017-09-14 14:41:27 -070076BRILLO_EXPORT size_t
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070077container_config_get_num_program_args(const struct container_config* c);
Dylan Reid11456722016-05-02 11:24:50 -070078
79/* Get the program argument at the given index. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070080BRILLO_EXPORT const char* container_config_get_program_arg(
81 const struct container_config* c, size_t index);
Dylan Reid11456722016-05-02 11:24:50 -070082
Dylan Reid1874feb2016-06-22 17:53:50 -070083/* Sets/Gets the uid the container will run as. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070084BRILLO_EXPORT void container_config_uid(struct container_config* c, uid_t uid);
85BRILLO_EXPORT uid_t container_config_get_uid(const struct container_config* c);
Dylan Reid1874feb2016-06-22 17:53:50 -070086
Dylan Reid837c74a2016-01-22 17:25:21 -080087/* Mapping of UIDs in the container, e.g. "0 100000 1024" */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070088BRILLO_EXPORT int container_config_uid_map(struct container_config* c,
89 const char* uid_map);
Dylan Reid837c74a2016-01-22 17:25:21 -080090
Dylan Reid1874feb2016-06-22 17:53:50 -070091/* Sets/Gets the gid the container will run as. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070092BRILLO_EXPORT void container_config_gid(struct container_config* c, gid_t gid);
93BRILLO_EXPORT gid_t container_config_get_gid(const struct container_config* c);
Dylan Reid1874feb2016-06-22 17:53:50 -070094
Dylan Reid837c74a2016-01-22 17:25:21 -080095/* Mapping of GIDs in the container, e.g. "0 100000 1024" */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -070096BRILLO_EXPORT int container_config_gid_map(struct container_config* c,
97 const char* gid_map);
Dylan Reid837c74a2016-01-22 17:25:21 -080098
99/* Alt-Syscall table to use or NULL if none. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700100BRILLO_EXPORT int container_config_alt_syscall_table(
101 struct container_config* c, const char* alt_syscall_table);
Dylan Reid837c74a2016-01-22 17:25:21 -0800102
Dylan Reid93fa4602017-06-06 13:39:31 -0700103/* Add a runtime limit for the contained process. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700104BRILLO_EXPORT int container_config_add_rlimit(struct container_config* c,
105 int type,
Luis Hector Chavezda352462018-01-30 09:10:00 -0800106 rlim_t cur,
107 rlim_t max);
Dylan Reid93fa4602017-06-06 13:39:31 -0700108
Dylan Reid837c74a2016-01-22 17:25:21 -0800109/*
110 * Add a filesystem to mount in the new VFS namespace.
111 *
112 * c - The container config in which to add the mount.
113 * source - Mount source, e.g. "tmpfs" or "/data".
114 * destination - Mount point in the container, e.g. "/dev".
115 * type - Mount type, e.g. "tmpfs", "selinuxfs", or "devpts".
116 * data - Mount data for extra options, e.g. "newinstance" or "ptmxmode=0000".
Mike Frysinger05e594e2017-01-10 02:11:08 -0500117 * verity - dm-verity options (if used).
Mike Frysinger412dbd22017-01-06 01:50:34 -0500118 * flags - Mount flags as defined in mount(2).
Dylan Reid837c74a2016-01-22 17:25:21 -0800119 * uid - uid to chown mount point to if created.
120 * gid - gid to chown mount point to if created.
121 * mode - Permissions of mount point if created.
122 * mount_in_ns - True if mount should happen in the process' vfs namespace.
123 * create - If true, create mount destination if it doesn't exist.
Mike Frysinger412dbd22017-01-06 01:50:34 -0500124 * loopback - If true, set up a loopback device and mount that.
Dylan Reid837c74a2016-01-22 17:25:21 -0800125 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700126BRILLO_EXPORT int container_config_add_mount(struct container_config* c,
127 const char* name,
128 const char* source,
129 const char* destination,
130 const char* type,
131 const char* data,
132 const char* verity,
133 int flags,
134 int uid,
135 int gid,
136 int mode,
137 int mount_in_ns,
138 int create,
139 int loopback);
Dylan Reid837c74a2016-01-22 17:25:21 -0800140
141/*
Dylan Reid4843d6b2017-03-31 18:14:30 -0700142 * Add a device cgroup permission.
143 *
 * c - The container config in which to add the device cgroup permission.
145 * allow - If true allow access to the specified r/w/m.
146 * type - 'c', 'b', or 'a' for char, block, or all respectively.
147 * major - Major device number.
148 * minor - Minor device number.
149 * read - If true set reading of device to |allow|.
150 * write - If true set writing of device to |allow|.
151 * modify - If true set modifying of device to |allow|.
152 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700153BRILLO_EXPORT int container_config_add_cgroup_device(struct container_config* c,
154 int allow,
155 char type,
156 int major,
157 int minor,
158 int read,
159 int write,
160 int modify);
Dylan Reid4843d6b2017-03-31 18:14:30 -0700161
162/*
Dylan Reid837c74a2016-01-22 17:25:21 -0800163 * Add a device node to create.
164 *
 * c - The container config in which to add the device node.
166 * type - 'c' or 'b' for char or block respectively.
167 * path - Where to mknod, "/dev/zero".
168 * fs_permissions - Permissions to set on the node.
169 * major - Major device number.
170 * minor - Minor device number.
Stephen Barber7bae6642017-11-30 10:47:12 -0800171 * copy_major - Overwrite major with the major of the existing device node. If
172 * this is true major will be copied from an existing node. The |major| param
173 * should be set to -1 in this case.
Dylan Reid355d5e42016-04-29 16:53:31 -0700174 * copy_minor - Overwrite minor with the minor of the existing device node. If
175 * this is true minor will be copied from an existing node. The |minor| param
176 * should be set to -1 in this case.
Dylan Reid837c74a2016-01-22 17:25:21 -0800177 * uid - User to own the device.
178 * gid - Group to own the device.
179 * read_allowed - If true allow reading from the device via "devices" cgroup.
180 * write_allowed - If true allow writing to the device via "devices" cgroup.
181 * modify_allowed - If true allow creation of the device via "devices" cgroup.
182 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700183BRILLO_EXPORT int container_config_add_device(struct container_config* c,
184 char type,
185 const char* path,
186 int fs_permissions,
187 int major,
188 int minor,
Stephen Barber7bae6642017-11-30 10:47:12 -0800189 int copy_major,
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700190 int copy_minor,
191 int uid,
192 int gid,
193 int read_allowed,
194 int write_allowed,
195 int modify_allowed);
Dylan Reid837c74a2016-01-22 17:25:21 -0800196
Chinyue Chenfac909e2016-06-24 14:17:42 +0800197/* Set the CPU shares cgroup param for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700198BRILLO_EXPORT int container_config_set_cpu_shares(struct container_config* c,
199 int shares);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800200
201/* Set the CFS CPU cgroup params for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700202BRILLO_EXPORT int container_config_set_cpu_cfs_params(
203 struct container_config* c, int quota, int period);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800204
205/* Set the RT CPU cgroup params for container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700206BRILLO_EXPORT int container_config_set_cpu_rt_params(struct container_config* c,
207 int rt_runtime,
208 int rt_period);
Chinyue Chenfac909e2016-06-24 14:17:42 +0800209
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700210BRILLO_EXPORT int container_config_get_cpu_shares(struct container_config* c);
211BRILLO_EXPORT int container_config_get_cpu_quota(struct container_config* c);
212BRILLO_EXPORT int container_config_get_cpu_period(struct container_config* c);
213BRILLO_EXPORT int container_config_get_cpu_rt_runtime(
214 struct container_config* c);
215BRILLO_EXPORT int container_config_get_cpu_rt_period(
216 struct container_config* c);
Chinyue Chen4f3fd682016-07-01 14:11:42 +0800217
Dylan Reid9e724af2016-07-21 09:58:07 -0700218/*
219 * Configure the owner of cgroups created for the container.
220 *
221 * This is needed so the container's cgroup namespace rootdir is accessible
222 * inside the container.
223 *
224 * cgroup_parent - Parent directory under which to create the cgroup.
225 * cgroup_owner - The uid that should own the cgroups that are created.
Dmitry Torokhov14eef722016-09-27 16:40:37 -0700226 * cgroup_group - The gid that should own the cgroups that are created.
Dylan Reid9e724af2016-07-21 09:58:07 -0700227 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700228BRILLO_EXPORT int container_config_set_cgroup_parent(struct container_config* c,
229 const char* parent,
230 uid_t cgroup_owner,
231 gid_t cgroup_group);
Dylan Reid9e724af2016-07-21 09:58:07 -0700232
233/* Get the parent cgroup directory from the config. Here for UT only. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700234BRILLO_EXPORT const char* container_config_get_cgroup_parent(
235 struct container_config* c);
Dylan Reid9e724af2016-07-21 09:58:07 -0700236
Stephen Barber771653f2017-10-04 23:48:57 -0700237/* Set namespaces to be used by the container. */
238BRILLO_EXPORT int container_config_namespaces(
239 struct container_config* c, const char** namespaces, size_t num_ns);
240
241/* Get the number of namespaces to enter. */
242BRILLO_EXPORT size_t
243container_config_get_num_namespaces(const struct container_config* c);
244
245/* Get the namespace at the given index. */
246BRILLO_EXPORT bool container_config_has_namespace(
247 const struct container_config* c, const char* ns);
Keshav Santhanam1b6bf672016-08-10 18:35:12 -0700248
Dylan Reidc4335842016-11-11 10:24:52 -0800249/*
250 * Configures the container so that any FDs open in the parent process are still
251 * visible to the child. Useful for apps that need stdin/stdout/stderr. Use
252 * with caution to avoid leaking other FDs into the namespaced app.
253 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700254BRILLO_EXPORT void container_config_keep_fds_open(struct container_config* c);
Dylan Reidc4335842016-11-11 10:24:52 -0800255
Luis Hector Chavezff5978f2017-06-27 12:52:58 -0700256/*
257 * Sets the capability mask of the container to |capmask|. If |ambient| is 1 it
258 * will additionally set the ambient capability set.
259 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700260BRILLO_EXPORT void container_config_set_capmask(struct container_config* c,
261 uint64_t capmask,
262 int ambient);
Luis Hector Chavezff5978f2017-06-27 12:52:58 -0700263
Luis Hector Chavezcd44ba72017-06-30 13:01:38 -0700264/*
 * Skips setting the securebits in |securebits_skip_mask| when restricting
266 * capabilities. This is only used when container_config_set_capmask() is used.
267 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700268BRILLO_EXPORT void container_config_set_securebits_skip_mask(
269 struct container_config* c, uint64_t securebits_skip_mask);
Luis Hector Chavezcd44ba72017-06-30 13:01:38 -0700270
Luis Hector Chavezdac65c32017-07-21 10:30:23 -0700271/*
272 * Sets whether the container's entry point should run as init. An init process
273 * is responsible for setting up certain paths within the container (such as
274 * /proc) and performing explicit reaping of zombie processes. The container
275 * will also be torn down if the init process is killed.
276 * The default is true.
277 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700278BRILLO_EXPORT void container_config_set_run_as_init(struct container_config* c,
279 int run_as_init);
Luis Hector Chavezdac65c32017-07-21 10:30:23 -0700280
Luis Hector Chavez15e8e672017-07-20 15:13:27 -0700281/*
282 * Sets the SELinux context under which the container will run.
283 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700284BRILLO_EXPORT int container_config_set_selinux_context(
285 struct container_config* c, const char* context);
Luis Hector Chavez15e8e672017-07-20 15:13:27 -0700286
/*
 * Sets a pre-execve hook that is run in the child process just before the
 * container invokes execve(2). If this is used to run a pre-start hook which
 * should run in the caller's context, a synchronization mechanism (such as a
 * pair of pipes or sending messages through a unix domain socket) should be
 * used to ensure this hook blocks until the pre-start hook finishes running.
 * The file descriptors used to synchronize this can be passed using
 * container_config_inherit_fds().
 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700296BRILLO_EXPORT void container_config_set_pre_execve_hook(
297 struct container_config* c, int (*hook)(void*), void* payload);
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700298
299/*
Luis Hector Chaveze03926a2017-09-28 17:28:49 -0700300 * Adds a hook that will be run, execve(2)-style. This new process will be run
301 * outside the container in the original namespace. Any parameters that are
302 * equal to the magic value "$PID" will be replaced with the container's PID. If
303 * |pstdin_fd|, |pstdout_fd|, or |pstderr_fd| are set to non-null values, they
304 * will contain valid file descriptors that can be used to communicate with the
305 * process.
306 */
307BRILLO_EXPORT int container_config_add_hook(struct container_config* c,
308 minijail_hook_event_t event,
309 const char* filename,
310 const char** argv,
311 size_t num_args,
312 int* pstdin_fd,
313 int* pstdtout_fd,
314 int* pstderr_fd);
315
316/*
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700317 * Sets the set of file descriptors to inherit.
318 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700319BRILLO_EXPORT int container_config_inherit_fds(struct container_config* c,
Luis Hector Chaveza5e87cb2018-05-21 07:21:22 -0700320 const int* inherited_fds,
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700321 size_t inherited_fd_count);
Luis Hector Chavezf8e8f4c2017-08-01 01:09:39 -0700322
Dylan Reid837c74a2016-01-22 17:25:21 -0800323/* Container manipulation. */
324struct container;
325
326/*
327 * Create a container based on the given config.
328 *
329 * name - Name of the directory holding the container config files.
330 * rundir - Where to build the temporary rootfs.
Dylan Reid837c74a2016-01-22 17:25:21 -0800331 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700332BRILLO_EXPORT struct container* container_new(const char* name,
333 const char* rundir);
Dylan Reid837c74a2016-01-22 17:25:21 -0800334
335/* Destroy a container created with container_new. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700336BRILLO_EXPORT void container_destroy(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800337
Dylan Reide040c6b2016-05-02 18:49:02 -0700338/* Start the container. Returns 0 on success.
339 * c - The container to run.
340 * config - Details of how the container should be run.
341 */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700342BRILLO_EXPORT int container_start(struct container* c,
343 const struct container_config* config);
Dylan Reid837c74a2016-01-22 17:25:21 -0800344
345/* Get the path to the root of the container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700346BRILLO_EXPORT const char* container_root(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800347
348/* Get the pid of the init process in the container. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700349BRILLO_EXPORT int container_pid(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800350
351/* Wait for the container to exit. Returns 0 on success. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700352BRILLO_EXPORT int container_wait(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800353
354/* Kill the container's init process, then wait for it to exit. */
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700355BRILLO_EXPORT int container_kill(struct container* c);
Dylan Reid837c74a2016-01-22 17:25:21 -0800356
yusukesbbc37a72017-11-21 09:51:54 -0800357/* Dumps the container config. The returned string has to be passed to free()
yusukes32622542018-01-05 18:59:52 -0800358 when it is no longer needed.
359 c - The config to dump.
360 sort_vectors - When not 0, the function sorts the list of mount points,
361 devices, and cgroups before dumping to make it easier to
362 compare two dumps side by side.
363*/
364BRILLO_EXPORT char* container_config_dump(struct container_config* c,
365 int sort_vectors);
yusukesbbc37a72017-11-21 09:51:54 -0800366
Dylan Reid837c74a2016-01-22 17:25:21 -0800367#ifdef __cplusplus
368}; /* extern "C" */
369#endif
370
Luis Hector Chavez31735bc2017-09-15 08:17:10 -0700371#endif /* LIBCONTAINER_LIBCONTAINER_H_ */