blob: 52925c23d3d9160ff6680421f90b299195d0dc38 [file] [log] [blame]
Jes Sorensen86b645e2010-06-10 11:42:19 +02001/*
2 * os-posix.c
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 * Copyright (c) 2010 Red Hat, Inc.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
25
Peter Maydelld38ea872016-01-29 17:50:05 +000026#include "qemu/osdep.h"
Fiona Ebner03e471c2023-12-18 11:13:40 +010027#include <sys/resource.h>
Jes Sorensen8d963e62010-06-10 11:42:22 +020028#include <sys/wait.h>
Jes Sorensen8847cfe2010-06-10 11:42:26 +020029#include <pwd.h>
Stefan Hajnoczicc4662f2011-07-09 10:22:07 +010030#include <grp.h>
Jes Sorensen61705402010-06-10 11:42:23 +020031#include <libgen.h>
Jes Sorensen86b645e2010-06-10 11:42:19 +020032
Thomas Huthf853ac62016-01-13 09:05:32 +010033#include "qemu/error-report.h"
Dimitris Aragiorgis96c33a42016-02-18 13:38:38 +020034#include "qemu/log.h"
Philippe Mathieu-Daudé32cad1f2024-12-03 15:20:13 +010035#include "system/runstate.h"
Veronia Bahaaf348b6d2016-03-20 19:16:19 +020036#include "qemu/cutils.h"
Jes Sorensen86b645e2010-06-10 11:42:19 +020037
Jes Sorensence798cf2010-06-10 11:42:31 +020038#ifdef CONFIG_LINUX
39#include <sys/prctl.h>
Jes Sorensen949d31e2010-10-26 10:39:22 +020040#endif
41
Jes Sorensen8847cfe2010-06-10 11:42:26 +020042
Jes Sorensenfe98ac12010-06-10 11:42:21 +020043void os_setup_early_signal_handling(void)
Jes Sorensen86b645e2010-06-10 11:42:19 +020044{
45 struct sigaction act;
46 sigfillset(&act.sa_mask);
47 act.sa_flags = 0;
48 act.sa_handler = SIG_IGN;
49 sigaction(SIGPIPE, &act, NULL);
50}
Jes Sorensen8d963e62010-06-10 11:42:22 +020051
Gleb Natapovf64622c2011-03-15 13:56:04 +020052static void termsig_handler(int signal, siginfo_t *info, void *c)
Jes Sorensen8d963e62010-06-10 11:42:22 +020053{
Gleb Natapovf64622c2011-03-15 13:56:04 +020054 qemu_system_killed(info->si_signo, info->si_pid);
Jes Sorensen8d963e62010-06-10 11:42:22 +020055}
56
Jes Sorensen8d963e62010-06-10 11:42:22 +020057void os_setup_signal_handling(void)
58{
59 struct sigaction act;
60
61 memset(&act, 0, sizeof(act));
Gleb Natapovf64622c2011-03-15 13:56:04 +020062 act.sa_sigaction = termsig_handler;
63 act.sa_flags = SA_SIGINFO;
Jes Sorensen8d963e62010-06-10 11:42:22 +020064 sigaction(SIGINT, &act, NULL);
65 sigaction(SIGHUP, &act, NULL);
66 sigaction(SIGTERM, &act, NULL);
Jes Sorensen8d963e62010-06-10 11:42:22 +020067}
Jes Sorensen61705402010-06-10 11:42:23 +020068
/*
 * Change the name of the running process to @s.
 *
 * Where PR_SET_NAME is available, @s is copied into a 16-byte buffer
 * with pstrcpy() and handed to prctl(); a NULL @s is silently ignored.
 * A prctl() failure is reported and the process exits with status 1.
 *
 * Where PR_SET_NAME is not available, any call reports an error and
 * exits with status 1.
 */
void os_set_proc_name(const char *s)
{
#if !defined(PR_SET_NAME)
    error_report("Change of process name not supported by your OS");
    exit(1);
#else
    char comm[16];

    if (s == NULL) {
        return;
    }

    pstrcpy(comm, sizeof(comm), s);

    /*
     * argv[0] is deliberately left alone: rewriting it is more involved,
     * and setting the name this way is sufficient for tools like `top'.
     */
    if (prctl(PR_SET_NAME, comm) != 0) {
        error_report("unable to change process name: %s", strerror(errno));
        exit(1);
    }
#endif
}
87
Michael Tokarev433aed52023-09-01 13:12:59 +030088
/*
 * Identity to switch to when privileges are dropped.
 * Must set all three of these at once.
 *
 * Legal combinations:
 *
 *                unset     by name     by uid
 *   user_pwd     NULL      non-NULL    NULL
 *   user_uid     -1        -1          >=0
 *   user_gid     -1        -1          >=0
 */
static struct passwd *user_pwd;
static uid_t user_uid = (uid_t)-1;
static gid_t user_gid = (gid_t)-1;
96
Michael Tokarev22d02512023-09-01 13:12:56 +030097/*
Philippe Mathieu-Daudéd2803372023-10-04 14:00:07 +020098 * Prepare to change user ID. user_id can be one of 3 forms:
Michael Tokarev22d02512023-09-01 13:12:56 +030099 * - a username, in which case user ID will be changed to its uid,
100 * with primary and supplementary groups set up too;
101 * - a numeric uid, in which case only the uid will be set;
102 * - a pair of numeric uid:gid.
103 */
Philippe Mathieu-Daudéd2803372023-10-04 14:00:07 +0200104bool os_set_runas(const char *user_id)
Ian Jackson2c42f1e2017-09-15 18:10:44 +0100105{
106 unsigned long lv;
107 const char *ep;
108 uid_t got_uid;
109 gid_t got_gid;
110 int rc;
111
Philippe Mathieu-Daudéd2803372023-10-04 14:00:07 +0200112 user_pwd = getpwnam(user_id);
Michael Tokarev22d02512023-09-01 13:12:56 +0300113 if (user_pwd) {
114 user_uid = -1;
115 user_gid = -1;
116 return true;
117 }
118
Philippe Mathieu-Daudéd2803372023-10-04 14:00:07 +0200119 rc = qemu_strtoul(user_id, &ep, 0, &lv);
Ian Jackson2c42f1e2017-09-15 18:10:44 +0100120 got_uid = lv; /* overflow here is ID in C99 */
121 if (rc || *ep != ':' || got_uid != lv || got_uid == (uid_t)-1) {
122 return false;
123 }
124
125 rc = qemu_strtoul(ep + 1, 0, 0, &lv);
126 got_gid = lv; /* overflow here is ID in C99 */
127 if (rc || got_gid != lv || got_gid == (gid_t)-1) {
128 return false;
129 }
130
131 user_pwd = NULL;
132 user_uid = got_uid;
133 user_gid = got_gid;
134 return true;
135}
136
Jes Sorensene06eb602010-06-10 11:42:29 +0200137static void change_process_uid(void)
Jes Sorensen8847cfe2010-06-10 11:42:26 +0200138{
Ian Jackson2c42f1e2017-09-15 18:10:44 +0100139 assert((user_uid == (uid_t)-1) || user_pwd == NULL);
140 assert((user_uid == (uid_t)-1) ==
141 (user_gid == (gid_t)-1));
142
143 if (user_pwd || user_uid != (uid_t)-1) {
144 gid_t intended_gid = user_pwd ? user_pwd->pw_gid : user_gid;
145 uid_t intended_uid = user_pwd ? user_pwd->pw_uid : user_uid;
146 if (setgid(intended_gid) < 0) {
147 error_report("Failed to setgid(%d)", intended_gid);
Jes Sorensen8847cfe2010-06-10 11:42:26 +0200148 exit(1);
149 }
Ian Jackson2c42f1e2017-09-15 18:10:44 +0100150 if (user_pwd) {
151 if (initgroups(user_pwd->pw_name, user_pwd->pw_gid) < 0) {
152 error_report("Failed to initgroups(\"%s\", %d)",
153 user_pwd->pw_name, user_pwd->pw_gid);
154 exit(1);
155 }
156 } else {
157 if (setgroups(1, &user_gid) < 0) {
158 error_report("Failed to setgroups(1, [%d])",
159 user_gid);
160 exit(1);
161 }
Stefan Hajnoczicc4662f2011-07-09 10:22:07 +0100162 }
Ian Jackson2c42f1e2017-09-15 18:10:44 +0100163 if (setuid(intended_uid) < 0) {
164 error_report("Failed to setuid(%d)", intended_uid);
Jes Sorensen8847cfe2010-06-10 11:42:26 +0200165 exit(1);
166 }
167 if (setuid(0) != -1) {
Ian Jacksonf0a21712018-04-16 15:08:03 +0100168 error_report("Dropping privileges failed");
Jes Sorensen8847cfe2010-06-10 11:42:26 +0200169 exit(1);
170 }
171 }
172}
Jes Sorensen07663792010-06-10 11:42:27 +0200173
Michael Tokarev433aed52023-09-01 13:12:59 +0300174
/* Directory to chroot() into in change_root(); NULL means no chroot. */
static const char *chroot_dir;

/*
 * Record @path as the chroot target.  Only the pointer is stored, no
 * copy of the string is made.
 */
void os_set_chroot(const char *path)
{
    chroot_dir = path;
}
181
Jes Sorensene06eb602010-06-10 11:42:29 +0200182static void change_root(void)
Jes Sorensen07663792010-06-10 11:42:27 +0200183{
184 if (chroot_dir) {
185 if (chroot(chroot_dir) < 0) {
Ian Jackson22cd4f42018-04-16 15:15:51 +0100186 error_report("chroot failed");
Jes Sorensen07663792010-06-10 11:42:27 +0200187 exit(1);
188 }
189 if (chdir("/")) {
Ian Jacksona7aaec12018-04-16 15:16:23 +0100190 error_report("not able to chdir to /: %s", strerror(errno));
Jes Sorensen07663792010-06-10 11:42:27 +0200191 exit(1);
192 }
193 }
194
195}
Jes Sorenseneb505be2010-06-10 11:42:28 +0200196
Michael Tokarev433aed52023-09-01 13:12:59 +0300197
/* Non-zero when daemon mode has been requested via os_set_daemonize(). */
static int daemonize;
/*
 * Write end of the status pipe created in os_daemonize(); a status byte
 * is written to it from os_setup_post().
 */
static int daemon_pipe;

/* Report whether daemon mode is currently requested. */
bool is_daemonized(void)
{
    return daemonize != 0;
}

/* Record whether daemon mode is requested.  Always returns 0. */
int os_set_daemonize(bool d)
{
    daemonize = d ? 1 : 0;
    return 0;
}
211
Jes Sorenseneb505be2010-06-10 11:42:28 +0200212void os_daemonize(void)
213{
214 if (daemonize) {
Gonglei63ce8e12014-09-26 16:14:30 +0800215 pid_t pid;
Michael Tokarev0be5e432014-10-30 17:30:51 +0300216 int fds[2];
Jes Sorenseneb505be2010-06-10 11:42:28 +0200217
Marc-André Lureau3338a412022-04-22 14:47:59 +0400218 if (!g_unix_open_pipe(fds, FD_CLOEXEC, NULL)) {
Gonglei63ce8e12014-09-26 16:14:30 +0800219 exit(1);
220 }
Jes Sorenseneb505be2010-06-10 11:42:28 +0200221
Gonglei63ce8e12014-09-26 16:14:30 +0800222 pid = fork();
223 if (pid > 0) {
224 uint8_t status;
225 ssize_t len;
Jes Sorenseneb505be2010-06-10 11:42:28 +0200226
Gonglei63ce8e12014-09-26 16:14:30 +0800227 close(fds[1]);
Jes Sorenseneb505be2010-06-10 11:42:28 +0200228
Michael Tokarevccea25f2014-10-30 17:37:16 +0300229 do {
230 len = read(fds[0], &status, 1);
231 } while (len < 0 && errno == EINTR);
Michael Tokarevfee78fd2014-10-30 17:40:48 +0300232
233 /* only exit successfully if our child actually wrote
234 * a one-byte zero to our pipe, upon successful init */
235 exit(len == 1 && status == 0 ? 0 : 1);
236
237 } else if (pid < 0) {
238 exit(1);
239 }
Gonglei63ce8e12014-09-26 16:14:30 +0800240
241 close(fds[0]);
Michael Tokarev0be5e432014-10-30 17:30:51 +0300242 daemon_pipe = fds[1];
Gonglei63ce8e12014-09-26 16:14:30 +0800243
244 setsid();
245
246 pid = fork();
247 if (pid > 0) {
248 exit(0);
249 } else if (pid < 0) {
Jes Sorenseneb505be2010-06-10 11:42:28 +0200250 exit(1);
Gonglei63ce8e12014-09-26 16:14:30 +0800251 }
252 umask(027);
Jes Sorenseneb505be2010-06-10 11:42:28 +0200253
254 signal(SIGTSTP, SIG_IGN);
255 signal(SIGTTOU, SIG_IGN);
256 signal(SIGTTIN, SIG_IGN);
257 }
258}
259
/*
 * Raise the soft RLIMIT_NOFILE limit to the hard limit (on Darwin,
 * to the smaller of OPEN_MAX and the hard limit).  Nothing is changed
 * when the soft limit already equals the hard limit.  Failures to query
 * or set the limit only produce a warning.
 */
void os_setup_limits(void)
{
    struct rlimit lim;

    if (getrlimit(RLIMIT_NOFILE, &lim) < 0) {
        warn_report("unable to query NOFILE limit: %s", strerror(errno));
        return;
    }

    if (lim.rlim_cur != lim.rlim_max) {
#ifdef CONFIG_DARWIN
        lim.rlim_cur = lim.rlim_max > OPEN_MAX ? OPEN_MAX : lim.rlim_max;
#else
        lim.rlim_cur = lim.rlim_max;
#endif

        if (setrlimit(RLIMIT_NOFILE, &lim) < 0) {
            warn_report("unable to set NOFILE limit: %s", strerror(errno));
        }
    }
}
284
Jes Sorenseneb505be2010-06-10 11:42:28 +0200285void os_setup_post(void)
286{
287 int fd = 0;
288
289 if (daemonize) {
Jes Sorenseneb505be2010-06-10 11:42:28 +0200290 if (chdir("/")) {
Ian Jacksona7aaec12018-04-16 15:16:23 +0100291 error_report("not able to chdir to /: %s", strerror(errno));
Jes Sorenseneb505be2010-06-10 11:42:28 +0200292 exit(1);
293 }
Nikita Ivanov8b6aa692022-10-23 12:04:21 +0300294 fd = RETRY_ON_EINTR(qemu_open_old("/dev/null", O_RDWR));
Gonglei63ce8e12014-09-26 16:14:30 +0800295 if (fd == -1) {
296 exit(1);
297 }
Jes Sorenseneb505be2010-06-10 11:42:28 +0200298 }
299
Jes Sorensene06eb602010-06-10 11:42:29 +0200300 change_root();
301 change_process_uid();
Jes Sorenseneb505be2010-06-10 11:42:28 +0200302
303 if (daemonize) {
Michael Tokarev25cec2b2014-10-30 17:47:46 +0300304 uint8_t status = 0;
305 ssize_t len;
306
Jes Sorenseneb505be2010-06-10 11:42:28 +0200307 dup2(fd, 0);
308 dup2(fd, 1);
Dimitris Aragiorgis96c33a42016-02-18 13:38:38 +0200309 /* In case -D is given do not redirect stderr to /dev/null */
Richard Henderson229ef2e2022-04-17 11:29:45 -0700310 if (!qemu_log_enabled()) {
Dimitris Aragiorgis96c33a42016-02-18 13:38:38 +0200311 dup2(fd, 2);
312 }
Jes Sorenseneb505be2010-06-10 11:42:28 +0200313
314 close(fd);
Michael Tokarev25cec2b2014-10-30 17:47:46 +0300315
316 do {
317 len = write(daemon_pipe, &status, 1);
318 } while (len < 0 && errno == EINTR);
319 if (len != 1) {
320 exit(1);
321 }
Jes Sorenseneb505be2010-06-10 11:42:28 +0200322 }
323}
324
/*
 * Put stdout into line-buffered mode.  No buffer is supplied (NULL, 0);
 * the result of setvbuf() is not checked.
 */
void os_set_line_buffering(void)
{
    (void)setvbuf(stdout, NULL, _IOLBF, 0);
}
Jes Sorensen949d31e2010-10-26 10:39:22 +0200329
/*
 * Lock current and future memory mappings of the process with
 * mlockall().
 *
 * @on_fault: additionally request MCL_ONFAULT.
 *
 * Returns the result of mlockall(); a negative result is also reported
 * as an error.  Returns -EINVAL (after reporting an error) when
 * @on_fault is set but HAVE_MLOCK_ONFAULT is not defined, and -ENOSYS
 * when HAVE_MLOCKALL is not defined.
 */
int os_mlock(bool on_fault)
{
#ifndef HAVE_MLOCKALL
    (void)on_fault;
    return -ENOSYS;
#else
    int mcl_flags = MCL_CURRENT | MCL_FUTURE;
    int rc;

    if (on_fault) {
#ifdef HAVE_MLOCK_ONFAULT
        mcl_flags |= MCL_ONFAULT;
#else
        error_report("mlockall: on_fault not supported");
        return -EINVAL;
#endif
    }

    rc = mlockall(mcl_flags);
    if (rc < 0) {
        error_report("mlockall: %s", strerror(errno));
    }

    return rc;
#endif
}