blob: b3ccffbf0fac3e2c3477f78c1035e60c2167b5c4 [file] [log] [blame]
bellarde88de092005-02-07 12:35:39 +00001#ifndef QEMU_H
2#define QEMU_H
bellard31e31b82003-02-18 22:55:36 +00003
Timothy E Baldwin4d330ce2016-05-12 18:47:46 +01004#include "hostdep.h"
bellard6180a182003-09-30 21:04:53 +00005#include "cpu.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +01006#include "exec/exec-all.h"
Paolo Bonzinif08b6172014-03-28 19:42:10 +01007#include "exec/cpu_ldst.h"
blueswir1992f48a2007-10-14 16:27:31 +00008
balrog06177d32007-12-24 13:47:52 +00009#undef DEBUG_REMAP
10#ifdef DEBUG_REMAP
balrog06177d32007-12-24 13:47:52 +000011#endif /* DEBUG_REMAP */
12
Paolo Bonzini022c62c2012-12-17 18:19:49 +010013#include "exec/user/abitypes.h"
blueswir1992f48a2007-10-14 16:27:31 +000014
Paolo Bonzini022c62c2012-12-17 18:19:49 +010015#include "exec/user/thunk.h"
blueswir1992f48a2007-10-14 16:27:31 +000016#include "syscall_defs.h"
Lluís Vilanova460c5792016-02-01 19:38:42 +010017#include "target_syscall.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010018#include "exec/gdbstub.h"
bellard66fb9762003-03-23 01:06:05 +000019
Peter Maydell1d48fdd2016-06-14 12:49:18 +010020/* This is the size of the host kernel's sigset_t, needed where we make
21 * direct system calls that take a sigset_t pointer and a size.
22 */
23#define SIGSET_T_SIZE (_NSIG / 8)
24
bellard31e31b82003-02-18 22:55:36 +000025/* This struct is used to hold certain information about the image.
26 * Basically, it replicates in user space what would be certain
27 * task_struct fields in the kernel
28 */
29struct image_info {
Richard Henderson9955ffa2010-07-27 10:25:30 -070030 abi_ulong load_bias;
blueswir1992f48a2007-10-14 16:27:31 +000031 abi_ulong load_addr;
32 abi_ulong start_code;
33 abi_ulong end_code;
34 abi_ulong start_data;
35 abi_ulong end_data;
36 abi_ulong start_brk;
37 abi_ulong brk;
Richard Henderson6fd59442020-01-17 13:02:45 -100038 abi_ulong reserve_brk;
blueswir1992f48a2007-10-14 16:27:31 +000039 abi_ulong start_mmap;
blueswir1992f48a2007-10-14 16:27:31 +000040 abi_ulong start_stack;
Paul Brook97374d32010-06-16 13:03:51 +010041 abi_ulong stack_limit;
blueswir1992f48a2007-10-14 16:27:31 +000042 abi_ulong entry;
43 abi_ulong code_offset;
44 abi_ulong data_offset;
Mika Westerbergedf8e2a2009-04-07 09:57:11 +030045 abi_ulong saved_auxv;
Alexander Graf125b0f52012-01-28 21:12:14 +020046 abi_ulong auxv_len;
Mika Westerbergedf8e2a2009-04-07 09:57:11 +030047 abi_ulong arg_start;
48 abi_ulong arg_end;
Richard Henderson7c4ee5b2016-12-15 09:38:11 -080049 abi_ulong arg_strings;
50 abi_ulong env_strings;
51 abi_ulong file_string;
Paul Brookd8fd2952012-03-30 18:02:50 +010052 uint32_t elf_flags;
Paolo Bonzini7d374352018-12-13 23:37:37 +010053 int personality;
Laurent Vivier33143c42018-07-16 21:53:49 +020054 abi_ulong alignment;
Christophe Lyona99856c2018-04-30 10:03:41 +020055
56 /* The fields below are used in FDPIC mode. */
Mike Frysinger1af02e82011-02-07 01:05:50 -050057 abi_ulong loadmap_addr;
58 uint16_t nsegs;
59 void *loadsegs;
60 abi_ulong pt_dynamic_addr;
Christophe Lyon3cb10cf2018-04-30 10:03:43 +020061 abi_ulong interpreter_loadmap_addr;
62 abi_ulong interpreter_pt_dynamic_addr;
Mike Frysinger1af02e82011-02-07 01:05:50 -050063 struct image_info *other_info;
Richard Henderson83f990e2020-10-21 10:37:47 -070064
65 /* For target-specific processing of NT_GNU_PROPERTY_TYPE_0. */
66 uint32_t note_flags;
67
Stefan Markovic74cfc702018-10-22 16:43:40 +020068#ifdef TARGET_MIPS
69 int fp_abi;
70 int interp_fp_abi;
71#endif
bellard31e31b82003-02-18 22:55:36 +000072};
73
bellardb346ff42003-06-15 20:05:50 +000074#ifdef TARGET_I386
bellard851e67a2003-03-29 16:53:14 +000075/* Information about the current linux thread */
/*
 * Register snapshot used by the vm86 support: ten 32-bit values followed
 * by the six 16-bit segment registers.  Member order defines the layout.
 */
struct vm86_saved_state {
    uint32_t eax;       /* return code */
    uint32_t ebx;
    uint32_t ecx;
    uint32_t edx;
    uint32_t esi;
    uint32_t edi;
    uint32_t ebp;
    uint32_t esp;
    uint32_t eflags;
    uint32_t eip;
    uint16_t cs;
    uint16_t ss;
    uint16_t ds;
    uint16_t es;
    uint16_t fs;
    uint16_t gs;
};
bellardb346ff42003-06-15 20:05:50 +000089#endif
bellard851e67a2003-03-29 16:53:14 +000090
Peter Maydell848d72c2013-09-03 20:12:17 +010091#if defined(TARGET_ARM) && defined(TARGET_ABI32)
bellard28c4f362004-02-16 21:47:43 +000092/* FPU emulator */
93#include "nwfpe/fpa11.h"
bellard28c4f362004-02-16 21:47:43 +000094#endif
95
pbrook624f7972008-05-31 16:11:38 +000096#define MAX_SIGQUEUE_SIZE 1024
97
pbrook624f7972008-05-31 16:11:38 +000098struct emulated_sigtable {
99 int pending; /* true if signal is pending */
Timothy E Baldwin907f5fd2016-05-27 15:51:52 +0100100 target_siginfo_t info;
pbrook624f7972008-05-31 16:11:38 +0000101};
102
bellard851e67a2003-03-29 16:53:14 +0000103/* NOTE: we force a big alignment so that the stack stored after is
104 aligned too */
105typedef struct TaskState {
Mika Westerbergedf8e2a2009-04-07 09:57:11 +0300106 pid_t ts_tid; /* tid (or pid) of this task */
bellard28c4f362004-02-16 21:47:43 +0000107#ifdef TARGET_ARM
Peter Maydell848d72c2013-09-03 20:12:17 +0100108# ifdef TARGET_ABI32
bellard28c4f362004-02-16 21:47:43 +0000109 /* FPA state */
110 FPA11 fpa;
Peter Maydell848d72c2013-09-03 20:12:17 +0100111# endif
Keith Packarda10b9d92021-01-08 22:42:52 +0000112#endif
113#if defined(TARGET_ARM) || defined(TARGET_RISCV)
bellarda4f81972005-04-23 18:25:41 +0000114 int swi_errno;
bellard28c4f362004-02-16 21:47:43 +0000115#endif
j_mayer84409dd2007-04-06 08:56:50 +0000116#if defined(TARGET_I386) && !defined(TARGET_X86_64)
blueswir1992f48a2007-10-14 16:27:31 +0000117 abi_ulong target_v86;
bellard851e67a2003-03-29 16:53:14 +0000118 struct vm86_saved_state vm86_saved_regs;
bellardb333af02003-05-14 21:48:51 +0000119 struct target_vm86plus_struct vm86plus;
bellard631271d2003-05-10 13:14:52 +0000120 uint32_t v86flags;
121 uint32_t v86mask;
bellardb346ff42003-06-15 20:05:50 +0000122#endif
pbrookc2764712009-03-07 15:24:59 +0000123 abi_ulong child_tidptr;
pbrooke6e59062006-10-22 00:18:54 +0000124#ifdef TARGET_M68K
Peter Maydell1ccd9372013-07-16 18:44:55 +0100125 abi_ulong tp_value;
pbrooke6e59062006-10-22 00:18:54 +0000126#endif
Keith Packarda10b9d92021-01-08 22:42:52 +0000127#if defined(TARGET_ARM) || defined(TARGET_M68K) || defined(TARGET_RISCV)
pbrooka87295e2007-05-26 15:09:38 +0000128 /* Extra fields for semihosted binaries. */
Peter Maydelld3170912016-07-04 13:06:35 +0100129 abi_ulong heap_base;
130 abi_ulong heap_limit;
pbrooka87295e2007-05-26 15:09:38 +0000131#endif
Peter Maydelld3170912016-07-04 13:06:35 +0100132 abi_ulong stack_base;
bellard851e67a2003-03-29 16:53:14 +0000133 int used; /* non zero if used */
pbrook978efd62006-06-17 18:30:42 +0000134 struct image_info *info;
Mika Westerbergedf8e2a2009-04-07 09:57:11 +0300135 struct linux_binprm *bprm;
pbrook624f7972008-05-31 16:11:38 +0000136
Timothy E Baldwin655ed672016-05-27 15:51:53 +0100137 struct emulated_sigtable sync_signal;
pbrook624f7972008-05-31 16:11:38 +0000138 struct emulated_sigtable sigtab[TARGET_NSIG];
Peter Maydell3d3efba2016-05-27 15:51:49 +0100139 /* This thread's signal mask, as requested by the guest program.
140 * The actual signal mask of this thread may differ:
141 * + we don't let SIGSEGV and SIGBUS be blocked while running guest code
142 * + sometimes we block all signals to avoid races
143 */
144 sigset_t signal_mask;
145 /* The signal mask imposed by a guest sigsuspend syscall, if we are
146 * currently in the middle of such a syscall
147 */
148 sigset_t sigsuspend_mask;
149 /* Nonzero if we're leaving a sigsuspend and sigsuspend_mask is valid. */
150 int in_sigsuspend;
151
152 /* Nonzero if process_pending_signals() needs to do something (either
153 * handle a pending signal or unblock signals).
154 * This flag is written from a signal handler so should be accessed via
Stefan Hajnoczid73415a2020-09-23 11:56:46 +0100155 * the qatomic_read() and qatomic_set() functions. (It is not accessed
Peter Maydell3d3efba2016-05-27 15:51:49 +0100156 * from multiple threads.)
157 */
158 int signal_pending;
159
Peter Maydell5bfce0b2019-07-25 14:16:45 +0100160 /* This thread's sigaltstack, if it has one */
161 struct target_sigaltstack sigaltstack_used;
bellard851e67a2003-03-29 16:53:14 +0000162} __attribute__((aligned(16))) TaskState;
163
aurel32d088d662009-01-30 20:09:01 +0000164extern char *exec_path;
pbrook624f7972008-05-31 16:11:38 +0000165void init_task_state(TaskState *ts);
Mika Westerbergedf8e2a2009-04-07 09:57:11 +0300166void task_settid(TaskState *);
167void stop_all_tasks(void);
pbrookc5937222006-05-14 11:30:38 +0000168extern const char *qemu_uname_release;
Paul Brook379f6692009-07-17 12:48:08 +0100169extern unsigned long mmap_min_addr;
bellard851e67a2003-03-29 16:53:14 +0000170
pbrooke5fe0c52006-06-11 13:32:59 +0000171/* ??? See if we can avoid exposing so much of the loader internals. */
pbrooke5fe0c52006-06-11 13:32:59 +0000172
Richard Henderson9955ffa2010-07-27 10:25:30 -0700173/* Read a good amount of data initially, to hopefully get all the
174 program headers loaded. */
175#define BPRM_BUF_SIZE 1024
176
pbrooke5fe0c52006-06-11 13:32:59 +0000177/*
ths5fafdf22007-09-16 21:08:06 +0000178 * This structure is used to hold the arguments that are
pbrooke5fe0c52006-06-11 13:32:59 +0000179 * used when loading binaries.
180 */
181struct linux_binprm {
Richard Henderson9955ffa2010-07-27 10:25:30 -0700182 char buf[BPRM_BUF_SIZE] __attribute__((aligned));
blueswir1992f48a2007-10-14 16:27:31 +0000183 abi_ulong p;
Paolo Bonzini7d374352018-12-13 23:37:37 +0100184 int fd;
pbrooke5fe0c52006-06-11 13:32:59 +0000185 int e_uid, e_gid;
186 int argc, envc;
187 char **argv;
188 char **envp;
189 char * filename; /* Name of binary */
Andreas Färber9349b4f2012-03-14 01:38:32 +0100190 int (*core_dump)(int, const CPUArchState *); /* coredump routine */
pbrooke5fe0c52006-06-11 13:32:59 +0000191};
192
Filip Bozuta79482e592020-06-19 14:47:27 +0200193typedef struct IOCTLEntry IOCTLEntry;
194
195typedef abi_long do_ioctl_fn(const IOCTLEntry *ie, uint8_t *buf_temp,
196 int fd, int cmd, abi_long arg);
197
198struct IOCTLEntry {
199 int target_cmd;
200 unsigned int host_cmd;
201 const char *name;
202 int access;
203 do_ioctl_fn *do_ioctl;
204 const argtype arg_type[5];
205};
206
207extern IOCTLEntry ioctl_entries[];
208
209#define IOC_R 0x0001
210#define IOC_W 0x0002
211#define IOC_RW (IOC_R | IOC_W)
212
pbrooke5fe0c52006-06-11 13:32:59 +0000213void do_init_thread(struct target_pt_regs *regs, struct image_info *infop);
blueswir1992f48a2007-10-14 16:27:31 +0000214abi_ulong loader_build_argptr(int envc, int argc, abi_ulong sp,
215 abi_ulong stringp, int push_ptr);
Laurent Vivier03cfd8f2013-08-30 01:46:44 +0200216int loader_exec(int fdexec, const char *filename, char **argv, char **envp,
Mika Westerbergedf8e2a2009-04-07 09:57:11 +0300217 struct target_pt_regs * regs, struct image_info *infop,
218 struct linux_binprm *);
bellard31e31b82003-02-18 22:55:36 +0000219
Christophe Lyon3cb10cf2018-04-30 10:03:43 +0200220/* Returns true if the image uses the FDPIC ABI. If this is the case,
221 * we have to provide some information (loadmap, pt_dynamic_info) such
222 * that the program can be relocated adequately. This is also useful
223 * when handling signals.
224 */
225int info_is_fdpic(struct image_info *info);
226
YunQiang Su768fe762018-02-20 18:33:05 +0100227uint32_t get_elf_eflags(int fd);
Will Newtonf0116c52014-01-09 09:10:50 +0000228int load_elf_binary(struct linux_binprm *bprm, struct image_info *info);
229int load_flt_binary(struct linux_binprm *bprm, struct image_info *info);
pbrooke5fe0c52006-06-11 13:32:59 +0000230
bellard579a97f2007-11-11 14:26:47 +0000231abi_long memcpy_to_target(abi_ulong dest, const void *src,
232 unsigned long len);
blueswir1992f48a2007-10-14 16:27:31 +0000233void target_set_brk(abi_ulong new_brk);
234abi_long do_brk(abi_ulong new_brk);
bellard31e31b82003-02-18 22:55:36 +0000235void syscall_init(void);
blueswir1992f48a2007-10-14 16:27:31 +0000236abi_long do_syscall(void *cpu_env, int num, abi_long arg1,
237 abi_long arg2, abi_long arg3, abi_long arg4,
Peter Maydell5945cfc2011-06-16 17:37:13 +0100238 abi_long arg5, abi_long arg6, abi_long arg7,
239 abi_long arg8);
Peter Maydellb44316f2018-02-13 13:22:46 +0000240extern __thread CPUState *thread_cpu;
Andreas Färber9349b4f2012-03-14 01:38:32 +0100241void cpu_loop(CPUArchState *env);
Peter Maydell7dcdaea2016-06-06 19:58:18 +0100242const char *target_strerror(int err);
pbrooka745ec62008-05-06 15:36:17 +0000243int get_osversion(void);
Peter Maydell4a24a752013-09-03 20:12:20 +0100244void init_qemu_uname_release(void);
pbrookd5975362008-06-07 20:50:51 +0000245void fork_start(void);
246void fork_end(int child);
bellard6977fbf2003-04-29 20:39:23 +0000247
Alex Bennéeee947432020-05-13 18:51:28 +0100248/**
249 * probe_guest_base:
250 * @image_name: the executable being loaded
251 * @loaddr: the lowest fixed address in the executable
252 * @hiaddr: the highest fixed address in the executable
253 *
254 * Creates the initial guest address space in the host memory space.
255 *
256 * If @loaddr == 0, then no address in the executable is fixed,
257 * i.e. it is fully relocatable. In that case @hiaddr is the size
258 * of the executable.
259 *
260 * This function will not return if a valid value for guest_base
261 * cannot be chosen. On return, the executable loader can expect
262 *
263 * target_mmap(loaddr, hiaddr - loaddr, ...)
264 *
265 * to succeed.
Meador Ingedce10402012-07-26 16:50:01 +0000266 */
Alex Bennéeee947432020-05-13 18:51:28 +0100267void probe_guest_base(const char *image_name,
268 abi_ulong loaddr, abi_ulong hiaddr);
Meador Ingedce10402012-07-26 16:50:01 +0000269
Paolo Bonzini1de7afc2012-12-17 18:20:00 +0100270#include "qemu/log.h"
bellard631271d2003-05-10 13:14:52 +0000271
Timothy E Baldwin4d330ce2016-05-12 18:47:46 +0100272/* safe_syscall.S */
273
274/**
275 * safe_syscall:
276 * @int number: number of system call to make
277 * ...: arguments to the system call
278 *
279 * Call a system call if guest signal not pending.
280 * This has the same API as the libc syscall() function, except that it
281 * may return -1 with errno == TARGET_ERESTARTSYS if a signal was pending.
282 *
283 * Returns: the system call result, or -1 with an error code in errno
284 * (Errnos are host errnos; we rely on TARGET_ERESTARTSYS not clashing
285 * with any of the host errno values.)
286 */
287
288/* A guide to using safe_syscall() to handle interactions between guest
289 * syscalls and guest signals:
290 *
291 * Guest syscalls come in two flavours:
292 *
293 * (1) Non-interruptible syscalls
294 *
295 * These are guest syscalls that never get interrupted by signals and
296 * so never return EINTR. They can be implemented straightforwardly in
297 * QEMU: just make sure that if the implementation code has to make any
298 * blocking calls that those calls are retried if they return EINTR.
299 * It's also OK to implement these with safe_syscall, though it will be
300 * a little less efficient if a signal is delivered at the 'wrong' moment.
301 *
Peter Maydell3d3efba2016-05-27 15:51:49 +0100302 * Some non-interruptible syscalls need to be handled using block_signals()
303 * to block signals for the duration of the syscall. This mainly applies
304 * to code which needs to modify the data structures used by the
305 * host_signal_handler() function and the functions it calls, including
306 * all syscalls which change the thread's signal mask.
307 *
Timothy E Baldwin4d330ce2016-05-12 18:47:46 +0100308 * (2) Interruptible syscalls
309 *
310 * These are guest syscalls that can be interrupted by signals and
311 * for which we need to either return EINTR or arrange for the guest
312 * syscall to be restarted. This category includes both syscalls which
313 * always restart (and in the kernel return -ERESTARTNOINTR), ones
314 * which only restart if there is no handler (kernel returns -ERESTARTNOHAND
315 * or -ERESTART_RESTARTBLOCK), and the most common kind which restart
316 * if the handler was registered with SA_RESTART (kernel returns
317 * -ERESTARTSYS). System calls which are only interruptible in some
318 * situations (like 'open') also need to be handled this way.
319 *
320 * Here it is important that the host syscall is made
321 * via this safe_syscall() function, and *not* via the host libc.
322 * If the host libc is used then the implementation will appear to work
323 * most of the time, but there will be a race condition where a
324 * signal could arrive just before we make the host syscall inside libc,
325 * and then the guest syscall will not correctly be interrupted.
326 * Instead the implementation of the guest syscall can use the safe_syscall
327 * function but otherwise just return the result or errno in the usual
328 * way; the main loop code will take care of restarting the syscall
329 * if appropriate.
330 *
331 * (If the implementation needs to make multiple host syscalls this is
332 * OK; any which might really block must be via safe_syscall(); for those
333 * which are only technically blocking (ie which we know in practice won't
334 * stay in the host kernel indefinitely) it's OK to use libc if necessary.
335 * You must be able to cope with backing out correctly if some safe_syscall
336 * you make in the implementation returns either -TARGET_ERESTARTSYS or
337 * EINTR though.)
338 *
Peter Maydell3d3efba2016-05-27 15:51:49 +0100339 * block_signals() cannot be used for interruptible syscalls.
340 *
Timothy E Baldwin4d330ce2016-05-12 18:47:46 +0100341 *
342 * How and why the safe_syscall implementation works:
343 *
344 * The basic setup is that we make the host syscall via a known
345 * section of host native assembly. If a signal occurs, our signal
346 * handler checks the interrupted host PC against the address of that
347 * known section. If the PC is before or at the address of the syscall
348 * instruction then we change the PC to point at a "return
349 * -TARGET_ERESTARTSYS" code path instead, and then exit the signal handler
350 * (causing the safe_syscall() call to immediately return that value).
351 * Then in the main.c loop if we see this magic return value we adjust
352 * the guest PC to wind it back to before the system call, and invoke
353 * the guest signal handler as usual.
354 *
355 * This winding-back will happen in two cases:
356 * (1) signal came in just before we took the host syscall (a race);
357 * in this case we'll take the guest signal and have another go
358 * at the syscall afterwards, and this is indistinguishable for the
359 * guest from the timing having been different such that the guest
360 * signal really did win the race
361 * (2) signal came in while the host syscall was blocking, and the
362 * host kernel decided the syscall should be restarted;
363 * in this case we want to restart the guest syscall also, and so
364 * rewinding is the right thing. (Note that "restart" semantics mean
365 * "first call the signal handler, then reattempt the syscall".)
366 * The other situation to consider is when a signal came in while the
367 * host syscall was blocking, and the host kernel decided that the syscall
368 * should not be restarted; in this case QEMU's host signal handler will
369 * be invoked with the PC pointing just after the syscall instruction,
370 * with registers indicating an EINTR return; the special code in the
371 * handler will not kick in, and we will return EINTR to the guest as
372 * we should.
373 *
374 * Notice that we can leave the host kernel to make the decision for
375 * us about whether to do a restart of the syscall or not; we do not
376 * need to check SA_RESTART flags in QEMU or distinguish the various
377 * kinds of restartability.
378 */
379#ifdef HAVE_SAFE_SYSCALL
380/* The core part of this function is implemented in assembly */
381extern long safe_syscall_base(int *pending, long number, ...);
382
/*
 * Wrap safe_syscall_base() for the current thread: pass it the address of
 * this thread's TaskState.signal_pending flag ahead of the caller's
 * arguments, then convert an error result into the libc convention of
 * returning -1 with the code stored in errno.
 */
#define safe_syscall(...)                                                \
    ({                                                                   \
        TaskState *ts_ = (TaskState *)thread_cpu->opaque;                \
        long rv_ = safe_syscall_base(&ts_->signal_pending, __VA_ARGS__); \
        if (is_error(rv_)) {                                             \
            errno = -rv_;                                                \
            rv_ = -1;                                                    \
        }                                                                \
        rv_;                                                             \
    })
394
395#else
396
397/* Fallback for architectures which don't yet provide a safe-syscall assembly
398 * fragment; note that this is racy!
399 * This should go away when all host architectures have been updated.
400 */
401#define safe_syscall syscall
402
403#endif
404
Richard Hendersona05c6402012-09-15 11:34:20 -0700405/* syscall.c */
406int host_to_target_waitstatus(int status);
407
thsb92c47c2007-11-01 00:07:38 +0000408/* strace.c */
Filip Bozutae400e112020-08-11 18:45:49 +0200409void print_syscall(void *cpu_env, int num,
bellardc16f9ed2007-11-11 17:23:29 +0000410 abi_long arg1, abi_long arg2, abi_long arg3,
411 abi_long arg4, abi_long arg5, abi_long arg6);
Filip Bozutae400e112020-08-11 18:45:49 +0200412void print_syscall_ret(void *cpu_env, int num, abi_long ret,
Filip Bozutac84be712020-06-19 14:33:26 +0200413 abi_long arg1, abi_long arg2, abi_long arg3,
414 abi_long arg4, abi_long arg5, abi_long arg6);
Peter Maydell0cb581d2016-07-18 18:12:24 +0100415/**
416 * print_taken_signal:
417 * @target_signum: target signal being taken
418 * @tinfo: target_siginfo_t which will be passed to the guest for the signal
419 *
420 * Print strace output indicating that this signal is being taken by the guest,
421 * in a format similar to:
422 * --- SIGSEGV {si_signo=SIGSEGV, si_code=SI_KERNEL, si_addr=0} ---
423 */
424void print_taken_signal(int target_signum, const target_siginfo_t *tinfo);
thsb92c47c2007-11-01 00:07:38 +0000425
bellardb346ff42003-06-15 20:05:50 +0000426/* signal.c */
Andreas Färber9349b4f2012-03-14 01:38:32 +0100427void process_pending_signals(CPUArchState *cpu_env);
bellardb346ff42003-06-15 20:05:50 +0000428void signal_init(void);
Peter Maydell9d2803f2016-07-28 16:44:46 +0100429int queue_signal(CPUArchState *env, int sig, int si_type,
430 target_siginfo_t *info);
Anthony Liguoric227f092009-10-01 16:12:16 -0500431void host_to_target_siginfo(target_siginfo_t *tinfo, const siginfo_t *info);
432void target_to_host_siginfo(siginfo_t *info, const target_siginfo_t *tinfo);
pbrook4cb05962008-05-30 18:05:19 +0000433int target_to_host_signal(int sig);
pbrook1d9d8b52009-04-16 15:17:02 +0000434int host_to_target_signal(int sig);
Andreas Färber9349b4f2012-03-14 01:38:32 +0100435long do_sigreturn(CPUArchState *env);
436long do_rt_sigreturn(CPUArchState *env);
bellard579a97f2007-11-11 14:26:47 +0000437abi_long do_sigaltstack(abi_ulong uss_addr, abi_ulong uoss_addr, abi_ulong sp);
Alex Barcelo1c275922014-03-14 14:36:55 +0000438int do_sigprocmask(int how, const sigset_t *set, sigset_t *oldset);
Richard Hendersonfa97e382018-07-18 13:06:48 -0700439abi_long do_swapcontext(CPUArchState *env, abi_ulong uold_ctx,
440 abi_ulong unew_ctx, abi_long ctx_size);
Peter Maydell3d3efba2016-05-27 15:51:49 +0100441/**
442 * block_signals: block all signals while handling this guest syscall
443 *
444 * Block all signals, and arrange that the signal mask is returned to
445 * its correct value for the guest before we resume execution of guest code.
446 * If this function returns non-zero, then the caller should immediately
447 * return -TARGET_ERESTARTSYS to the main loop, which will take the pending
448 * signal and restart execution of the syscall.
449 * If block_signals() returns zero, then the caller can continue with
450 * emulation of the system call knowing that no signals can be taken
451 * (and therefore that no race conditions will result).
452 * This should only be called once, because if it is called a second time
453 * it will always return non-zero. (Think of it like a mutex that can't
454 * be recursively locked.)
455 * Signals will be unblocked again by process_pending_signals().
456 *
457 * Return value: non-zero if there was a pending signal, zero if not.
458 */
459int block_signals(void); /* Returns non zero if signal pending */
bellardb346ff42003-06-15 20:05:50 +0000460
461#ifdef TARGET_I386
bellard631271d2003-05-10 13:14:52 +0000462/* vm86.c */
463void save_v86_state(CPUX86State *env);
bellard447db212003-05-10 15:10:36 +0000464void handle_vm86_trap(CPUX86State *env, int trapno);
bellard631271d2003-05-10 13:14:52 +0000465void handle_vm86_fault(CPUX86State *env);
blueswir1992f48a2007-10-14 16:27:31 +0000466int do_vm86(CPUX86State *env, long subfunction, abi_ulong v86_addr);
blueswir15bfb56b2007-10-05 17:01:51 +0000467#elif defined(TARGET_SPARC64)
468void sparc64_set_context(CPUSPARCState *env);
469void sparc64_get_context(CPUSPARCState *env);
bellardb346ff42003-06-15 20:05:50 +0000470#endif
bellard631271d2003-05-10 13:14:52 +0000471
bellard54936002003-05-13 00:25:15 +0000472/* mmap.c */
blueswir1992f48a2007-10-14 16:27:31 +0000473int target_mprotect(abi_ulong start, abi_ulong len, int prot);
474abi_long target_mmap(abi_ulong start, abi_ulong len, int prot,
475 int flags, int fd, abi_ulong offset);
476int target_munmap(abi_ulong start, abi_ulong len);
477abi_long target_mremap(abi_ulong old_addr, abi_ulong old_size,
478 abi_ulong new_size, unsigned long flags,
479 abi_ulong new_addr);
pbrook07765902008-05-31 16:33:53 +0000480extern unsigned long last_brk;
Peter Maydell59e9d912012-03-08 14:40:33 +0000481extern abi_ulong mmap_next_start;
Richard Henderson30ab9ef2019-05-19 13:19:52 -0700482abi_ulong mmap_find_vma(abi_ulong, abi_ulong, abi_ulong);
pbrookd5975362008-06-07 20:50:51 +0000483void mmap_fork_start(void);
484void mmap_fork_end(int child);
bellard54936002003-05-13 00:25:15 +0000485
blueswir1440c7e82008-10-05 11:05:14 +0000486/* main.c */
Richard Henderson703e0e82010-03-19 14:21:13 -0700487extern unsigned long guest_stack_size;
blueswir1440c7e82008-10-05 11:05:14 +0000488
bellardedf779f2004-02-22 13:40:13 +0000489/* user access */
490
Richard Henderson68f77662021-02-12 10:48:38 -0800491#define VERIFY_READ PAGE_READ
492#define VERIFY_WRITE (PAGE_READ | PAGE_WRITE)
bellardedf779f2004-02-22 13:40:13 +0000493
Richard Henderson4feac832021-02-12 10:48:37 -0800494static inline bool access_ok(int type, abi_ulong addr, abi_ulong size)
bellarddae32702007-11-14 10:51:00 +0000495{
Richard Henderson114556c2021-02-12 10:48:45 -0800496 if (size == 0
Richard Henderson46b12f42021-02-12 10:48:46 -0800497 ? !guest_addr_valid_untagged(addr)
498 : !guest_range_valid_untagged(addr, size)) {
Richard Henderson4feac832021-02-12 10:48:37 -0800499 return false;
500 }
Richard Henderson68f77662021-02-12 10:48:38 -0800501 return page_check_range((target_ulong)addr, size, type) == 0;
bellarddae32702007-11-14 10:51:00 +0000502}
bellardedf779f2004-02-22 13:40:13 +0000503
Richard Henderson658f2dc2013-01-04 16:39:31 -0800504/* NOTE __get_user and __put_user use host pointers and don't check access.
505 These are usually used to access struct data members once the struct has
506 been locked - usually with lock_user_struct. */
bellardedf779f2004-02-22 13:40:13 +0000507
Peter Maydell850d5e32018-10-09 17:18:14 +0100508/*
509 * Tricky points:
510 * - Use __builtin_choose_expr to avoid type promotion from ?:,
511 * - Invalid sizes result in a compile time error stemming from
512 * the fact that abort has no parameters.
513 * - It's easier to use the endian-specific unaligned load/store
514 * functions than host-endian unaligned load/store plus tswapN.
515 * - The pragmas are necessary only to silence a clang false-positive
516 * warning: see https://bugs.llvm.org/show_bug.cgi?id=39113 .
Peter Maydell850d5e32018-10-09 17:18:14 +0100517 * - gcc has bugs in its _Pragma() support in some versions, eg
518 * https://gcc.gnu.org/bugzilla/show_bug.cgi?id=83256 -- so we only
519 * include the warning-suppression pragmas for clang
520 */
Thomas Huth798b8582018-11-30 09:23:16 +0100521#if defined(__clang__) && __has_warning("-Waddress-of-packed-member")
Peter Maydell850d5e32018-10-09 17:18:14 +0100522#define PRAGMA_DISABLE_PACKED_WARNING \
523 _Pragma("GCC diagnostic push"); \
Peter Maydell850d5e32018-10-09 17:18:14 +0100524 _Pragma("GCC diagnostic ignored \"-Waddress-of-packed-member\"")
Richard Henderson658f2dc2013-01-04 16:39:31 -0800525
Peter Maydell850d5e32018-10-09 17:18:14 +0100526#define PRAGMA_REENABLE_PACKED_WARNING \
527 _Pragma("GCC diagnostic pop")
Richard Henderson658f2dc2013-01-04 16:39:31 -0800528
Peter Maydell850d5e32018-10-09 17:18:14 +0100529#else
530#define PRAGMA_DISABLE_PACKED_WARNING
531#define PRAGMA_REENABLE_PACKED_WARNING
532#endif
533
/*
 * Store @x through host pointer @hptr with the @e-endian (be/le) store
 * helper that matches sizeof(*(hptr)).  No access check is performed.
 * A pointee size other than 1, 2, 4 or 8 selects abort, which takes no
 * arguments, so the call fails at compile time.
 */
#define __put_user_e(x, hptr, e)                                        \
    do {                                                                \
        PRAGMA_DISABLE_PACKED_WARNING;                                  \
        (__builtin_choose_expr(sizeof(*(hptr)) == 1,                    \
            stb_p,                                                      \
         __builtin_choose_expr(sizeof(*(hptr)) == 2,                    \
            stw_##e##_p,                                                \
         __builtin_choose_expr(sizeof(*(hptr)) == 4,                    \
            stl_##e##_p,                                                \
         __builtin_choose_expr(sizeof(*(hptr)) == 8,                    \
            stq_##e##_p,                                                \
            abort))))                                                   \
            ((hptr), (x)), (void)0);                                    \
        PRAGMA_REENABLE_PACKED_WARNING;                                 \
    } while (0)
544
/*
 * Load a value through host pointer @hptr with the @e-endian (be/le) load
 * helper that matches sizeof(*(hptr)), cast it to the pointee type and
 * assign it to @x.  No access check is performed.
 * A pointee size other than 1, 2, 4 or 8 selects abort, which takes no
 * arguments, so the call fails at compile time.
 *
 * The cast uses typeof(*(hptr)) with the argument parenthesised: without
 * the parentheses a compound argument such as "p + 1" would expand to
 * typeof(*p + 1), i.e. the promoted arithmetic type rather than the
 * pointee type, and signed narrow loads would lose their sign extension.
 */
#define __get_user_e(x, hptr, e)                                        \
    do {                                                                \
        PRAGMA_DISABLE_PACKED_WARNING;                                  \
        ((x) = (typeof(*(hptr)))(                                       \
         __builtin_choose_expr(sizeof(*(hptr)) == 1, ldub_p,            \
         __builtin_choose_expr(sizeof(*(hptr)) == 2, lduw_##e##_p,      \
         __builtin_choose_expr(sizeof(*(hptr)) == 4, ldl_##e##_p,       \
         __builtin_choose_expr(sizeof(*(hptr)) == 8, ldq_##e##_p, abort)))) \
            (hptr)), (void)0);                                          \
        PRAGMA_REENABLE_PACKED_WARNING;                                 \
    } while (0)
556
Richard Henderson658f2dc2013-01-04 16:39:31 -0800557
558#ifdef TARGET_WORDS_BIGENDIAN
559# define __put_user(x, hptr) __put_user_e(x, hptr, be)
560# define __get_user(x, hptr) __get_user_e(x, hptr, be)
561#else
562# define __put_user(x, hptr) __put_user_e(x, hptr, le)
563# define __get_user(x, hptr) __get_user_e(x, hptr, le)
564#endif
bellardedf779f2004-02-22 13:40:13 +0000565
bellard579a97f2007-11-11 14:26:47 +0000566/* put_user()/get_user() take a guest address and check access */
567/* These are usually used to access an atomic data type, such as an int,
568 * that has been passed by address. These internally perform locking
569 * and unlocking on the data type.
570 */
/*
 * Write @x, as a @target_type, to guest address @gaddr.
 * The guest location is locked for writing, stored to with __put_user()
 * and unlocked again.  Evaluates to 0 on success, or -TARGET_EFAULT when
 * lock_user() cannot provide a host pointer (nothing is written then).
 */
#define put_user(x, gaddr, target_type)                                 \
({                                                                      \
    abi_ulong __gaddr = (gaddr);                                        \
    abi_long __ret = -TARGET_EFAULT;                                    \
    target_type *__hptr = lock_user(VERIFY_WRITE, __gaddr,              \
                                    sizeof(target_type), 0);            \
    if (__hptr) {                                                       \
        __put_user((x), __hptr);                                        \
        unlock_user(__hptr, __gaddr, sizeof(target_type));              \
        __ret = 0;                                                      \
    }                                                                   \
    __ret;                                                              \
})
583
/*
 * Read a @target_type from guest address @gaddr into @x.
 * The guest location is locked for reading (with copy-in), loaded with
 * __get_user() and unlocked again.  Evaluates to 0 on success.  When
 * lock_user() cannot provide a host pointer, @x is set to 0 and the
 * result is -TARGET_EFAULT.
 */
#define get_user(x, gaddr, target_type)                                 \
({                                                                      \
    abi_ulong __gaddr = (gaddr);                                        \
    abi_long __ret = 0;                                                 \
    target_type *__hptr = lock_user(VERIFY_READ, __gaddr,               \
                                    sizeof(target_type), 1);            \
    if (__hptr) {                                                       \
        __get_user((x), __hptr);                                        \
        unlock_user(__hptr, __gaddr, 0);                                \
    } else {                                                            \
        /* avoid warning */                                             \
        (x) = 0;                                                        \
        __ret = -TARGET_EFAULT;                                         \
    }                                                                   \
    __ret;                                                              \
})
599
bellard2f619692007-11-16 10:46:05 +0000600#define put_user_ual(x, gaddr) put_user((x), (gaddr), abi_ulong)
601#define put_user_sal(x, gaddr) put_user((x), (gaddr), abi_long)
602#define put_user_u64(x, gaddr) put_user((x), (gaddr), uint64_t)
603#define put_user_s64(x, gaddr) put_user((x), (gaddr), int64_t)
604#define put_user_u32(x, gaddr) put_user((x), (gaddr), uint32_t)
605#define put_user_s32(x, gaddr) put_user((x), (gaddr), int32_t)
606#define put_user_u16(x, gaddr) put_user((x), (gaddr), uint16_t)
607#define put_user_s16(x, gaddr) put_user((x), (gaddr), int16_t)
608#define put_user_u8(x, gaddr) put_user((x), (gaddr), uint8_t)
609#define put_user_s8(x, gaddr) put_user((x), (gaddr), int8_t)
610
/*
 * Typed wrappers around get_user(): the suffix names the type that is
 * handed to get_user() as its target_type argument.
 */

/* ABI-sized values */
#define get_user_ual(x, gaddr)  get_user((x), (gaddr), abi_ulong)
#define get_user_sal(x, gaddr)  get_user((x), (gaddr), abi_long)

/* Unsigned fixed-width values */
#define get_user_u64(x, gaddr)  get_user((x), (gaddr), uint64_t)
#define get_user_u32(x, gaddr)  get_user((x), (gaddr), uint32_t)
#define get_user_u16(x, gaddr)  get_user((x), (gaddr), uint16_t)
#define get_user_u8(x, gaddr)   get_user((x), (gaddr), uint8_t)

/* Signed fixed-width values */
#define get_user_s64(x, gaddr)  get_user((x), (gaddr), int64_t)
#define get_user_s32(x, gaddr)  get_user((x), (gaddr), int32_t)
#define get_user_s16(x, gaddr)  get_user((x), (gaddr), int16_t)
#define get_user_s8(x, gaddr)   get_user((x), (gaddr), int8_t)
621
bellard579a97f2007-11-11 14:26:47 +0000622/* copy_from_user() and copy_to_user() are usually used to copy data
623 * buffers between the target and host. These internally perform
624 * locking/unlocking of the memory.
625 */
626abi_long copy_from_user(void *hptr, abi_ulong gaddr, size_t len);
627abi_long copy_to_user(abi_ulong gaddr, void *hptr, size_t len);
628
pbrook53a59602006-03-25 19:31:22 +0000629/* Functions for accessing guest memory. The tget and tput functions
Stefan Weil6f20f552013-09-12 19:57:15 +0200630 read/write single values, byteswapping as necessary. The lock_user function
pbrook53a59602006-03-25 19:31:22 +0000631 gets a pointer to a contiguous area of guest memory, but does not perform
Stefan Weil6f20f552013-09-12 19:57:15 +0200632 any byteswapping. lock_user may return either a pointer to the guest
pbrook53a59602006-03-25 19:31:22 +0000633 memory, or a temporary buffer. */
634
635/* Lock an area of guest memory into the host. If copy is true then the
636 host area will have the same contents as the guest. */
bellard579a97f2007-11-11 14:26:47 +0000637static inline void *lock_user(int type, abi_ulong guest_addr, long len, int copy)
bellardedf779f2004-02-22 13:40:13 +0000638{
bellard579a97f2007-11-11 14:26:47 +0000639 if (!access_ok(type, guest_addr, len))
640 return NULL;
pbrook53a59602006-03-25 19:31:22 +0000641#ifdef DEBUG_REMAP
bellard579a97f2007-11-11 14:26:47 +0000642 {
643 void *addr;
Md Haris Iqbal38e826d2016-03-24 00:02:03 +0530644 addr = g_malloc(len);
bellard579a97f2007-11-11 14:26:47 +0000645 if (copy)
646 memcpy(addr, g2h(guest_addr), len);
647 else
648 memset(addr, 0, len);
649 return addr;
650 }
pbrook53a59602006-03-25 19:31:22 +0000651#else
Richard Henderson3e8f1622021-02-12 10:48:43 -0800652 return g2h_untagged(guest_addr);
pbrook53a59602006-03-25 19:31:22 +0000653#endif
bellardedf779f2004-02-22 13:40:13 +0000654}
655
bellard579a97f2007-11-11 14:26:47 +0000656/* Unlock an area of guest memory. The first LEN bytes must be
ths1235fc02008-06-03 19:51:57 +0000657 flushed back to guest memory. host_ptr = NULL is explicitly
bellard579a97f2007-11-11 14:26:47 +0000658 allowed and does nothing. */
659static inline void unlock_user(void *host_ptr, abi_ulong guest_addr,
blueswir1992f48a2007-10-14 16:27:31 +0000660 long len)
bellardedf779f2004-02-22 13:40:13 +0000661{
bellard579a97f2007-11-11 14:26:47 +0000662
pbrook53a59602006-03-25 19:31:22 +0000663#ifdef DEBUG_REMAP
bellard579a97f2007-11-11 14:26:47 +0000664 if (!host_ptr)
665 return;
Richard Henderson3e8f1622021-02-12 10:48:43 -0800666 if (host_ptr == g2h_untagged(guest_addr))
pbrook53a59602006-03-25 19:31:22 +0000667 return;
668 if (len > 0)
Richard Henderson3e8f1622021-02-12 10:48:43 -0800669 memcpy(g2h_untagged(guest_addr), host_ptr, len);
Md Haris Iqbal38e826d2016-03-24 00:02:03 +0530670 g_free(host_ptr);
pbrook53a59602006-03-25 19:31:22 +0000671#endif
bellardedf779f2004-02-22 13:40:13 +0000672}
673
bellard579a97f2007-11-11 14:26:47 +0000674/* Return the length of a string in target memory or -TARGET_EFAULT if
675 access error. */
676abi_long target_strlen(abi_ulong gaddr);
bellardedf779f2004-02-22 13:40:13 +0000677
pbrook53a59602006-03-25 19:31:22 +0000678/* Like lock_user but for null terminated strings. */
blueswir1992f48a2007-10-14 16:27:31 +0000679static inline void *lock_user_string(abi_ulong guest_addr)
pbrook53a59602006-03-25 19:31:22 +0000680{
bellard579a97f2007-11-11 14:26:47 +0000681 abi_long len;
682 len = target_strlen(guest_addr);
683 if (len < 0)
684 return NULL;
685 return lock_user(VERIFY_READ, guest_addr, (long)(len + 1), 1);
pbrook53a59602006-03-25 19:31:22 +0000686}
687
/*
 * Helper macros for locking/unlocking a target struct.
 *
 * lock_user_struct(type, host_ptr, guest_addr, copy)
 *     Assigns to host_ptr the result of lock_user() for an area of
 *     sizeof(*host_ptr) bytes at guest_addr; the expression evaluates
 *     to the assigned pointer (NULL when lock_user() fails).
 *
 * unlock_user_struct(host_ptr, guest_addr, copy)
 *     Calls unlock_user() with a length of sizeof(*host_ptr) when copy
 *     is true and 0 otherwise.
 *
 * Every macro parameter is parenthesized so that an argument such as
 * "p + 1" is dereferenced as *(p + 1) rather than (*p) + 1.
 */
#define lock_user_struct(type, host_ptr, guest_addr, copy)              \
    ((host_ptr) = lock_user((type), (guest_addr),                       \
                            sizeof(*(host_ptr)), (copy)))
#define unlock_user_struct(host_ptr, guest_addr, copy)                  \
    unlock_user((host_ptr), (guest_addr),                               \
                (copy) ? sizeof(*(host_ptr)) : 0)
693
pbrookc8a706f2008-06-02 16:16:42 +0000694#include <pthread.h>
pbrookc8a706f2008-06-02 16:16:42 +0000695
Philippe Mathieu-Daudé1129dd72018-06-04 12:37:21 -0300696static inline int is_error(abi_long ret)
697{
698 return (abi_ulong)ret >= (abi_ulong)(-4096);
699}
700
/*
 * Build a 64-bit offset from the word(s) of a syscall argument.
 *
 * With a 32-bit target ABI the offset is assembled from two 32-bit
 * words; which one is the high half depends on
 * TARGET_WORDS_BIGENDIAN.  Otherwise word0 already is the offset and
 * word1 is ignored.
 */
#if TARGET_ABI_BITS == 32
static inline uint64_t target_offset64(uint32_t word0, uint32_t word1)
{
#ifdef TARGET_WORDS_BIGENDIAN
    const uint64_t high = word0;
    const uint64_t low = word1;
#else
    const uint64_t high = word1;
    const uint64_t low = word0;
#endif

    return (high << 32) | low;
}
#else /* TARGET_ABI_BITS != 32 */
static inline uint64_t target_offset64(uint64_t word0, uint64_t word1)
{
    return word0;
}
#endif /* TARGET_ABI_BITS == 32 */
716
Filip Bozuta888468d2020-07-23 23:02:33 +0200717void print_termios(void *arg);
Filip Bozuta7c89f342020-08-11 18:45:50 +0200718
/*
 * regpairs_aligned(): non-zero if 64-bit syscall arguments must start
 * on an even register pair.
 *
 * ARM EABI and MIPS expect 64-bit types to be aligned on even pairs of
 * registers.
 */
#ifdef TARGET_ARM
static inline int regpairs_aligned(void *cpu_env, int num)
{
    CPUARMState *arm_env = cpu_env;

    return arm_env->eabi == 1;
}
#elif defined(TARGET_MIPS) && (TARGET_ABI_BITS == 32)
static inline int regpairs_aligned(void *cpu_env, int num)
{
    return 1;
}
#elif defined(TARGET_PPC) && !defined(TARGET_PPC64)
/*
 * SysV ABI for PPC32 expects 64-bit parameters to be passed in odd/even
 * pairs of registers, which translates to the same as ARM/MIPS because
 * we start with r3 as arg1.
 */
static inline int regpairs_aligned(void *cpu_env, int num)
{
    return 1;
}
#elif defined(TARGET_SH4)
/* SH4 doesn't align register pairs, except for p{read,write}64 */
static inline int regpairs_aligned(void *cpu_env, int num)
{
    return num == TARGET_NR_pread64 || num == TARGET_NR_pwrite64;
}
#elif defined(TARGET_XTENSA)
static inline int regpairs_aligned(void *cpu_env, int num)
{
    return 1;
}
#else
static inline int regpairs_aligned(void *cpu_env, int num)
{
    return 0;
}
#endif
752
Alex Bennée708b6a62018-06-22 17:09:10 +0100753/**
754 * preexit_cleanup: housekeeping before the guest exits
755 *
756 * env: the CPU state
757 * code: the exit code
758 */
759void preexit_cleanup(CPUArchState *env, int code);
760
Peter Maydelldfeab062013-07-16 18:44:52 +0100761/* Include target-specific struct and function definitions;
762 * they may need access to the target-independent structures
763 * above, so include them last.
764 */
765#include "target_cpu.h"
Petar Jovanovic55a2b162013-10-30 14:46:31 +0100766#include "target_structs.h"
Peter Maydelldfeab062013-07-16 18:44:52 +0100767
bellarde88de092005-02-07 12:35:39 +0000768#endif /* QEMU_H */