aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 1 | /* |
| 2 | * QEMU posix-aio emulation |
| 3 | * |
| 4 | * Copyright IBM, Corp. 2008 |
| 5 | * |
| 6 | * Authors: |
| 7 | * Anthony Liguori <aliguori@us.ibm.com> |
| 8 | * |
| 9 | * This work is licensed under the terms of the GNU GPL, version 2. See |
| 10 | * the COPYING file in the top-level directory. |
| 11 | * |
| 12 | */ |
| 13 | |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 14 | #include <sys/ioctl.h> |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 15 | #include <pthread.h> |
| 16 | #include <unistd.h> |
| 17 | #include <errno.h> |
malc | 30525af | 2009-02-21 05:48:13 +0000 | [diff] [blame] | 18 | #include <time.h> |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 19 | #include <string.h> |
| 20 | #include <stdlib.h> |
| 21 | #include <stdio.h> |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 22 | #include "osdep.h" |
| 23 | |
| 24 | #include "posix-aio-compat.h" |
| 25 | |
/* Mutex held around every access to request_list and the thread counters. */
static pthread_mutex_t lock = PTHREAD_MUTEX_INITIALIZER;
/* Signalled after a request is queued; worker threads wait on it. */
static pthread_cond_t cond = PTHREAD_COND_INITIALIZER;
/* Receives the id of the most recently created worker thread. */
static pthread_t thread_id;
/* Thread attributes used for workers; set to detached in qemu_paio_init(). */
static pthread_attr_t attr;
/* Upper bound on cur_threads; checked before spawning a new worker. */
static int max_threads = 64;
/* Number of worker threads that currently exist. */
static int cur_threads = 0;
/* Number of worker threads not currently processing a request. */
static int idle_threads = 0;
/* Pending requests: appended at the tail, consumed from the head. */
static TAILQ_HEAD(, qemu_paiocb) request_list;
| 34 | |
/*
 * Report a fatal error and abort the process.
 *
 * err  - error number to describe (an errno-style value)
 * what - name of the operation that failed
 */
static void die2(int err, const char *what)
{
    const char *reason = strerror(err);

    fprintf(stderr, "%s failed: %s\n", what, reason);
    abort();
}
| 40 | |
/*
 * Report a fatal error described by the current value of errno and abort.
 *
 * what - name of the operation that failed
 */
static void die(const char *what)
{
    const int saved_errno = errno;

    die2(saved_errno, what);
}
| 45 | |
/* Lock @mutex; any failure is fatal and reported through die2(). */
static void mutex_lock(pthread_mutex_t *mutex)
{
    const int err = pthread_mutex_lock(mutex);

    if (err != 0) {
        die2(err, "pthread_mutex_lock");
    }
}
| 51 | |
/* Unlock @mutex; any failure is fatal and reported through die2(). */
static void mutex_unlock(pthread_mutex_t *mutex)
{
    const int err = pthread_mutex_unlock(mutex);

    if (err != 0) {
        die2(err, "pthread_mutex_unlock");
    }
}
| 57 | |
/*
 * Wait on @cond (with @mutex held) until signalled or until the absolute
 * time @ts is reached.
 *
 * Returns 0 when woken up and ETIMEDOUT when the deadline passed; every
 * other error is fatal.
 */
static int cond_timedwait(pthread_cond_t *cond, pthread_mutex_t *mutex,
                          struct timespec *ts)
{
    const int err = pthread_cond_timedwait(cond, mutex, ts);

    switch (err) {
    case 0:
    case ETIMEDOUT:
        /* both are expected outcomes, handed back to the caller */
        break;
    default:
        die2(err, "pthread_cond_timedwait");
        break;
    }

    return err;
}
| 65 | |
/* Wake one waiter on @cond; any failure is fatal. */
static void cond_signal(pthread_cond_t *cond)
{
    const int err = pthread_cond_signal(cond);

    if (err != 0) {
        die2(err, "pthread_cond_signal");
    }
}
| 71 | |
/*
 * Start a new thread running @start_routine(@arg) with attributes @attr and
 * store its id in @thread.  Failure to create the thread is fatal.
 */
static void thread_create(pthread_t *thread, pthread_attr_t *attr,
                          void *(*start_routine)(void*), void *arg)
{
    const int err = pthread_create(thread, attr, start_routine, arg);

    if (err != 0) {
        die2(err, "pthread_create");
    }
}
| 78 | |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 79 | static size_t handle_aiocb_readwrite(struct qemu_paiocb *aiocb) |
| 80 | { |
| 81 | size_t offset = 0; |
| 82 | ssize_t len; |
| 83 | |
| 84 | while (offset < aiocb->aio_nbytes) { |
| 85 | if (aiocb->aio_type == QEMU_PAIO_WRITE) |
| 86 | len = pwrite(aiocb->aio_fildes, |
| 87 | (const char *)aiocb->aio_buf + offset, |
| 88 | aiocb->aio_nbytes - offset, |
| 89 | aiocb->aio_offset + offset); |
| 90 | else |
| 91 | len = pread(aiocb->aio_fildes, |
| 92 | (char *)aiocb->aio_buf + offset, |
| 93 | aiocb->aio_nbytes - offset, |
| 94 | aiocb->aio_offset + offset); |
| 95 | |
| 96 | if (len == -1 && errno == EINTR) |
| 97 | continue; |
| 98 | else if (len == -1) { |
| 99 | offset = -errno; |
| 100 | break; |
| 101 | } else if (len == 0) |
| 102 | break; |
| 103 | |
| 104 | offset += len; |
| 105 | } |
| 106 | |
| 107 | return offset; |
| 108 | } |
| 109 | |
| 110 | static size_t handle_aiocb_ioctl(struct qemu_paiocb *aiocb) |
| 111 | { |
| 112 | int ret; |
| 113 | |
| 114 | ret = ioctl(aiocb->aio_fildes, aiocb->aio_ioctl_cmd, aiocb->aio_buf); |
| 115 | if (ret == -1) |
| 116 | return -errno; |
| 117 | return ret; |
| 118 | } |
| 119 | |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 120 | static void *aio_thread(void *unused) |
| 121 | { |
malc | a8227a5 | 2009-02-21 05:48:17 +0000 | [diff] [blame] | 122 | pid_t pid; |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 123 | sigset_t set; |
| 124 | |
malc | a8227a5 | 2009-02-21 05:48:17 +0000 | [diff] [blame] | 125 | pid = getpid(); |
| 126 | |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 127 | /* block all signals */ |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 128 | if (sigfillset(&set)) die("sigfillset"); |
| 129 | if (sigprocmask(SIG_BLOCK, &set, NULL)) die("sigprocmask"); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 130 | |
| 131 | while (1) { |
| 132 | struct qemu_paiocb *aiocb; |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 133 | size_t ret = 0; |
malc | 30525af | 2009-02-21 05:48:13 +0000 | [diff] [blame] | 134 | qemu_timeval tv; |
| 135 | struct timespec ts; |
| 136 | |
| 137 | qemu_gettimeofday(&tv); |
| 138 | ts.tv_sec = tv.tv_sec + 10; |
| 139 | ts.tv_nsec = 0; |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 140 | |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 141 | mutex_lock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 142 | |
| 143 | while (TAILQ_EMPTY(&request_list) && |
| 144 | !(ret == ETIMEDOUT)) { |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 145 | ret = cond_timedwait(&cond, &lock, &ts); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 146 | } |
| 147 | |
malc | 514f7a2 | 2009-02-21 05:48:19 +0000 | [diff] [blame] | 148 | if (TAILQ_EMPTY(&request_list)) |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 149 | break; |
| 150 | |
| 151 | aiocb = TAILQ_FIRST(&request_list); |
| 152 | TAILQ_REMOVE(&request_list, aiocb, node); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 153 | aiocb->active = 1; |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 154 | idle_threads--; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 155 | mutex_unlock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 156 | |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 157 | switch (aiocb->aio_type) { |
| 158 | case QEMU_PAIO_READ: |
| 159 | case QEMU_PAIO_WRITE: |
| 160 | ret = handle_aiocb_readwrite(aiocb); |
| 161 | break; |
| 162 | case QEMU_PAIO_IOCTL: |
| 163 | ret = handle_aiocb_ioctl(aiocb); |
| 164 | break; |
| 165 | default: |
| 166 | fprintf(stderr, "invalid aio request (0x%x)\n", aiocb->aio_type); |
| 167 | ret = -EINVAL; |
| 168 | break; |
| 169 | } |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 170 | |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 171 | mutex_lock(&lock); |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 172 | aiocb->ret = ret; |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 173 | idle_threads++; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 174 | mutex_unlock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 175 | |
malc | a8227a5 | 2009-02-21 05:48:17 +0000 | [diff] [blame] | 176 | if (kill(pid, aiocb->ev_signo)) die("kill failed"); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 177 | } |
| 178 | |
| 179 | idle_threads--; |
| 180 | cur_threads--; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 181 | mutex_unlock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 182 | |
| 183 | return NULL; |
| 184 | } |
| 185 | |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 186 | static void spawn_thread(void) |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 187 | { |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 188 | cur_threads++; |
| 189 | idle_threads++; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 190 | thread_create(&thread_id, &attr, aio_thread, NULL); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 191 | } |
| 192 | |
| 193 | int qemu_paio_init(struct qemu_paioinit *aioinit) |
| 194 | { |
malc | a8227a5 | 2009-02-21 05:48:17 +0000 | [diff] [blame] | 195 | int ret; |
| 196 | |
| 197 | ret = pthread_attr_init(&attr); |
| 198 | if (ret) die2(ret, "pthread_attr_init"); |
| 199 | |
| 200 | ret = pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED); |
| 201 | if (ret) die2(ret, "pthread_attr_setdetachstate"); |
| 202 | |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 203 | TAILQ_INIT(&request_list); |
| 204 | |
| 205 | return 0; |
| 206 | } |
| 207 | |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 208 | static int qemu_paio_submit(struct qemu_paiocb *aiocb, int type) |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 209 | { |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 210 | aiocb->aio_type = type; |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 211 | aiocb->ret = -EINPROGRESS; |
| 212 | aiocb->active = 0; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 213 | mutex_lock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 214 | if (idle_threads == 0 && cur_threads < max_threads) |
| 215 | spawn_thread(); |
| 216 | TAILQ_INSERT_TAIL(&request_list, aiocb, node); |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 217 | mutex_unlock(&lock); |
malc | 5d47e37 | 2009-02-21 05:48:15 +0000 | [diff] [blame] | 218 | cond_signal(&cond); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 219 | |
| 220 | return 0; |
| 221 | } |
| 222 | |
| 223 | int qemu_paio_read(struct qemu_paiocb *aiocb) |
| 224 | { |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 225 | return qemu_paio_submit(aiocb, QEMU_PAIO_READ); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 226 | } |
| 227 | |
| 228 | int qemu_paio_write(struct qemu_paiocb *aiocb) |
| 229 | { |
aliguori | 221f715 | 2009-03-28 17:28:41 +0000 | [diff] [blame^] | 230 | return qemu_paio_submit(aiocb, QEMU_PAIO_WRITE); |
| 231 | } |
| 232 | |
| 233 | int qemu_paio_ioctl(struct qemu_paiocb *aiocb) |
| 234 | { |
| 235 | return qemu_paio_submit(aiocb, QEMU_PAIO_IOCTL); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 236 | } |
| 237 | |
| 238 | ssize_t qemu_paio_return(struct qemu_paiocb *aiocb) |
| 239 | { |
| 240 | ssize_t ret; |
| 241 | |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 242 | mutex_lock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 243 | ret = aiocb->ret; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 244 | mutex_unlock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 245 | |
| 246 | return ret; |
| 247 | } |
| 248 | |
/*
 * Report the error state of @aiocb.
 *
 * Returns the positive error number when the stored result is negative
 * (so EINPROGRESS while pending), and 0 otherwise.
 */
int qemu_paio_error(struct qemu_paiocb *aiocb)
{
    const ssize_t status = qemu_paio_return(aiocb);

    return (status < 0) ? -status : 0;
}
| 260 | |
| 261 | int qemu_paio_cancel(int fd, struct qemu_paiocb *aiocb) |
| 262 | { |
| 263 | int ret; |
| 264 | |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 265 | mutex_lock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 266 | if (!aiocb->active) { |
| 267 | TAILQ_REMOVE(&request_list, aiocb, node); |
| 268 | aiocb->ret = -ECANCELED; |
| 269 | ret = QEMU_PAIO_CANCELED; |
| 270 | } else if (aiocb->ret == -EINPROGRESS) |
| 271 | ret = QEMU_PAIO_NOTCANCELED; |
| 272 | else |
| 273 | ret = QEMU_PAIO_ALLDONE; |
malc | 8653c01 | 2009-02-21 05:48:11 +0000 | [diff] [blame] | 274 | mutex_unlock(&lock); |
aliguori | 3c529d9 | 2008-12-12 16:41:40 +0000 | [diff] [blame] | 275 | |
| 276 | return ret; |
| 277 | } |