blob: a96aabdd875a2dc4e8f2e700743dc4f6368c1e38 [file] [log] [blame]
/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24#ifndef BLOCK_INT_H
25#define BLOCK_INT_H
26
pbrookfaf07962007-11-11 02:51:17 +000027#include "block.h"
Kevin Wolf0e7e1982009-05-18 16:42:10 +020028#include "qemu-option.h"
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +010029#include "qemu-queue.h"
Kevin Wolfda1fa912011-07-14 17:27:13 +020030#include "qemu-coroutine.h"
Christoph Hellwigc488c7f2011-08-25 08:26:10 +020031#include "qemu-timer.h"
Luiz Capitulinob2023812011-09-21 17:16:47 -030032#include "qapi-types.h"
pbrookfaf07962007-11-11 02:51:17 +000033
/*
 * Image flag values.
 * NOTE(review): the values (1, 4) look like individual bits meant to be
 * OR-ed together -- confirm against the image format drivers that use them.
 */
#define BLOCK_FLAG_ENCRYPT      1
#define BLOCK_FLAG_COMPAT6      4

/*
 * I/O limit categories.
 * NOTE(review): presumably the indices of the three-element bps[] and
 * iops[] arrays in BlockIOLimit -- confirm against the throttling code.
 */
#define BLOCK_IO_LIMIT_READ     0
#define BLOCK_IO_LIMIT_WRITE    1
#define BLOCK_IO_LIMIT_TOTAL    2

/*
 * NOTE(review): presumably expressed in nanoseconds (i.e. 100 ms), given the
 * NANOSECONDS_PER_SECOND constant defined next to it -- confirm.
 */
#define BLOCK_IO_SLICE_TIME     100000000
/* Floating-point literal, so arithmetic involving it is done in double. */
#define NANOSECONDS_PER_SECOND  1000000000.0

/*
 * Option name strings.
 * NOTE(review): presumably the names used in the image creation option
 * lists (BlockDriver.create_options) -- confirm against the drivers.
 */
#define BLOCK_OPT_SIZE          "size"
#define BLOCK_OPT_ENCRYPT       "encryption"
#define BLOCK_OPT_COMPAT6       "compat6"
#define BLOCK_OPT_BACKING_FILE  "backing_file"
#define BLOCK_OPT_BACKING_FMT   "backing_fmt"
#define BLOCK_OPT_CLUSTER_SIZE  "cluster_size"
#define BLOCK_OPT_TABLE_SIZE    "table_size"
#define BLOCK_OPT_PREALLOC      "preallocation"
#define BLOCK_OPT_SUBFMT        "subformat"

/*
 * Forward declaration only: the struct body is not defined in this header.
 * The type is used as the element type of BlockDriverState.tracked_requests.
 */
typedef struct BdrvTrackedRequest BdrvTrackedRequest;

/*
 * I/O limits of a block device.
 *
 * Both arrays have three slots.
 * NOTE(review): presumably indexed by BLOCK_IO_LIMIT_READ,
 * BLOCK_IO_LIMIT_WRITE and BLOCK_IO_LIMIT_TOTAL, with bps meaning bytes per
 * second and iops meaning I/O operations per second -- confirm against the
 * throttling code.
 */
typedef struct BlockIOLimit {
    int64_t bps[3];
    int64_t iops[3];
} BlockIOLimit;

/*
 * Byte and operation counters, two slots each.
 * NOTE(review): presumably one slot for reads and one for writes, used as
 * the baseline for I/O limit accounting -- confirm against the throttling
 * code.
 */
typedef struct BlockIOBaseValue {
    uint64_t bytes[2];
    uint64_t ios[2];
} BlockIOBaseValue;

/* Signature of a job cancellation callback taking an opaque pointer. */
typedef void BlockJobCancelFunc(void *opaque);
typedef struct BlockJob BlockJob;

/*
 * Static description of one kind of block job.
 */
typedef struct BlockJobType {
    /** Derived BlockJob struct size */
    size_t instance_size;

    /** String describing the operation, part of query-block-jobs QMP API */
    const char *job_type;

    /** Optional callback for job types that support setting a speed limit */
    int (*set_speed)(BlockJob *job, int64_t value);
} BlockJobType;

79/**
80 * Long-running operation on a BlockDriverState
81 */
82struct BlockJob {
83 const BlockJobType *job_type;
84 BlockDriverState *bs;
85 bool cancelled;
Paolo Bonzini3e914652012-03-30 13:17:11 +020086 bool busy;
Stefan Hajnoczieeec61f2012-01-18 14:40:43 +000087
88 /* These fields are published by the query-block-jobs QMP API */
89 int64_t offset;
90 int64_t len;
91 int64_t speed;
92
93 BlockDriverCompletionFunc *cb;
94 void *opaque;
95};
96
bellardea2384d2004-08-01 21:59:26 +000097struct BlockDriver {
98 const char *format_name;
99 int instance_size;
100 int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename);
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200101 int (*bdrv_probe_device)(const char *filename);
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200102 int (*bdrv_open)(BlockDriverState *bs, int flags);
103 int (*bdrv_file_open)(BlockDriverState *bs, const char *filename, int flags);
ths5fafdf22007-09-16 21:08:06 +0000104 int (*bdrv_read)(BlockDriverState *bs, int64_t sector_num,
bellardea2384d2004-08-01 21:59:26 +0000105 uint8_t *buf, int nb_sectors);
ths5fafdf22007-09-16 21:08:06 +0000106 int (*bdrv_write)(BlockDriverState *bs, int64_t sector_num,
bellardea2384d2004-08-01 21:59:26 +0000107 const uint8_t *buf, int nb_sectors);
bellarde2731ad2004-09-18 19:32:11 +0000108 void (*bdrv_close)(BlockDriverState *bs);
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200109 int (*bdrv_create)(const char *filename, QEMUOptionParameter *options);
bellardea2384d2004-08-01 21:59:26 +0000110 int (*bdrv_set_key)(BlockDriverState *bs, const char *key);
bellard95389c82005-12-18 18:28:15 +0000111 int (*bdrv_make_empty)(BlockDriverState *bs);
bellard83f64092006-08-01 16:21:11 +0000112 /* aio */
aliguorif141eaf2009-04-07 18:43:24 +0000113 BlockDriverAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs,
114 int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
pbrookce1a14d2006-08-07 02:38:06 +0000115 BlockDriverCompletionFunc *cb, void *opaque);
aliguorif141eaf2009-04-07 18:43:24 +0000116 BlockDriverAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs,
117 int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
pbrookce1a14d2006-08-07 02:38:06 +0000118 BlockDriverCompletionFunc *cb, void *opaque);
Christoph Hellwigb2e12bc2009-09-04 19:01:49 +0200119 BlockDriverAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs,
120 BlockDriverCompletionFunc *cb, void *opaque);
Paolo Bonzini4265d622011-10-17 12:32:14 +0200121 BlockDriverAIOCB *(*bdrv_aio_discard)(BlockDriverState *bs,
122 int64_t sector_num, int nb_sectors,
123 BlockDriverCompletionFunc *cb, void *opaque);
bellard83f64092006-08-01 16:21:11 +0000124
Kevin Wolfda1fa912011-07-14 17:27:13 +0200125 int coroutine_fn (*bdrv_co_readv)(BlockDriverState *bs,
126 int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
127 int coroutine_fn (*bdrv_co_writev)(BlockDriverState *bs,
128 int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
Stefan Hajnoczif08f2dd2012-02-07 13:27:25 +0000129 /*
130 * Efficiently zero a region of the disk image. Typically an image format
131 * would use a compact metadata representation to implement this. This
132 * function pointer may be NULL and .bdrv_co_writev() will be called
133 * instead.
134 */
135 int coroutine_fn (*bdrv_co_write_zeroes)(BlockDriverState *bs,
136 int64_t sector_num, int nb_sectors);
Paolo Bonzini4265d622011-10-17 12:32:14 +0200137 int coroutine_fn (*bdrv_co_discard)(BlockDriverState *bs,
138 int64_t sector_num, int nb_sectors);
Stefan Hajnoczi376ae3f2011-11-14 12:44:19 +0000139 int coroutine_fn (*bdrv_co_is_allocated)(BlockDriverState *bs,
140 int64_t sector_num, int nb_sectors, int *pnum);
Kevin Wolfda1fa912011-07-14 17:27:13 +0200141
Kevin Wolfc68b89a2011-11-10 17:25:44 +0100142 /*
Anthony Liguori0f154232011-11-14 15:09:45 -0600143 * Invalidate any cached meta-data.
144 */
145 void (*bdrv_invalidate_cache)(BlockDriverState *bs);
146
147 /*
Kevin Wolfc68b89a2011-11-10 17:25:44 +0100148 * Flushes all data that was already written to the OS all the way down to
149 * the disk (for example raw-posix calls fsync()).
150 */
151 int coroutine_fn (*bdrv_co_flush_to_disk)(BlockDriverState *bs);
152
Kevin Wolfeb489bb2011-11-10 18:10:11 +0100153 /*
154 * Flushes all internal caches to the OS. The data may still sit in a
155 * writeback cache of the host OS, but it will survive a crash of the qemu
156 * process.
157 */
158 int coroutine_fn (*bdrv_co_flush_to_os)(BlockDriverState *bs);
159
bellard83f64092006-08-01 16:21:11 +0000160 const char *protocol_name;
bellard83f64092006-08-01 16:21:11 +0000161 int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset);
162 int64_t (*bdrv_getlength)(BlockDriverState *bs);
Fam Zheng4a1d5e12011-07-12 19:56:39 +0800163 int64_t (*bdrv_get_allocated_file_size)(BlockDriverState *bs);
ths5fafdf22007-09-16 21:08:06 +0000164 int (*bdrv_write_compressed)(BlockDriverState *bs, int64_t sector_num,
bellardfaea38e2006-08-05 21:31:00 +0000165 const uint8_t *buf, int nb_sectors);
166
ths5fafdf22007-09-16 21:08:06 +0000167 int (*bdrv_snapshot_create)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000168 QEMUSnapshotInfo *sn_info);
ths5fafdf22007-09-16 21:08:06 +0000169 int (*bdrv_snapshot_goto)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000170 const char *snapshot_id);
171 int (*bdrv_snapshot_delete)(BlockDriverState *bs, const char *snapshot_id);
ths5fafdf22007-09-16 21:08:06 +0000172 int (*bdrv_snapshot_list)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000173 QEMUSnapshotInfo **psn_info);
edison51ef6722010-09-21 19:58:41 -0700174 int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs,
175 const char *snapshot_name);
bellardfaea38e2006-08-05 21:31:00 +0000176 int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi);
bellard83f64092006-08-01 16:21:11 +0000177
Christoph Hellwig45566e92009-07-10 23:11:57 +0200178 int (*bdrv_save_vmstate)(BlockDriverState *bs, const uint8_t *buf,
179 int64_t pos, int size);
180 int (*bdrv_load_vmstate)(BlockDriverState *bs, uint8_t *buf,
181 int64_t pos, int size);
aliguori178e08a2009-04-05 19:10:55 +0000182
Kevin Wolf756e6732010-01-12 12:55:17 +0100183 int (*bdrv_change_backing_file)(BlockDriverState *bs,
184 const char *backing_file, const char *backing_fmt);
185
bellard19cb3732006-08-19 11:45:59 +0000186 /* removable device specific */
187 int (*bdrv_is_inserted)(BlockDriverState *bs);
188 int (*bdrv_media_changed)(BlockDriverState *bs);
Luiz Capitulinof36f3942012-02-03 16:24:53 -0200189 void (*bdrv_eject)(BlockDriverState *bs, bool eject_flag);
Markus Armbruster025e8492011-09-06 18:58:47 +0200190 void (*bdrv_lock_medium)(BlockDriverState *bs, bool locked);
ths3b46e622007-09-17 08:09:54 +0000191
ths985a03b2007-12-24 16:10:43 +0000192 /* to control generic scsi devices */
193 int (*bdrv_ioctl)(BlockDriverState *bs, unsigned long int req, void *buf);
aliguori221f7152009-03-28 17:28:41 +0000194 BlockDriverAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs,
195 unsigned long int req, void *buf,
196 BlockDriverCompletionFunc *cb, void *opaque);
ths985a03b2007-12-24 16:10:43 +0000197
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200198 /* List of options for creating images, terminated by name == NULL */
199 QEMUOptionParameter *create_options;
200
aliguori5eb45632009-03-28 17:55:10 +0000201
Kevin Wolf9ac228e2010-06-29 12:37:54 +0200202 /*
203 * Returns 0 for completed check, -errno for internal errors.
204 * The check results are stored in result.
205 */
206 int (*bdrv_check)(BlockDriverState* bs, BdrvCheckResult *result);
aliguorie97fc192009-04-21 23:11:50 +0000207
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +0100208 void (*bdrv_debug_event)(BlockDriverState *bs, BlkDebugEvent event);
209
Kevin Wolf336c1c12010-07-28 11:26:29 +0200210 /*
211 * Returns 1 if newly created images are guaranteed to contain only
212 * zeros, 0 otherwise.
213 */
214 int (*bdrv_has_zero_init)(BlockDriverState *bs);
Kevin Wolf12c09b82009-11-30 16:54:15 +0100215
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100216 QLIST_ENTRY(BlockDriver) list;
bellardea2384d2004-08-01 21:59:26 +0000217};
218
Jeff Cody8802d1f2012-02-28 15:54:06 -0500219/*
220 * Note: the function bdrv_append() copies and swaps contents of
221 * BlockDriverStates, so if you add new fields to this struct, please
222 * inspect bdrv_append() to determine if the new fields need to be
223 * copied as well.
224 */
bellardea2384d2004-08-01 21:59:26 +0000225struct BlockDriverState {
bellardd15a7712006-08-06 13:35:09 +0000226 int64_t total_sectors; /* if we are reading a disk image, give its
227 size in sectors */
bellardea2384d2004-08-01 21:59:26 +0000228 int read_only; /* if true, the media is read only */
Naphtali Sprei4dca4b62010-02-14 13:39:18 +0200229 int keep_read_only; /* if true, the media was requested to stay read only */
230 int open_flags; /* flags used to open the file, re-used for re-open */
bellardea2384d2004-08-01 21:59:26 +0000231 int encrypted; /* if true, the media is encrypted */
aliguoric0f4ce72009-03-05 23:01:01 +0000232 int valid_key; /* if true, a valid encryption key has been set */
ths985a03b2007-12-24 16:10:43 +0000233 int sg; /* if true, the device is a /dev/sg* */
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000234 int copy_on_read; /* if true, copy read backing sectors into image
235 note this is a reference count */
bellardea2384d2004-08-01 21:59:26 +0000236
bellard19cb3732006-08-19 11:45:59 +0000237 BlockDriver *drv; /* NULL means no media */
bellardea2384d2004-08-01 21:59:26 +0000238 void *opaque;
239
Markus Armbrusterfa879d62011-08-03 15:07:40 +0200240 void *dev; /* attached device model, if any */
241 /* TODO change to DeviceState when all users are qdevified */
Markus Armbruster0e49de52011-08-03 15:07:41 +0200242 const BlockDevOps *dev_ops;
243 void *dev_opaque;
Markus Armbruster18846de2010-06-29 16:58:30 +0200244
bellardea2384d2004-08-01 21:59:26 +0000245 char filename[1024];
246 char backing_file[1024]; /* if non zero, the image is a diff of
247 this file image */
aliguori5eb45632009-03-28 17:55:10 +0000248 char backing_format[16]; /* if non-zero and backing_file exists */
bellardea2384d2004-08-01 21:59:26 +0000249 int is_temporary;
bellard19cb3732006-08-19 11:45:59 +0000250
bellardea2384d2004-08-01 21:59:26 +0000251 BlockDriverState *backing_hd;
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200252 BlockDriverState *file;
253
Stefan Hajnoczi470c0502012-01-18 14:40:42 +0000254 /* number of in-flight copy-on-read requests */
255 unsigned int copy_on_read_in_flight;
256
Zhi Yong Wu0563e192011-11-03 16:57:25 +0800257 /* the time for latest disk I/O */
258 int64_t slice_time;
259 int64_t slice_start;
260 int64_t slice_end;
261 BlockIOLimit io_limits;
262 BlockIOBaseValue io_base;
263 CoQueue throttled_reqs;
264 QEMUTimer *block_timer;
265 bool io_limits_enabled;
266
thsa36e69d2007-12-02 05:18:19 +0000267 /* I/O stats (display with "info blockstats"). */
Christoph Hellwiga597e792011-08-25 08:26:01 +0200268 uint64_t nr_bytes[BDRV_MAX_IOTYPE];
269 uint64_t nr_ops[BDRV_MAX_IOTYPE];
Christoph Hellwigc488c7f2011-08-25 08:26:10 +0200270 uint64_t total_time_ns[BDRV_MAX_IOTYPE];
Kevin Wolf294cc352010-04-28 14:34:01 +0200271 uint64_t wr_highest_sector;
thsa36e69d2007-12-02 05:18:19 +0000272
aliguori71d07702009-03-03 17:37:16 +0000273 /* Whether the disk can expand beyond total_sectors */
274 int growable;
275
aliguorie268ca52009-04-22 20:20:00 +0000276 /* the memory alignment required for the buffers handled by this driver */
277 int buffer_alignment;
278
Christoph Hellwige900a7b2009-09-04 19:01:15 +0200279 /* do we need to tell the quest if we have a volatile write cache? */
280 int enable_write_cache;
281
bellardea2384d2004-08-01 21:59:26 +0000282 /* NOTE: the following infos are only hints for real hardware
283 drivers. They are not used by the block driver */
bellard46d47672004-11-16 01:45:27 +0000284 int cyls, heads, secs, translation;
Markus Armbrusterabd7f682010-06-02 18:55:17 +0200285 BlockErrorAction on_read_error, on_write_error;
Luiz Capitulinod6bf2792011-10-14 17:11:23 -0300286 bool iostatus_enabled;
Luiz Capitulinob2023812011-09-21 17:16:47 -0300287 BlockDeviceIoStatus iostatus;
bellardea2384d2004-08-01 21:59:26 +0000288 char device_name[32];
Jan Kiszkac6d22832009-11-30 18:21:20 +0100289 unsigned long *dirty_bitmap;
Liran Schouraaa0eb72010-01-26 10:31:48 +0200290 int64_t dirty_count;
Marcelo Tosattidb593f22011-01-26 12:12:34 -0200291 int in_use; /* users other than guest access, eg. block migration */
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +0100292 QTAILQ_ENTRY(BlockDriverState) list;
Stefan Hajnoczidbffbdc2011-11-17 13:40:27 +0000293
294 QLIST_HEAD(, BdrvTrackedRequest) tracked_requests;
Stefan Hajnoczieeec61f2012-01-18 14:40:43 +0000295
296 /* long-running background operation */
297 BlockJob *job;
bellardea2384d2004-08-01 21:59:26 +0000298};
299
/*
 * NOTE(review): presumably writes a temporary file name into the caller's
 * buffer 'filename', with 'size' being the buffer capacity in bytes --
 * confirm against the implementation, which is not visible in this header.
 */
void get_tmp_filename(char *filename, int size);

Zhi Yong Wu0563e192011-11-03 16:57:25 +0800302void bdrv_set_io_limits(BlockDriverState *bs,
303 BlockIOLimit *io_limits);
304
/* Only declared when building for Windows. */
#ifdef _WIN32
int is_windows_drive(const char *filename);
#endif

Stefan Hajnoczieeec61f2012-01-18 14:40:43 +0000309void *block_job_create(const BlockJobType *job_type, BlockDriverState *bs,
310 BlockDriverCompletionFunc *cb, void *opaque);
311void block_job_complete(BlockJob *job, int ret);
312int block_job_set_speed(BlockJob *job, int64_t value);
313void block_job_cancel(BlockJob *job);
314bool block_job_is_cancelled(BlockJob *job);
Paolo Bonzini3e914652012-03-30 13:17:11 +0200315void block_job_cancel_sync(BlockJob *job);
Stefan Hajnoczieeec61f2012-01-18 14:40:43 +0000316
Stefan Hajnoczi4f1043b2012-01-18 14:40:44 +0000317int stream_start(BlockDriverState *bs, BlockDriverState *base,
Marcelo Tosattic8c30802012-01-18 14:40:53 +0000318 const char *base_id, BlockDriverCompletionFunc *cb,
319 void *opaque);
Stefan Hajnoczi4f1043b2012-01-18 14:40:44 +0000320
bellardea2384d2004-08-01 21:59:26 +0000321#endif /* BLOCK_INT_H */