blob: ecc0885fae9b528817b32f13dd07879a1c85b0ab [file] [log] [blame]
/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
blueswir13990d092008-12-05 17:53:21 +000024#include "config-host.h"
pbrookfaf07962007-11-11 02:51:17 +000025#include "qemu-common.h"
Stefan Hajnoczi6d519a52010-05-22 18:15:08 +010026#include "trace.h"
Paolo Bonzini737e1502012-12-17 18:19:44 +010027#include "block/block_int.h"
28#include "block/blockjob.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010029#include "qemu/error-report.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010030#include "qemu/module.h"
Markus Armbrustercc7a8ea2015-03-17 17:22:46 +010031#include "qapi/qmp/qerror.h"
Paolo Bonzini7b1b5d12012-12-17 18:19:43 +010032#include "qapi/qmp/qjson.h"
Markus Armbrusterbfb197e2014-10-07 13:59:11 +020033#include "sysemu/block-backend.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010034#include "sysemu/sysemu.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010035#include "qemu/notify.h"
Paolo Bonzini737e1502012-12-17 18:19:44 +010036#include "block/coroutine.h"
Benoît Canetc13163f2014-01-23 21:31:34 +010037#include "block/qapi.h"
Luiz Capitulinob2023812011-09-21 17:16:47 -030038#include "qmp-commands.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010039#include "qemu/timer.h"
Wenchao Xiaa5ee7bd2014-06-18 08:43:44 +020040#include "qapi-event.h"
Alberto Garciadb628332015-06-08 18:17:45 +020041#include "block/throttle-groups.h"
bellardfc01f7e2003-06-30 10:03:06 +000042
Juan Quintela71e72a12009-07-27 16:12:56 +020043#ifdef CONFIG_BSD
bellard7674e7b2005-04-26 21:59:26 +000044#include <sys/types.h>
45#include <sys/stat.h>
46#include <sys/ioctl.h>
Blue Swirl72cf2d42009-09-12 07:36:22 +000047#include <sys/queue.h>
blueswir1c5e97232009-03-07 20:06:23 +000048#ifndef __DragonFly__
bellard7674e7b2005-04-26 21:59:26 +000049#include <sys/disk.h>
50#endif
blueswir1c5e97232009-03-07 20:06:23 +000051#endif
bellard7674e7b2005-04-26 21:59:26 +000052
aliguori49dc7682009-03-08 16:26:59 +000053#ifdef _WIN32
54#include <windows.h>
55#endif
56
John Snow9bd2b082015-04-17 19:49:57 -040057/**
58 * A BdrvDirtyBitmap can be in three possible states:
59 * (1) successor is NULL and disabled is false: full r/w mode
60 * (2) successor is NULL and disabled is true: read only mode ("disabled")
61 * (3) successor is set: frozen mode.
62 * A frozen bitmap cannot be renamed, deleted, anonymized, cleared, set,
63 * or enabled. A frozen bitmap can only abdicate() or reclaim().
64 */
Fam Zhenge4654d22013-11-13 18:29:43 +080065struct BdrvDirtyBitmap {
John Snowaa0c7ca2015-04-17 19:50:01 -040066 HBitmap *bitmap; /* Dirty sector bitmap implementation */
67 BdrvDirtyBitmap *successor; /* Anonymous child; implies frozen status */
68 char *name; /* Optional non-empty unique ID */
69 int64_t size; /* Size of the bitmap (Number of sectors) */
70 bool disabled; /* Bitmap is read-only */
Fam Zhenge4654d22013-11-13 18:29:43 +080071 QLIST_ENTRY(BdrvDirtyBitmap) list;
72};
73
Stefan Hajnoczi1c9805a2011-10-13 13:08:22 +010074#define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
75
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +010076static QTAILQ_HEAD(, BlockDriverState) bdrv_states =
77 QTAILQ_HEAD_INITIALIZER(bdrv_states);
blueswir17ee930d2008-09-17 19:04:14 +000078
Benoît Canetdc364f42014-01-23 21:31:32 +010079static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
80 QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
81
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +010082static QLIST_HEAD(, BlockDriver) bdrv_drivers =
83 QLIST_HEAD_INITIALIZER(bdrv_drivers);
bellardea2384d2004-08-01 21:59:26 +000084
Kevin Wolff3930ed2015-04-08 13:43:47 +020085static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
86 const char *reference, QDict *options, int flags,
87 BlockDriverState *parent,
Max Reitzce343772015-08-26 19:47:50 +020088 const BdrvChildRole *child_role, Error **errp);
Kevin Wolff3930ed2015-04-08 13:43:47 +020089
John Snowce1ffea2015-04-17 19:50:03 -040090static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs);
Markus Armbrustereb852012009-10-27 18:41:44 +010091/* If non-zero, use only whitelisted block drivers */
92static int use_bdrv_whitelist;
93
Stefan Hajnoczi9e0b22f2010-12-09 11:53:00 +000094#ifdef _WIN32
/*
 * Return non-zero if @filename starts with an ASCII letter immediately
 * followed by a colon (a drive specifier such as "c:"), zero otherwise.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    const int is_lower = (letter >= 'a' && letter <= 'z');
    const int is_upper = (letter >= 'A' && letter <= 'Z');

    if (!is_lower && !is_upper) {
        /* Also covers the empty string, so filename[1] is never read then */
        return 0;
    }
    return filename[1] == ':';
}
101
/*
 * Return 1 if @filename is exactly a drive specifier ("d:") or starts with
 * one of the two device-namespace prefixes tested below; return 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    /* bare drive: letter, colon, end of string */
    if (is_windows_drive_prefix(filename) && !filename[2]) {
        return 1;
    }

    /* device namespace, spelled with backslashes or with forward slashes */
    if (strstart(filename, "\\\\.\\", NULL)) {
        return 1;
    }
    if (strstart(filename, "//./", NULL)) {
        return 1;
    }
    return 0;
}
112#endif
113
Kevin Wolf339064d2013-11-28 10:23:32 +0100114size_t bdrv_opt_mem_align(BlockDriverState *bs)
115{
116 if (!bs || !bs->drv) {
Denis V. Lunev459b4e62015-05-12 17:30:56 +0300117 /* page size or 4k (hdd sector size) should be on the safe side */
118 return MAX(4096, getpagesize());
Kevin Wolf339064d2013-11-28 10:23:32 +0100119 }
120
121 return bs->bl.opt_mem_alignment;
122}
123
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300124size_t bdrv_min_mem_align(BlockDriverState *bs)
125{
126 if (!bs || !bs->drv) {
Denis V. Lunev459b4e62015-05-12 17:30:56 +0300127 /* page size or 4k (hdd sector size) should be on the safe side */
128 return MAX(4096, getpagesize());
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300129 }
130
131 return bs->bl.min_mem_alignment;
132}
133
/*
 * Check if the path starts with "<protocol>:".
 *
 * That is the case when a ':' appears before any path separator.  On
 * Windows, drive and device names are never treated as protocols.
 * Returns 1 if a protocol prefix is present, 0 otherwise.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    static const char stoppers[] = ":/\\";

    if (is_windows_drive(path) ||
        is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    static const char stoppers[] = ":/";
#endif

    /* Index of the first colon or separator, or of the terminating NUL */
    return path[strcspn(path, stoppers)] == ':';
}
151
/*
 * Return 1 if @path is absolute, 0 otherwise.
 *
 * A path is absolute when it starts with '/'.  On Windows a leading
 * backslash, a drive specifier or a device name also counts.
 */
int path_is_absolute(const char *path)
{
    const char first = path[0];

#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (first == '\\') {
        return 1;
    }
#endif
    return first == '/';
}
164
/*
 * Build in @dest the path of @filename as seen from @base_path.
 *
 * If @filename is absolute, just copy it to @dest.  Otherwise take the
 * leading part of @base_path -- everything up to and including its last
 * path separator, or up to and including its "<protocol>:" prefix when no
 * separator follows the prefix -- and append @filename to it.  URLs are
 * supported.
 *
 * @dest_size is the capacity of @dest in bytes; nothing is written when it
 * is not positive.  The copied prefix is clamped to @dest_size - 1 bytes
 * and NUL-terminated; pstrcpy()/pstrcat() are given @dest_size as limit.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *p, *p1;
    int len;
    int skip_to_colon;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /*
     * Only step over a ':' when base_path really starts with
     * "<protocol>:".  A colon that merely occurs inside a file name
     * (e.g. "dir/image:1.qcow2") is part of the name and must not end up
     * in the directory prefix.
     */
    skip_to_colon = path_has_protocol(base_path);
#ifdef _WIN32
    /* Drive and device names keep their colon-terminated prefix */
    skip_to_colon = skip_to_colon || is_windows_drive(base_path) ||
                    is_windows_drive_prefix(base_path);
#endif
    p = base_path;
    if (skip_to_colon) {
        const char *colon = strchr(base_path, ':');
        if (colon) {
            p = colon + 1;
        }
    }

    /* Position just past the last path separator, if there is one */
    p1 = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *p2;
        p2 = strrchr(base_path, '\\');
        if (!p1 || p2 > p1) {
            p1 = p2;
        }
    }
#endif
    if (p1) {
        p1++;
    } else {
        p1 = base_path;
    }

    /* Keep whichever prefix is longer */
    if (p1 > p) {
        p = p1;
    }
    len = p - base_path;
    if (len > dest_size - 1) {
        len = dest_size - 1;
    }
    memcpy(dest, base_path, len);
    dest[len] = '\0';
    pstrcat(dest, dest_size, filename);
}
208
Max Reitz0a828552014-11-26 17:20:25 +0100209void bdrv_get_full_backing_filename_from_filename(const char *backed,
210 const char *backing,
Max Reitz9f074292014-11-26 17:20:26 +0100211 char *dest, size_t sz,
212 Error **errp)
Max Reitz0a828552014-11-26 17:20:25 +0100213{
Max Reitz9f074292014-11-26 17:20:26 +0100214 if (backing[0] == '\0' || path_has_protocol(backing) ||
215 path_is_absolute(backing))
216 {
Max Reitz0a828552014-11-26 17:20:25 +0100217 pstrcpy(dest, sz, backing);
Max Reitz9f074292014-11-26 17:20:26 +0100218 } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
219 error_setg(errp, "Cannot use relative backing file names for '%s'",
220 backed);
Max Reitz0a828552014-11-26 17:20:25 +0100221 } else {
222 path_combine(dest, sz, backed, backing);
223 }
224}
225
Max Reitz9f074292014-11-26 17:20:26 +0100226void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
227 Error **errp)
Paolo Bonzinidc5a1372012-05-08 16:51:50 +0200228{
Max Reitz9f074292014-11-26 17:20:26 +0100229 char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
230
231 bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
232 dest, sz, errp);
Paolo Bonzinidc5a1372012-05-08 16:51:50 +0200233}
234
Stefan Hajnoczi0eb72172015-04-28 14:27:51 +0100235void bdrv_register(BlockDriver *bdrv)
236{
237 bdrv_setup_io_funcs(bdrv);
Christoph Hellwigb2e12bc2009-09-04 19:01:49 +0200238
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100239 QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
bellardea2384d2004-08-01 21:59:26 +0000240}
bellardb3380822004-03-14 21:38:54 +0000241
Markus Armbruster7f06d472014-10-07 13:59:12 +0200242BlockDriverState *bdrv_new_root(void)
bellardfc01f7e2003-06-30 10:03:06 +0000243{
Markus Armbruster7f06d472014-10-07 13:59:12 +0200244 BlockDriverState *bs = bdrv_new();
Markus Armbrustere4e99862014-10-07 13:59:03 +0200245
Markus Armbrustere4e99862014-10-07 13:59:03 +0200246 QTAILQ_INSERT_TAIL(&bdrv_states, bs, device_list);
Markus Armbrustere4e99862014-10-07 13:59:03 +0200247 return bs;
248}
249
250BlockDriverState *bdrv_new(void)
251{
252 BlockDriverState *bs;
253 int i;
254
Markus Armbruster5839e532014-08-19 10:31:08 +0200255 bs = g_new0(BlockDriverState, 1);
Fam Zhenge4654d22013-11-13 18:29:43 +0800256 QLIST_INIT(&bs->dirty_bitmaps);
Fam Zhengfbe40ff2014-05-23 21:29:42 +0800257 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
258 QLIST_INIT(&bs->op_blockers[i]);
259 }
Luiz Capitulino28a72822011-09-26 17:43:50 -0300260 bdrv_iostatus_disable(bs);
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200261 notifier_list_init(&bs->close_notifiers);
Stefan Hajnoczid616b222013-06-24 17:13:10 +0200262 notifier_with_return_list_init(&bs->before_write_notifiers);
Benoît Canetcc0681c2013-09-02 14:14:39 +0200263 qemu_co_queue_init(&bs->throttled_reqs[0]);
264 qemu_co_queue_init(&bs->throttled_reqs[1]);
Fam Zheng9fcb0252013-08-23 09:14:46 +0800265 bs->refcnt = 1;
Stefan Hajnoczidcd04222014-05-08 16:34:37 +0200266 bs->aio_context = qemu_get_aio_context();
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200267
bellardb3380822004-03-14 21:38:54 +0000268 return bs;
269}
270
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200271void bdrv_add_close_notifier(BlockDriverState *bs, Notifier *notify)
272{
273 notifier_list_add(&bs->close_notifiers, notify);
274}
275
bellardea2384d2004-08-01 21:59:26 +0000276BlockDriver *bdrv_find_format(const char *format_name)
277{
278 BlockDriver *drv1;
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100279 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
280 if (!strcmp(drv1->format_name, format_name)) {
bellardea2384d2004-08-01 21:59:26 +0000281 return drv1;
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100282 }
bellardea2384d2004-08-01 21:59:26 +0000283 }
284 return NULL;
285}
286
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800287static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
Markus Armbrustereb852012009-10-27 18:41:44 +0100288{
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800289 static const char *whitelist_rw[] = {
290 CONFIG_BDRV_RW_WHITELIST
291 };
292 static const char *whitelist_ro[] = {
293 CONFIG_BDRV_RO_WHITELIST
Markus Armbrustereb852012009-10-27 18:41:44 +0100294 };
295 const char **p;
296
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800297 if (!whitelist_rw[0] && !whitelist_ro[0]) {
Markus Armbrustereb852012009-10-27 18:41:44 +0100298 return 1; /* no whitelist, anything goes */
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800299 }
Markus Armbrustereb852012009-10-27 18:41:44 +0100300
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800301 for (p = whitelist_rw; *p; p++) {
Markus Armbrustereb852012009-10-27 18:41:44 +0100302 if (!strcmp(drv->format_name, *p)) {
303 return 1;
304 }
305 }
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800306 if (read_only) {
307 for (p = whitelist_ro; *p; p++) {
308 if (!strcmp(drv->format_name, *p)) {
309 return 1;
310 }
311 }
312 }
Markus Armbrustereb852012009-10-27 18:41:44 +0100313 return 0;
314}
315
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800316typedef struct CreateCo {
317 BlockDriver *drv;
318 char *filename;
Chunyan Liu83d05212014-06-05 17:20:51 +0800319 QemuOpts *opts;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800320 int ret;
Max Reitzcc84d902013-09-06 17:14:26 +0200321 Error *err;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800322} CreateCo;
323
324static void coroutine_fn bdrv_create_co_entry(void *opaque)
325{
Max Reitzcc84d902013-09-06 17:14:26 +0200326 Error *local_err = NULL;
327 int ret;
328
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800329 CreateCo *cco = opaque;
330 assert(cco->drv);
331
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800332 ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
Markus Armbruster84d18f02014-01-30 15:07:28 +0100333 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200334 error_propagate(&cco->err, local_err);
335 }
336 cco->ret = ret;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800337}
338
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200339int bdrv_create(BlockDriver *drv, const char* filename,
Chunyan Liu83d05212014-06-05 17:20:51 +0800340 QemuOpts *opts, Error **errp)
bellardea2384d2004-08-01 21:59:26 +0000341{
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800342 int ret;
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200343
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800344 Coroutine *co;
345 CreateCo cco = {
346 .drv = drv,
347 .filename = g_strdup(filename),
Chunyan Liu83d05212014-06-05 17:20:51 +0800348 .opts = opts,
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800349 .ret = NOT_DONE,
Max Reitzcc84d902013-09-06 17:14:26 +0200350 .err = NULL,
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800351 };
352
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800353 if (!drv->bdrv_create) {
Max Reitzcc84d902013-09-06 17:14:26 +0200354 error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
Luiz Capitulino80168bf2012-10-17 16:45:25 -0300355 ret = -ENOTSUP;
356 goto out;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800357 }
358
359 if (qemu_in_coroutine()) {
360 /* Fast-path if already in coroutine context */
361 bdrv_create_co_entry(&cco);
362 } else {
363 co = qemu_coroutine_create(bdrv_create_co_entry);
364 qemu_coroutine_enter(co, &cco);
365 while (cco.ret == NOT_DONE) {
Paolo Bonzinib47ec2c2014-07-07 15:18:01 +0200366 aio_poll(qemu_get_aio_context(), true);
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800367 }
368 }
369
370 ret = cco.ret;
Max Reitzcc84d902013-09-06 17:14:26 +0200371 if (ret < 0) {
Markus Armbruster84d18f02014-01-30 15:07:28 +0100372 if (cco.err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200373 error_propagate(errp, cco.err);
374 } else {
375 error_setg_errno(errp, -ret, "Could not create image");
376 }
377 }
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800378
Luiz Capitulino80168bf2012-10-17 16:45:25 -0300379out:
380 g_free(cco.filename);
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800381 return ret;
bellardea2384d2004-08-01 21:59:26 +0000382}
383
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800384int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200385{
386 BlockDriver *drv;
Max Reitzcc84d902013-09-06 17:14:26 +0200387 Error *local_err = NULL;
388 int ret;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200389
Max Reitzb65a5e12015-02-05 13:58:12 -0500390 drv = bdrv_find_protocol(filename, true, errp);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200391 if (drv == NULL) {
Stefan Hajnoczi16905d72010-11-30 15:14:14 +0000392 return -ENOENT;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200393 }
394
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800395 ret = bdrv_create(drv, filename, opts, &local_err);
Markus Armbruster84d18f02014-01-30 15:07:28 +0100396 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200397 error_propagate(errp, local_err);
398 }
399 return ret;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200400}
401
Ekaterina Tumanova892b7de2015-02-16 12:47:54 +0100402/**
403 * Try to get @bs's logical and physical block size.
404 * On success, store them in @bsz struct and return 0.
405 * On failure return -errno.
406 * @bs must not be empty.
407 */
408int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
409{
410 BlockDriver *drv = bs->drv;
411
412 if (drv && drv->bdrv_probe_blocksizes) {
413 return drv->bdrv_probe_blocksizes(bs, bsz);
414 }
415
416 return -ENOTSUP;
417}
418
419/**
420 * Try to get @bs's geometry (cyls, heads, sectors).
421 * On success, store them in @geo struct and return 0.
422 * On failure return -errno.
423 * @bs must not be empty.
424 */
425int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
426{
427 BlockDriver *drv = bs->drv;
428
429 if (drv && drv->bdrv_probe_geometry) {
430 return drv->bdrv_probe_geometry(bs, geo);
431 }
432
433 return -ENOTSUP;
434}
435
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename receives the name of the new file; @size is its capacity in
 * bytes.  On non-Windows hosts the file is created in $TMPDIR, or in
 * /var/tmp if TMPDIR is not set.
 *
 * Return 0 upon success, otherwise a negative errno value (-EOVERFLOW if
 * the name does not fit in @size bytes).  On Windows the failure value is
 * the negated GetLastError() code instead.
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    const char *tmpdir;
    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }
    if (snprintf(filename, size, "%s/vl.XXXXXX", tmpdir) >= size) {
        return -EOVERFLOW;
    }
    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /*
         * Remember why close() failed before cleaning up: unlink() may
         * itself fail and overwrite errno.
         */
        int saved_errno = errno;

        unlink(filename);
        return -saved_errno;
    }
    return 0;
#endif
}
bellardea2384d2004-08-01 21:59:26 +0000471
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200472/*
473 * Detect host devices. By convention, /dev/cdrom[N] is always
474 * recognized as a host CDROM.
475 */
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200476static BlockDriver *find_hdev_driver(const char *filename)
477{
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200478 int score_max = 0, score;
479 BlockDriver *drv = NULL, *d;
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200480
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100481 QLIST_FOREACH(d, &bdrv_drivers, list) {
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200482 if (d->bdrv_probe_device) {
483 score = d->bdrv_probe_device(filename);
484 if (score > score_max) {
485 score_max = score;
486 drv = d;
487 }
488 }
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200489 }
490
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200491 return drv;
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200492}
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200493
Kevin Wolf98289622013-07-10 15:47:39 +0200494BlockDriver *bdrv_find_protocol(const char *filename,
Max Reitzb65a5e12015-02-05 13:58:12 -0500495 bool allow_protocol_prefix,
496 Error **errp)
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200497{
498 BlockDriver *drv1;
499 char protocol[128];
500 int len;
501 const char *p;
502
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200503 /* TODO Drivers without bdrv_file_open must be specified explicitly */
504
Christoph Hellwig39508e72010-06-23 12:25:17 +0200505 /*
506 * XXX(hch): we really should not let host device detection
507 * override an explicit protocol specification, but moving this
508 * later breaks access to device names with colons in them.
509 * Thanks to the brain-dead persistent naming schemes on udev-
510 * based Linux systems those actually are quite common.
511 */
512 drv1 = find_hdev_driver(filename);
513 if (drv1) {
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200514 return drv1;
515 }
Christoph Hellwig39508e72010-06-23 12:25:17 +0200516
Kevin Wolf98289622013-07-10 15:47:39 +0200517 if (!path_has_protocol(filename) || !allow_protocol_prefix) {
Max Reitzef810432014-12-02 18:32:42 +0100518 return &bdrv_file;
Christoph Hellwig39508e72010-06-23 12:25:17 +0200519 }
Kevin Wolf98289622013-07-10 15:47:39 +0200520
Stefan Hajnoczi9e0b22f2010-12-09 11:53:00 +0000521 p = strchr(filename, ':');
522 assert(p != NULL);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200523 len = p - filename;
524 if (len > sizeof(protocol) - 1)
525 len = sizeof(protocol) - 1;
526 memcpy(protocol, filename, len);
527 protocol[len] = '\0';
528 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
529 if (drv1->protocol_name &&
530 !strcmp(drv1->protocol_name, protocol)) {
531 return drv1;
532 }
533 }
Max Reitzb65a5e12015-02-05 13:58:12 -0500534
535 error_setg(errp, "Unknown protocol '%s'", protocol);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200536 return NULL;
537}
538
Markus Armbrusterc6684242014-11-20 16:27:10 +0100539/*
540 * Guess image format by probing its contents.
541 * This is not a good idea when your image is raw (CVE-2008-2004), but
542 * we do it anyway for backward compatibility.
543 *
544 * @buf contains the image's first @buf_size bytes.
Kevin Wolf7cddd372014-11-20 16:27:11 +0100545 * @buf_size is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
546 * but can be smaller if the image file is smaller)
Markus Armbrusterc6684242014-11-20 16:27:10 +0100547 * @filename is its filename.
548 *
549 * For all block drivers, call the bdrv_probe() method to get its
550 * probing score.
551 * Return the first block driver with the highest probing score.
552 */
Kevin Wolf38f3ef52014-11-20 16:27:12 +0100553BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
554 const char *filename)
Markus Armbrusterc6684242014-11-20 16:27:10 +0100555{
556 int score_max = 0, score;
557 BlockDriver *drv = NULL, *d;
558
559 QLIST_FOREACH(d, &bdrv_drivers, list) {
560 if (d->bdrv_probe) {
561 score = d->bdrv_probe(buf, buf_size, filename);
562 if (score > score_max) {
563 score_max = score;
564 drv = d;
565 }
566 }
567 }
568
569 return drv;
570}
571
Kevin Wolff500a6d2012-11-12 17:35:27 +0100572static int find_image_format(BlockDriverState *bs, const char *filename,
Max Reitz34b5d2c2013-09-05 14:45:29 +0200573 BlockDriver **pdrv, Error **errp)
bellardea2384d2004-08-01 21:59:26 +0000574{
Markus Armbrusterc6684242014-11-20 16:27:10 +0100575 BlockDriver *drv;
Kevin Wolf7cddd372014-11-20 16:27:11 +0100576 uint8_t buf[BLOCK_PROBE_BUF_SIZE];
Kevin Wolff500a6d2012-11-12 17:35:27 +0100577 int ret = 0;
Nicholas Bellingerf8ea0b02010-05-17 09:45:57 -0700578
Kevin Wolf08a00552010-06-01 18:37:31 +0200579 /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300580 if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
Max Reitzef810432014-12-02 18:32:42 +0100581 *pdrv = &bdrv_raw;
Stefan Weilc98ac352010-07-21 21:51:51 +0200582 return ret;
Nicholas A. Bellinger1a396852010-05-27 08:56:28 -0700583 }
Nicholas Bellingerf8ea0b02010-05-17 09:45:57 -0700584
bellard83f64092006-08-01 16:21:11 +0000585 ret = bdrv_pread(bs, 0, buf, sizeof(buf));
bellard83f64092006-08-01 16:21:11 +0000586 if (ret < 0) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200587 error_setg_errno(errp, -ret, "Could not read image for determining its "
588 "format");
Stefan Weilc98ac352010-07-21 21:51:51 +0200589 *pdrv = NULL;
590 return ret;
bellard83f64092006-08-01 16:21:11 +0000591 }
592
Markus Armbrusterc6684242014-11-20 16:27:10 +0100593 drv = bdrv_probe_all(buf, ret, filename);
Stefan Weilc98ac352010-07-21 21:51:51 +0200594 if (!drv) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200595 error_setg(errp, "Could not determine image format: No compatible "
596 "driver found");
Stefan Weilc98ac352010-07-21 21:51:51 +0200597 ret = -ENOENT;
598 }
599 *pdrv = drv;
600 return ret;
bellardea2384d2004-08-01 21:59:26 +0000601}
602
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100603/**
604 * Set the current 'total_sectors' value
Markus Armbruster65a9bb22014-06-26 13:23:17 +0200605 * Return 0 on success, -errno on error.
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100606 */
607static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
608{
609 BlockDriver *drv = bs->drv;
610
Nicholas Bellinger396759a2010-05-17 09:46:04 -0700611 /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300612 if (bdrv_is_sg(bs))
Nicholas Bellinger396759a2010-05-17 09:46:04 -0700613 return 0;
614
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100615 /* query actual device if possible, otherwise just trust the hint */
616 if (drv->bdrv_getlength) {
617 int64_t length = drv->bdrv_getlength(bs);
618 if (length < 0) {
619 return length;
620 }
Fam Zheng7e382002013-11-06 19:48:06 +0800621 hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100622 }
623
624 bs->total_sectors = hint;
625 return 0;
626}
627
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100628/**
Paolo Bonzini9e8f1832013-02-08 14:06:11 +0100629 * Set open flags for a given discard mode
630 *
631 * Return 0 on success, -1 if the discard mode was invalid.
632 */
633int bdrv_parse_discard_flags(const char *mode, int *flags)
634{
635 *flags &= ~BDRV_O_UNMAP;
636
637 if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
638 /* do nothing */
639 } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
640 *flags |= BDRV_O_UNMAP;
641 } else {
642 return -1;
643 }
644
645 return 0;
646}
647
648/**
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100649 * Set open flags for a given cache mode
650 *
651 * Return 0 on success, -1 if the cache mode was invalid.
652 */
653int bdrv_parse_cache_flags(const char *mode, int *flags)
654{
655 *flags &= ~BDRV_O_CACHE_MASK;
656
657 if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
658 *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
Stefan Hajnoczi92196b22011-08-04 12:26:52 +0100659 } else if (!strcmp(mode, "directsync")) {
660 *flags |= BDRV_O_NOCACHE;
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100661 } else if (!strcmp(mode, "writeback")) {
662 *flags |= BDRV_O_CACHE_WB;
663 } else if (!strcmp(mode, "unsafe")) {
664 *flags |= BDRV_O_CACHE_WB;
665 *flags |= BDRV_O_NO_FLUSH;
666 } else if (!strcmp(mode, "writethrough")) {
667 /* this is the default */
668 } else {
669 return -1;
670 }
671
672 return 0;
673}
674
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200675/*
Kevin Wolfb1e6fc02014-05-06 12:11:42 +0200676 * Returns the flags that a temporary snapshot should get, based on the
677 * originally requested flags (the originally requested image will have flags
678 * like a backing file)
679 */
680static int bdrv_temp_snapshot_flags(int flags)
681{
682 return (flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
683}
684
685/*
Kevin Wolff3930ed2015-04-08 13:43:47 +0200686 * Returns the flags that bs->file should get if a protocol driver is expected,
687 * based on the given flags for the parent BDS
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200688 */
689static int bdrv_inherited_flags(int flags)
690{
691 /* Enable protocol handling, disable format probing for bs->file */
692 flags |= BDRV_O_PROTOCOL;
693
694 /* Our block drivers take care to send flushes and respect unmap policy,
695 * so we can enable both unconditionally on lower layers. */
696 flags |= BDRV_O_CACHE_WB | BDRV_O_UNMAP;
697
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200698 /* Clear flags that only apply to the top layer */
Kevin Wolf5669b442014-04-11 21:36:45 +0200699 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200700
701 return flags;
702}
703
Kevin Wolff3930ed2015-04-08 13:43:47 +0200704const BdrvChildRole child_file = {
705 .inherit_flags = bdrv_inherited_flags,
706};
707
708/*
709 * Returns the flags that bs->file should get if the use of formats (and not
710 * only protocols) is permitted for it, based on the given flags for the parent
711 * BDS
712 */
713static int bdrv_inherited_fmt_flags(int parent_flags)
714{
715 int flags = child_file.inherit_flags(parent_flags);
716 return flags & ~BDRV_O_PROTOCOL;
717}
718
719const BdrvChildRole child_format = {
720 .inherit_flags = bdrv_inherited_fmt_flags,
721};
722
Kevin Wolf317fc442014-04-25 13:27:34 +0200723/*
Kevin Wolf760e0062015-06-17 14:55:21 +0200724 * Returns the flags that bs->backing should get, based on the given flags
Kevin Wolf317fc442014-04-25 13:27:34 +0200725 * for the parent BDS
726 */
727static int bdrv_backing_flags(int flags)
728{
729 /* backing files always opened read-only */
730 flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
731
732 /* snapshot=on is handled on the top layer */
Kevin Wolf8bfea152014-04-11 19:16:36 +0200733 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
Kevin Wolf317fc442014-04-25 13:27:34 +0200734
735 return flags;
736}
737
Kevin Wolff3930ed2015-04-08 13:43:47 +0200738static const BdrvChildRole child_backing = {
739 .inherit_flags = bdrv_backing_flags,
740};
741
Kevin Wolf7b272452012-11-12 17:05:39 +0100742static int bdrv_open_flags(BlockDriverState *bs, int flags)
743{
744 int open_flags = flags | BDRV_O_CACHE_WB;
745
746 /*
747 * Clear flags that are internal to the block layer before opening the
748 * image.
749 */
Kevin Wolf20cca272014-06-04 14:33:27 +0200750 open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
Kevin Wolf7b272452012-11-12 17:05:39 +0100751
752 /*
753 * Snapshots should be writable.
754 */
Kevin Wolf8bfea152014-04-11 19:16:36 +0200755 if (flags & BDRV_O_TEMPORARY) {
Kevin Wolf7b272452012-11-12 17:05:39 +0100756 open_flags |= BDRV_O_RDWR;
757 }
758
759 return open_flags;
760}
761
Kevin Wolf636ea372014-01-24 14:11:52 +0100762static void bdrv_assign_node_name(BlockDriverState *bs,
763 const char *node_name,
764 Error **errp)
Benoît Canet6913c0c2014-01-23 21:31:33 +0100765{
766 if (!node_name) {
Kevin Wolf636ea372014-01-24 14:11:52 +0100767 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100768 }
769
Kevin Wolf9aebf3b2014-09-25 09:54:02 +0200770 /* Check for empty string or invalid characters */
Markus Armbrusterf5bebbb2014-09-30 13:59:30 +0200771 if (!id_wellformed(node_name)) {
Kevin Wolf9aebf3b2014-09-25 09:54:02 +0200772 error_setg(errp, "Invalid node name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100773 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100774 }
775
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100776 /* takes care of avoiding namespaces collisions */
Markus Armbruster7f06d472014-10-07 13:59:12 +0200777 if (blk_by_name(node_name)) {
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100778 error_setg(errp, "node-name=%s is conflicting with a device id",
779 node_name);
Kevin Wolf636ea372014-01-24 14:11:52 +0100780 return;
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100781 }
782
Benoît Canet6913c0c2014-01-23 21:31:33 +0100783 /* takes care of avoiding duplicates node names */
784 if (bdrv_find_node(node_name)) {
785 error_setg(errp, "Duplicate node name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100786 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100787 }
788
789 /* copy node name into the bs and insert it into the graph list */
790 pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
791 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
Benoît Canet6913c0c2014-01-23 21:31:33 +0100792}
793
Kevin Wolf18edf282015-04-07 17:12:56 +0200794static QemuOptsList bdrv_runtime_opts = {
795 .name = "bdrv_common",
796 .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
797 .desc = {
798 {
799 .name = "node-name",
800 .type = QEMU_OPT_STRING,
801 .help = "Node name of the block device node",
802 },
803 { /* end of list */ }
804 },
805};
806
Kevin Wolfb6ce07a2010-04-12 16:37:13 +0200807/*
Kevin Wolf57915332010-04-14 15:24:50 +0200808 * Common part for opening disk images and files
Kevin Wolfb6ad4912013-03-15 10:35:04 +0100809 *
810 * Removes all processed options from *options.
Kevin Wolf57915332010-04-14 15:24:50 +0200811 */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +0200812static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
Max Reitz34b5d2c2013-09-05 14:45:29 +0200813 QDict *options, int flags, BlockDriver *drv, Error **errp)
Kevin Wolf57915332010-04-14 15:24:50 +0200814{
815 int ret, open_flags;
Kevin Wolf035fccd2013-04-09 14:34:19 +0200816 const char *filename;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100817 const char *node_name = NULL;
Kevin Wolf18edf282015-04-07 17:12:56 +0200818 QemuOpts *opts;
Max Reitz34b5d2c2013-09-05 14:45:29 +0200819 Error *local_err = NULL;
Kevin Wolf57915332010-04-14 15:24:50 +0200820
821 assert(drv != NULL);
Paolo Bonzini64058752012-05-08 16:51:49 +0200822 assert(bs->file == NULL);
Kevin Wolf707ff822013-03-06 12:20:31 +0100823 assert(options != NULL && bs->options != options);
Kevin Wolf57915332010-04-14 15:24:50 +0200824
Kevin Wolf45673672013-04-22 17:48:40 +0200825 if (file != NULL) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +0200826 filename = file->bs->filename;
Kevin Wolf45673672013-04-22 17:48:40 +0200827 } else {
828 filename = qdict_get_try_str(options, "filename");
829 }
830
Kevin Wolf765003d2014-02-03 14:49:42 +0100831 if (drv->bdrv_needs_filename && !filename) {
832 error_setg(errp, "The '%s' block driver requires a file name",
833 drv->format_name);
834 return -EINVAL;
835 }
836
Kevin Wolf45673672013-04-22 17:48:40 +0200837 trace_bdrv_open_common(bs, filename ?: "", flags, drv->format_name);
Stefan Hajnoczi28dcee12011-09-22 20:14:12 +0100838
Kevin Wolf18edf282015-04-07 17:12:56 +0200839 opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
840 qemu_opts_absorb_qdict(opts, options, &local_err);
841 if (local_err) {
842 error_propagate(errp, local_err);
843 ret = -EINVAL;
844 goto fail_opts;
845 }
846
847 node_name = qemu_opt_get(opts, "node-name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100848 bdrv_assign_node_name(bs, node_name, &local_err);
Markus Armbruster0fb63952014-04-25 16:50:31 +0200849 if (local_err) {
Kevin Wolf636ea372014-01-24 14:11:52 +0100850 error_propagate(errp, local_err);
Kevin Wolf18edf282015-04-07 17:12:56 +0200851 ret = -EINVAL;
852 goto fail_opts;
Kevin Wolf5d186eb2013-03-27 17:28:18 +0100853 }
854
Paolo Bonzini1b7fd722011-11-29 11:35:47 +0100855 bs->guest_block_size = 512;
Paolo Bonzinic25f53b2011-11-29 12:42:20 +0100856 bs->request_alignment = 512;
Asias He0d51b4d2013-08-22 15:24:14 +0800857 bs->zero_beyond_eof = true;
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800858 open_flags = bdrv_open_flags(bs, flags);
859 bs->read_only = !(open_flags & BDRV_O_RDWR);
860
861 if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
Kevin Wolf8f94a6e2013-10-10 11:45:55 +0200862 error_setg(errp,
863 !bs->read_only && bdrv_is_whitelisted(drv, true)
864 ? "Driver '%s' can only be used for read-only devices"
865 : "Driver '%s' is not whitelisted",
866 drv->format_name);
Kevin Wolf18edf282015-04-07 17:12:56 +0200867 ret = -ENOTSUP;
868 goto fail_opts;
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800869 }
Kevin Wolf57915332010-04-14 15:24:50 +0200870
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000871 assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
Kevin Wolf0ebd24e2013-09-19 15:12:18 +0200872 if (flags & BDRV_O_COPY_ON_READ) {
873 if (!bs->read_only) {
874 bdrv_enable_copy_on_read(bs);
875 } else {
876 error_setg(errp, "Can't use copy-on-read on read-only device");
Kevin Wolf18edf282015-04-07 17:12:56 +0200877 ret = -EINVAL;
878 goto fail_opts;
Kevin Wolf0ebd24e2013-09-19 15:12:18 +0200879 }
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000880 }
881
Kevin Wolfc2ad1b02013-03-18 16:40:51 +0100882 if (filename != NULL) {
883 pstrcpy(bs->filename, sizeof(bs->filename), filename);
884 } else {
885 bs->filename[0] = '\0';
886 }
Max Reitz91af7012014-07-18 20:24:56 +0200887 pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
Kevin Wolf57915332010-04-14 15:24:50 +0200888
Kevin Wolf57915332010-04-14 15:24:50 +0200889 bs->drv = drv;
Anthony Liguori7267c092011-08-20 22:09:37 -0500890 bs->opaque = g_malloc0(drv->instance_size);
Kevin Wolf57915332010-04-14 15:24:50 +0200891
Stefan Hajnoczi03f541b2011-10-27 10:54:28 +0100892 bs->enable_write_cache = !!(flags & BDRV_O_CACHE_WB);
Stefan Hajnoczie7c63792011-10-27 10:54:27 +0100893
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200894 /* Open the image, either directly or using a protocol */
895 if (drv->bdrv_file_open) {
Kevin Wolf5d186eb2013-03-27 17:28:18 +0100896 assert(file == NULL);
Benoît Canet030be322013-09-24 17:07:04 +0200897 assert(!drv->bdrv_needs_filename || filename != NULL);
Max Reitz34b5d2c2013-09-05 14:45:29 +0200898 ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
Kevin Wolff500a6d2012-11-12 17:35:27 +0100899 } else {
Kevin Wolf2af5ef72013-04-09 13:19:18 +0200900 if (file == NULL) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200901 error_setg(errp, "Can't use '%s' as a block driver for the "
902 "protocol level", drv->format_name);
Kevin Wolf2af5ef72013-04-09 13:19:18 +0200903 ret = -EINVAL;
904 goto free_and_fail;
905 }
Kevin Wolff500a6d2012-11-12 17:35:27 +0100906 bs->file = file;
Max Reitz34b5d2c2013-09-05 14:45:29 +0200907 ret = drv->bdrv_open(bs, options, open_flags, &local_err);
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200908 }
909
Kevin Wolf57915332010-04-14 15:24:50 +0200910 if (ret < 0) {
Markus Armbruster84d18f02014-01-30 15:07:28 +0100911 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200912 error_propagate(errp, local_err);
Dunrong Huang2fa9aa52013-09-24 18:14:01 +0800913 } else if (bs->filename[0]) {
914 error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
Max Reitz34b5d2c2013-09-05 14:45:29 +0200915 } else {
916 error_setg_errno(errp, -ret, "Could not open image");
917 }
Kevin Wolf57915332010-04-14 15:24:50 +0200918 goto free_and_fail;
919 }
920
Markus Armbrustera1f688f2015-03-13 21:09:40 +0100921 if (bs->encrypted) {
922 error_report("Encrypted images are deprecated");
923 error_printf("Support for them will be removed in a future release.\n"
924 "You can use 'qemu-img convert' to convert your image"
925 " to an unencrypted one.\n");
926 }
927
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100928 ret = refresh_total_sectors(bs, bs->total_sectors);
929 if (ret < 0) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200930 error_setg_errno(errp, -ret, "Could not refresh total sector count");
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100931 goto free_and_fail;
Kevin Wolf57915332010-04-14 15:24:50 +0200932 }
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100933
Kevin Wolf3baca892014-07-16 17:48:16 +0200934 bdrv_refresh_limits(bs, &local_err);
935 if (local_err) {
936 error_propagate(errp, local_err);
937 ret = -EINVAL;
938 goto free_and_fail;
939 }
940
Paolo Bonzinic25f53b2011-11-29 12:42:20 +0100941 assert(bdrv_opt_mem_align(bs) != 0);
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300942 assert(bdrv_min_mem_align(bs) != 0);
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300943 assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
Kevin Wolf18edf282015-04-07 17:12:56 +0200944
945 qemu_opts_del(opts);
Kevin Wolf57915332010-04-14 15:24:50 +0200946 return 0;
947
948free_and_fail:
Kevin Wolff500a6d2012-11-12 17:35:27 +0100949 bs->file = NULL;
Anthony Liguori7267c092011-08-20 22:09:37 -0500950 g_free(bs->opaque);
Kevin Wolf57915332010-04-14 15:24:50 +0200951 bs->opaque = NULL;
952 bs->drv = NULL;
Kevin Wolf18edf282015-04-07 17:12:56 +0200953fail_opts:
954 qemu_opts_del(opts);
Kevin Wolf57915332010-04-14 15:24:50 +0200955 return ret;
956}
957
Kevin Wolf5e5c4f62014-05-26 11:45:08 +0200958static QDict *parse_json_filename(const char *filename, Error **errp)
959{
960 QObject *options_obj;
961 QDict *options;
962 int ret;
963
964 ret = strstart(filename, "json:", &filename);
965 assert(ret);
966
967 options_obj = qobject_from_json(filename);
968 if (!options_obj) {
969 error_setg(errp, "Could not parse the JSON options");
970 return NULL;
971 }
972
973 if (qobject_type(options_obj) != QTYPE_QDICT) {
974 qobject_decref(options_obj);
975 error_setg(errp, "Invalid JSON object given");
976 return NULL;
977 }
978
979 options = qobject_to_qdict(options_obj);
980 qdict_flatten(options);
981
982 return options;
983}
984
Kevin Wolf57915332010-04-14 15:24:50 +0200985/*
Kevin Wolff54120f2014-05-26 11:09:59 +0200986 * Fills in default options for opening images and converts the legacy
987 * filename/flags pair to option QDict entries.
Max Reitz53a29512015-03-19 14:53:16 -0400988 * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
989 * block driver has been specified explicitly.
Kevin Wolff54120f2014-05-26 11:09:59 +0200990 */
Max Reitz53a29512015-03-19 14:53:16 -0400991static int bdrv_fill_options(QDict **options, const char **pfilename,
Max Reitz053e1572015-08-26 19:47:51 +0200992 int *flags, Error **errp)
Kevin Wolff54120f2014-05-26 11:09:59 +0200993{
Kevin Wolf5e5c4f62014-05-26 11:45:08 +0200994 const char *filename = *pfilename;
Kevin Wolff54120f2014-05-26 11:09:59 +0200995 const char *drvname;
Max Reitz53a29512015-03-19 14:53:16 -0400996 bool protocol = *flags & BDRV_O_PROTOCOL;
Kevin Wolff54120f2014-05-26 11:09:59 +0200997 bool parse_filename = false;
Max Reitz053e1572015-08-26 19:47:51 +0200998 BlockDriver *drv = NULL;
Kevin Wolff54120f2014-05-26 11:09:59 +0200999 Error *local_err = NULL;
Kevin Wolff54120f2014-05-26 11:09:59 +02001000
Kevin Wolf5e5c4f62014-05-26 11:45:08 +02001001 /* Parse json: pseudo-protocol */
1002 if (filename && g_str_has_prefix(filename, "json:")) {
1003 QDict *json_options = parse_json_filename(filename, &local_err);
1004 if (local_err) {
1005 error_propagate(errp, local_err);
1006 return -EINVAL;
1007 }
1008
1009 /* Options given in the filename have lower priority than options
1010 * specified directly */
1011 qdict_join(*options, json_options, false);
1012 QDECREF(json_options);
1013 *pfilename = filename = NULL;
1014 }
1015
Max Reitz53a29512015-03-19 14:53:16 -04001016 drvname = qdict_get_try_str(*options, "driver");
Max Reitz053e1572015-08-26 19:47:51 +02001017 if (drvname) {
1018 drv = bdrv_find_format(drvname);
1019 if (!drv) {
1020 error_setg(errp, "Unknown driver '%s'", drvname);
1021 return -ENOENT;
1022 }
1023 /* If the user has explicitly specified the driver, this choice should
1024 * override the BDRV_O_PROTOCOL flag */
1025 protocol = drv->bdrv_file_open;
Max Reitz53a29512015-03-19 14:53:16 -04001026 }
1027
1028 if (protocol) {
1029 *flags |= BDRV_O_PROTOCOL;
1030 } else {
1031 *flags &= ~BDRV_O_PROTOCOL;
1032 }
1033
Kevin Wolff54120f2014-05-26 11:09:59 +02001034 /* Fetch the file name from the options QDict if necessary */
Kevin Wolf17b005f2014-05-27 10:50:29 +02001035 if (protocol && filename) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001036 if (!qdict_haskey(*options, "filename")) {
1037 qdict_put(*options, "filename", qstring_from_str(filename));
1038 parse_filename = true;
1039 } else {
1040 error_setg(errp, "Can't specify 'file' and 'filename' options at "
1041 "the same time");
1042 return -EINVAL;
1043 }
1044 }
1045
1046 /* Find the right block driver */
1047 filename = qdict_get_try_str(*options, "filename");
Kevin Wolff54120f2014-05-26 11:09:59 +02001048
Max Reitz053e1572015-08-26 19:47:51 +02001049 if (!drvname && protocol) {
1050 if (filename) {
1051 drv = bdrv_find_protocol(filename, parse_filename, errp);
1052 if (!drv) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001053 return -EINVAL;
1054 }
Max Reitz053e1572015-08-26 19:47:51 +02001055
1056 drvname = drv->format_name;
1057 qdict_put(*options, "driver", qstring_from_str(drvname));
1058 } else {
1059 error_setg(errp, "Must specify either driver or file");
1060 return -EINVAL;
Kevin Wolff54120f2014-05-26 11:09:59 +02001061 }
1062 }
1063
Kevin Wolf17b005f2014-05-27 10:50:29 +02001064 assert(drv || !protocol);
Kevin Wolff54120f2014-05-26 11:09:59 +02001065
1066 /* Driver-specific filename parsing */
Kevin Wolf17b005f2014-05-27 10:50:29 +02001067 if (drv && drv->bdrv_parse_filename && parse_filename) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001068 drv->bdrv_parse_filename(filename, *options, &local_err);
1069 if (local_err) {
1070 error_propagate(errp, local_err);
1071 return -EINVAL;
1072 }
1073
1074 if (!drv->bdrv_needs_filename) {
1075 qdict_del(*options, "filename");
1076 }
1077 }
1078
1079 return 0;
1080}
1081
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001082static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1083 BlockDriverState *child_bs,
1084 const BdrvChildRole *child_role)
Kevin Wolfdf581792015-06-15 11:53:47 +02001085{
1086 BdrvChild *child = g_new(BdrvChild, 1);
1087 *child = (BdrvChild) {
1088 .bs = child_bs,
1089 .role = child_role,
1090 };
1091
1092 QLIST_INSERT_HEAD(&parent_bs->children, child, next);
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001093
1094 return child;
Kevin Wolfdf581792015-06-15 11:53:47 +02001095}
1096
Kevin Wolf33a60402015-06-15 13:51:04 +02001097static void bdrv_detach_child(BdrvChild *child)
1098{
1099 QLIST_REMOVE(child, next);
1100 g_free(child);
1101}
1102
1103void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
1104{
1105 BlockDriverState *child_bs = child->bs;
1106
1107 if (child->bs->inherits_from == parent) {
1108 child->bs->inherits_from = NULL;
1109 }
1110
1111 bdrv_detach_child(child);
1112 bdrv_unref(child_bs);
1113}
1114
Fam Zheng8d24cce2014-05-23 21:29:45 +08001115void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
1116{
1117
Kevin Wolf760e0062015-06-17 14:55:21 +02001118 if (bs->backing) {
Fam Zheng826b6ca2014-05-23 21:29:47 +08001119 assert(bs->backing_blocker);
Kevin Wolf760e0062015-06-17 14:55:21 +02001120 bdrv_op_unblock_all(bs->backing->bs, bs->backing_blocker);
1121 bdrv_detach_child(bs->backing);
Fam Zheng826b6ca2014-05-23 21:29:47 +08001122 } else if (backing_hd) {
1123 error_setg(&bs->backing_blocker,
Alberto Garcia81e5f782015-04-08 12:29:19 +03001124 "node is used as backing hd of '%s'",
1125 bdrv_get_device_or_node_name(bs));
Fam Zheng826b6ca2014-05-23 21:29:47 +08001126 }
1127
Fam Zheng8d24cce2014-05-23 21:29:45 +08001128 if (!backing_hd) {
Fam Zheng826b6ca2014-05-23 21:29:47 +08001129 error_free(bs->backing_blocker);
1130 bs->backing_blocker = NULL;
Kevin Wolf760e0062015-06-17 14:55:21 +02001131 bs->backing = NULL;
Fam Zheng8d24cce2014-05-23 21:29:45 +08001132 goto out;
1133 }
Kevin Wolf760e0062015-06-17 14:55:21 +02001134 bs->backing = bdrv_attach_child(bs, backing_hd, &child_backing);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001135 bs->open_flags &= ~BDRV_O_NO_BACKING;
1136 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
1137 pstrcpy(bs->backing_format, sizeof(bs->backing_format),
1138 backing_hd->drv ? backing_hd->drv->format_name : "");
Fam Zheng826b6ca2014-05-23 21:29:47 +08001139
Kevin Wolf760e0062015-06-17 14:55:21 +02001140 bdrv_op_block_all(backing_hd, bs->backing_blocker);
Fam Zheng826b6ca2014-05-23 21:29:47 +08001141 /* Otherwise we won't be able to commit due to check in bdrv_commit */
Kevin Wolf760e0062015-06-17 14:55:21 +02001142 bdrv_op_unblock(backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
Fam Zheng826b6ca2014-05-23 21:29:47 +08001143 bs->backing_blocker);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001144out:
Kevin Wolf3baca892014-07-16 17:48:16 +02001145 bdrv_refresh_limits(bs, NULL);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001146}
1147
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001148/*
1149 * Opens the backing file for a BlockDriverState if not yet open
1150 *
1151 * options is a QDict of options to pass to the block drivers, or NULL for an
1152 * empty set of options. The reference to the QDict is transferred to this
1153 * function (even on failure), so if the caller intends to reuse the dictionary,
1154 * it needs to use QINCREF() before calling bdrv_file_open.
1155 */
Max Reitz34b5d2c2013-09-05 14:45:29 +02001156int bdrv_open_backing_file(BlockDriverState *bs, QDict *options, Error **errp)
Paolo Bonzini9156df12012-10-18 16:49:17 +02001157{
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001158 char *backing_filename = g_malloc0(PATH_MAX);
Kevin Wolf317fc442014-04-25 13:27:34 +02001159 int ret = 0;
Fam Zheng8d24cce2014-05-23 21:29:45 +08001160 BlockDriverState *backing_hd;
Max Reitz34b5d2c2013-09-05 14:45:29 +02001161 Error *local_err = NULL;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001162
Kevin Wolf760e0062015-06-17 14:55:21 +02001163 if (bs->backing != NULL) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001164 QDECREF(options);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001165 goto free_exit;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001166 }
1167
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001168 /* NULL means an empty set of options */
1169 if (options == NULL) {
1170 options = qdict_new();
1171 }
1172
Paolo Bonzini9156df12012-10-18 16:49:17 +02001173 bs->open_flags &= ~BDRV_O_NO_BACKING;
Kevin Wolf1cb6f502013-04-12 20:27:07 +02001174 if (qdict_haskey(options, "file.filename")) {
1175 backing_filename[0] = '\0';
1176 } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001177 QDECREF(options);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001178 goto free_exit;
Fam Zhengdbecebd2013-09-22 20:05:06 +08001179 } else {
Max Reitz9f074292014-11-26 17:20:26 +01001180 bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
1181 &local_err);
1182 if (local_err) {
1183 ret = -EINVAL;
1184 error_propagate(errp, local_err);
1185 QDECREF(options);
1186 goto free_exit;
1187 }
Paolo Bonzini9156df12012-10-18 16:49:17 +02001188 }
1189
Kevin Wolf8ee79e72014-06-04 15:09:35 +02001190 if (!bs->drv || !bs->drv->supports_backing) {
1191 ret = -EINVAL;
1192 error_setg(errp, "Driver doesn't support backing files");
1193 QDECREF(options);
1194 goto free_exit;
1195 }
1196
Markus Armbrustere4e99862014-10-07 13:59:03 +02001197 backing_hd = bdrv_new();
Fam Zheng8d24cce2014-05-23 21:29:45 +08001198
Kevin Wolfc5f6e492014-11-25 18:12:42 +01001199 if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1200 qdict_put(options, "driver", qstring_from_str(bs->backing_format));
Paolo Bonzini9156df12012-10-18 16:49:17 +02001201 }
1202
Kevin Wolf760e0062015-06-17 14:55:21 +02001203 assert(bs->backing == NULL);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001204 ret = bdrv_open_inherit(&backing_hd,
1205 *backing_filename ? backing_filename : NULL,
Max Reitzce343772015-08-26 19:47:50 +02001206 NULL, options, 0, bs, &child_backing, &local_err);
Paolo Bonzini9156df12012-10-18 16:49:17 +02001207 if (ret < 0) {
Fam Zheng8d24cce2014-05-23 21:29:45 +08001208 bdrv_unref(backing_hd);
1209 backing_hd = NULL;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001210 bs->open_flags |= BDRV_O_NO_BACKING;
Fam Zhengb04b6b62013-11-08 11:26:49 +08001211 error_setg(errp, "Could not open backing file: %s",
1212 error_get_pretty(local_err));
1213 error_free(local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001214 goto free_exit;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001215 }
Kevin Wolfdf581792015-06-15 11:53:47 +02001216
Fam Zheng8d24cce2014-05-23 21:29:45 +08001217 bdrv_set_backing_hd(bs, backing_hd);
Peter Feinerd80ac652014-01-08 19:43:25 +00001218
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001219free_exit:
1220 g_free(backing_filename);
1221 return ret;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001222}
1223
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001224/*
Max Reitzda557aa2013-12-20 19:28:11 +01001225 * Opens a disk image whose options are given as BlockdevRef in another block
1226 * device's options.
1227 *
Max Reitzda557aa2013-12-20 19:28:11 +01001228 * If allow_none is true, no image will be opened if filename is false and no
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001229 * BlockdevRef is given. NULL will be returned, but errp remains unset.
Max Reitzda557aa2013-12-20 19:28:11 +01001230 *
1231 * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1232 * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1233 * itself, all options starting with "${bdref_key}." are considered part of the
1234 * BlockdevRef.
1235 *
1236 * The BlockdevRef will be removed from the options QDict.
1237 */
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001238BdrvChild *bdrv_open_child(const char *filename,
1239 QDict *options, const char *bdref_key,
1240 BlockDriverState* parent,
1241 const BdrvChildRole *child_role,
1242 bool allow_none, Error **errp)
Max Reitzda557aa2013-12-20 19:28:11 +01001243{
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001244 BdrvChild *c = NULL;
1245 BlockDriverState *bs;
Max Reitzda557aa2013-12-20 19:28:11 +01001246 QDict *image_options;
1247 int ret;
1248 char *bdref_key_dot;
1249 const char *reference;
1250
Kevin Wolfdf581792015-06-15 11:53:47 +02001251 assert(child_role != NULL);
Max Reitzf67503e2014-02-18 18:33:05 +01001252
Max Reitzda557aa2013-12-20 19:28:11 +01001253 bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1254 qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1255 g_free(bdref_key_dot);
1256
1257 reference = qdict_get_try_str(options, bdref_key);
1258 if (!filename && !reference && !qdict_size(image_options)) {
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001259 if (!allow_none) {
Max Reitzda557aa2013-12-20 19:28:11 +01001260 error_setg(errp, "A block device must be specified for \"%s\"",
1261 bdref_key);
Max Reitzda557aa2013-12-20 19:28:11 +01001262 }
Markus Armbrusterb20e61e2014-05-28 11:16:57 +02001263 QDECREF(image_options);
Max Reitzda557aa2013-12-20 19:28:11 +01001264 goto done;
1265 }
1266
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001267 bs = NULL;
1268 ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
Max Reitzce343772015-08-26 19:47:50 +02001269 parent, child_role, errp);
Kevin Wolfdf581792015-06-15 11:53:47 +02001270 if (ret < 0) {
1271 goto done;
1272 }
1273
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001274 c = bdrv_attach_child(parent, bs, child_role);
Max Reitzda557aa2013-12-20 19:28:11 +01001275
1276done:
1277 qdict_del(options, bdref_key);
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001278 return c;
1279}
1280
Chen Gang6b8aeca2014-06-23 23:28:23 +08001281int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags, Error **errp)
Kevin Wolfb9988752014-04-03 12:09:34 +02001282{
1283 /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001284 char *tmp_filename = g_malloc0(PATH_MAX + 1);
Kevin Wolfb9988752014-04-03 12:09:34 +02001285 int64_t total_size;
Chunyan Liu83d05212014-06-05 17:20:51 +08001286 QemuOpts *opts = NULL;
Kevin Wolfb9988752014-04-03 12:09:34 +02001287 QDict *snapshot_options;
1288 BlockDriverState *bs_snapshot;
Fam Zhengc2e0dbb2015-07-06 12:24:44 +08001289 Error *local_err = NULL;
Kevin Wolfb9988752014-04-03 12:09:34 +02001290 int ret;
1291
1292 /* if snapshot, we create a temporary backing file and open it
1293 instead of opening 'filename' directly */
1294
1295 /* Get the required size from the image */
Kevin Wolff1877432014-04-04 17:07:19 +02001296 total_size = bdrv_getlength(bs);
1297 if (total_size < 0) {
Chen Gang6b8aeca2014-06-23 23:28:23 +08001298 ret = total_size;
Kevin Wolff1877432014-04-04 17:07:19 +02001299 error_setg_errno(errp, -total_size, "Could not get image size");
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001300 goto out;
Kevin Wolff1877432014-04-04 17:07:19 +02001301 }
Kevin Wolfb9988752014-04-03 12:09:34 +02001302
1303 /* Create the temporary image */
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001304 ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
Kevin Wolfb9988752014-04-03 12:09:34 +02001305 if (ret < 0) {
1306 error_setg_errno(errp, -ret, "Could not get temporary filename");
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001307 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001308 }
1309
Max Reitzef810432014-12-02 18:32:42 +01001310 opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
Chunyan Liuc282e1f2014-06-05 17:21:11 +08001311 &error_abort);
Markus Armbruster39101f22015-02-12 16:46:36 +01001312 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
Max Reitzef810432014-12-02 18:32:42 +01001313 ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, &local_err);
Chunyan Liu83d05212014-06-05 17:20:51 +08001314 qemu_opts_del(opts);
Kevin Wolfb9988752014-04-03 12:09:34 +02001315 if (ret < 0) {
1316 error_setg_errno(errp, -ret, "Could not create temporary overlay "
1317 "'%s': %s", tmp_filename,
1318 error_get_pretty(local_err));
1319 error_free(local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001320 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001321 }
1322
1323 /* Prepare a new options QDict for the temporary file */
1324 snapshot_options = qdict_new();
1325 qdict_put(snapshot_options, "file.driver",
1326 qstring_from_str("file"));
1327 qdict_put(snapshot_options, "file.filename",
1328 qstring_from_str(tmp_filename));
Max Reitze6641712015-08-26 19:47:48 +02001329 qdict_put(snapshot_options, "driver",
1330 qstring_from_str("qcow2"));
Kevin Wolfb9988752014-04-03 12:09:34 +02001331
Markus Armbrustere4e99862014-10-07 13:59:03 +02001332 bs_snapshot = bdrv_new();
Kevin Wolfb9988752014-04-03 12:09:34 +02001333
1334 ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02001335 flags, &local_err);
Kevin Wolfb9988752014-04-03 12:09:34 +02001336 if (ret < 0) {
1337 error_propagate(errp, local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001338 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001339 }
1340
1341 bdrv_append(bs_snapshot, bs);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001342
1343out:
1344 g_free(tmp_filename);
Chen Gang6b8aeca2014-06-23 23:28:23 +08001345 return ret;
Kevin Wolfb9988752014-04-03 12:09:34 +02001346}
1347
Max Reitzda557aa2013-12-20 19:28:11 +01001348/*
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001349 * Opens a disk image (raw, qcow2, vmdk, ...)
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001350 *
1351 * options is a QDict of options to pass to the block drivers, or NULL for an
1352 * empty set of options. The reference to the QDict belongs to the block layer
1353 * after the call (even on failure), so if the caller intends to reuse the
1354 * dictionary, it needs to use QINCREF() before calling bdrv_open.
Max Reitzf67503e2014-02-18 18:33:05 +01001355 *
1356 * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1357 * If it is not NULL, the referenced BDS will be reused.
Max Reitzddf56362014-02-18 18:33:06 +01001358 *
1359 * The reference parameter may be used to specify an existing block device which
1360 * should be opened. If specified, neither options nor a filename may be given,
1361 * nor can an existing BDS be reused (that is, *pbs has to be NULL).
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001362 */
Kevin Wolff3930ed2015-04-08 13:43:47 +02001363static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1364 const char *reference, QDict *options, int flags,
1365 BlockDriverState *parent,
Max Reitzce343772015-08-26 19:47:50 +02001366 const BdrvChildRole *child_role, Error **errp)
bellardea2384d2004-08-01 21:59:26 +00001367{
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001368 int ret;
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001369 BdrvChild *file = NULL;
1370 BlockDriverState *bs;
Max Reitzce343772015-08-26 19:47:50 +02001371 BlockDriver *drv = NULL;
Kevin Wolf74fe54f2013-07-09 11:09:02 +02001372 const char *drvname;
Max Reitz34b5d2c2013-09-05 14:45:29 +02001373 Error *local_err = NULL;
Kevin Wolfb1e6fc02014-05-06 12:11:42 +02001374 int snapshot_flags = 0;
bellard712e7872005-04-28 21:09:32 +00001375
Max Reitzf67503e2014-02-18 18:33:05 +01001376 assert(pbs);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001377 assert(!child_role || !flags);
1378 assert(!child_role == !parent);
Max Reitzf67503e2014-02-18 18:33:05 +01001379
Max Reitzddf56362014-02-18 18:33:06 +01001380 if (reference) {
1381 bool options_non_empty = options ? qdict_size(options) : false;
1382 QDECREF(options);
1383
1384 if (*pbs) {
1385 error_setg(errp, "Cannot reuse an existing BDS when referencing "
1386 "another block device");
1387 return -EINVAL;
1388 }
1389
1390 if (filename || options_non_empty) {
1391 error_setg(errp, "Cannot reference an existing block device with "
1392 "additional options or a new filename");
1393 return -EINVAL;
1394 }
1395
1396 bs = bdrv_lookup_bs(reference, reference, errp);
1397 if (!bs) {
1398 return -ENODEV;
1399 }
1400 bdrv_ref(bs);
1401 *pbs = bs;
1402 return 0;
1403 }
1404
Max Reitzf67503e2014-02-18 18:33:05 +01001405 if (*pbs) {
1406 bs = *pbs;
1407 } else {
Markus Armbrustere4e99862014-10-07 13:59:03 +02001408 bs = bdrv_new();
Max Reitzf67503e2014-02-18 18:33:05 +01001409 }
1410
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001411 /* NULL means an empty set of options */
1412 if (options == NULL) {
1413 options = qdict_new();
1414 }
1415
Kevin Wolff3930ed2015-04-08 13:43:47 +02001416 if (child_role) {
Kevin Wolfbddcec32015-04-09 18:47:50 +02001417 bs->inherits_from = parent;
Kevin Wolff3930ed2015-04-08 13:43:47 +02001418 flags = child_role->inherit_flags(parent->open_flags);
1419 }
1420
Max Reitz053e1572015-08-26 19:47:51 +02001421 ret = bdrv_fill_options(&options, &filename, &flags, &local_err);
Kevin Wolf462f5bc2014-05-26 11:39:55 +02001422 if (local_err) {
1423 goto fail;
1424 }
1425
Kevin Wolf76c591b2014-06-04 14:19:44 +02001426 /* Find the right image format driver */
Kevin Wolf76c591b2014-06-04 14:19:44 +02001427 drvname = qdict_get_try_str(options, "driver");
1428 if (drvname) {
1429 drv = bdrv_find_format(drvname);
1430 qdict_del(options, "driver");
1431 if (!drv) {
1432 error_setg(errp, "Unknown driver: '%s'", drvname);
1433 ret = -EINVAL;
1434 goto fail;
1435 }
1436 }
1437
1438 assert(drvname || !(flags & BDRV_O_PROTOCOL));
Kevin Wolf76c591b2014-06-04 14:19:44 +02001439
Kevin Wolff3930ed2015-04-08 13:43:47 +02001440 bs->open_flags = flags;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001441 bs->options = options;
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001442 options = qdict_clone_shallow(options);
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001443
Kevin Wolff4788ad2014-06-03 16:44:19 +02001444 /* Open image file without format layer */
1445 if ((flags & BDRV_O_PROTOCOL) == 0) {
1446 if (flags & BDRV_O_RDWR) {
1447 flags |= BDRV_O_ALLOW_RDWR;
1448 }
1449 if (flags & BDRV_O_SNAPSHOT) {
1450 snapshot_flags = bdrv_temp_snapshot_flags(flags);
1451 flags = bdrv_backing_flags(flags);
1452 }
1453
Kevin Wolff3930ed2015-04-08 13:43:47 +02001454 bs->open_flags = flags;
Kevin Wolf1fdd6932015-06-15 14:11:51 +02001455
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001456 file = bdrv_open_child(filename, options, "file", bs,
1457 &child_file, true, &local_err);
Kevin Wolf1fdd6932015-06-15 14:11:51 +02001458 if (local_err) {
1459 ret = -EINVAL;
Max Reitz5469a2a2014-02-18 18:33:10 +01001460 goto fail;
1461 }
1462 }
1463
Kevin Wolf76c591b2014-06-04 14:19:44 +02001464 /* Image format probing */
Kevin Wolf38f3ef52014-11-20 16:27:12 +01001465 bs->probed = !drv;
Kevin Wolf76c591b2014-06-04 14:19:44 +02001466 if (!drv && file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001467 ret = find_image_format(file->bs, filename, &drv, &local_err);
Kevin Wolf17b005f2014-05-27 10:50:29 +02001468 if (ret < 0) {
Kevin Wolf8bfea152014-04-11 19:16:36 +02001469 goto fail;
Max Reitz2a05cbe2013-12-20 19:28:10 +01001470 }
Kevin Wolf76c591b2014-06-04 14:19:44 +02001471 } else if (!drv) {
Kevin Wolf17b005f2014-05-27 10:50:29 +02001472 error_setg(errp, "Must specify either driver or file");
1473 ret = -EINVAL;
Kevin Wolf8bfea152014-04-11 19:16:36 +02001474 goto fail;
Kevin Wolff500a6d2012-11-12 17:35:27 +01001475 }
1476
Max Reitz53a29512015-03-19 14:53:16 -04001477 /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
1478 assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
1479 /* file must be NULL if a protocol BDS is about to be created
1480 * (the inverse results in an error message from bdrv_open_common()) */
1481 assert(!(flags & BDRV_O_PROTOCOL) || !file);
1482
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001483 /* Open the image */
Max Reitz34b5d2c2013-09-05 14:45:29 +02001484 ret = bdrv_open_common(bs, file, options, flags, drv, &local_err);
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001485 if (ret < 0) {
Kevin Wolf8bfea152014-04-11 19:16:36 +02001486 goto fail;
Christoph Hellwig69873072010-01-20 18:13:25 +01001487 }
1488
Max Reitz2a05cbe2013-12-20 19:28:10 +01001489 if (file && (bs->file != file)) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001490 bdrv_unref_child(bs, file);
Kevin Wolff500a6d2012-11-12 17:35:27 +01001491 file = NULL;
1492 }
1493
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001494 /* If there is a backing file, use it */
Paolo Bonzini9156df12012-10-18 16:49:17 +02001495 if ((flags & BDRV_O_NO_BACKING) == 0) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001496 QDict *backing_options;
1497
Benoît Canet5726d872013-09-25 13:30:01 +02001498 qdict_extract_subqdict(options, &backing_options, "backing.");
Max Reitz34b5d2c2013-09-05 14:45:29 +02001499 ret = bdrv_open_backing_file(bs, backing_options, &local_err);
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001500 if (ret < 0) {
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001501 goto close_and_fail;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001502 }
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001503 }
1504
Max Reitz91af7012014-07-18 20:24:56 +02001505 bdrv_refresh_filename(bs);
1506
Kevin Wolfb9988752014-04-03 12:09:34 +02001507 /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1508 * temporary snapshot afterwards. */
Kevin Wolfb1e6fc02014-05-06 12:11:42 +02001509 if (snapshot_flags) {
Chen Gang6b8aeca2014-06-23 23:28:23 +08001510 ret = bdrv_append_temp_snapshot(bs, snapshot_flags, &local_err);
Kevin Wolfb9988752014-04-03 12:09:34 +02001511 if (local_err) {
Kevin Wolfb9988752014-04-03 12:09:34 +02001512 goto close_and_fail;
1513 }
1514 }
1515
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001516 /* Check if any unknown options were used */
Max Reitz5acd9d82014-02-18 18:33:11 +01001517 if (options && (qdict_size(options) != 0)) {
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001518 const QDictEntry *entry = qdict_first(options);
Max Reitz5acd9d82014-02-18 18:33:11 +01001519 if (flags & BDRV_O_PROTOCOL) {
1520 error_setg(errp, "Block protocol '%s' doesn't support the option "
1521 "'%s'", drv->format_name, entry->key);
1522 } else {
1523 error_setg(errp, "Block format '%s' used by device '%s' doesn't "
1524 "support the option '%s'", drv->format_name,
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02001525 bdrv_get_device_name(bs), entry->key);
Max Reitz5acd9d82014-02-18 18:33:11 +01001526 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001527
1528 ret = -EINVAL;
1529 goto close_and_fail;
1530 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001531
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001532 if (!bdrv_key_required(bs)) {
Markus Armbrustera7f53e22014-10-07 13:59:25 +02001533 if (bs->blk) {
1534 blk_dev_change_media_cb(bs->blk, true);
1535 }
Markus Armbrusterc3adb582014-03-14 09:22:48 +01001536 } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1537 && !runstate_check(RUN_STATE_INMIGRATE)
1538 && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1539 error_setg(errp,
1540 "Guest must be stopped for opening of encrypted image");
1541 ret = -EBUSY;
1542 goto close_and_fail;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001543 }
1544
Markus Armbrusterc3adb582014-03-14 09:22:48 +01001545 QDECREF(options);
Max Reitzf67503e2014-02-18 18:33:05 +01001546 *pbs = bs;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001547 return 0;
1548
Kevin Wolf8bfea152014-04-11 19:16:36 +02001549fail:
Kevin Wolff500a6d2012-11-12 17:35:27 +01001550 if (file != NULL) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001551 bdrv_unref_child(bs, file);
Kevin Wolff500a6d2012-11-12 17:35:27 +01001552 }
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001553 QDECREF(bs->options);
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001554 QDECREF(options);
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001555 bs->options = NULL;
Max Reitzf67503e2014-02-18 18:33:05 +01001556 if (!*pbs) {
1557 /* If *pbs is NULL, a new BDS has been created in this function and
1558 needs to be freed now. Otherwise, it does not need to be closed,
1559 since it has not really been opened yet. */
1560 bdrv_unref(bs);
1561 }
Markus Armbruster84d18f02014-01-30 15:07:28 +01001562 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +02001563 error_propagate(errp, local_err);
1564 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001565 return ret;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001566
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001567close_and_fail:
Max Reitzf67503e2014-02-18 18:33:05 +01001568 /* See fail path, but now the BDS has to be always closed */
1569 if (*pbs) {
1570 bdrv_close(bs);
1571 } else {
1572 bdrv_unref(bs);
1573 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001574 QDECREF(options);
Markus Armbruster84d18f02014-01-30 15:07:28 +01001575 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +02001576 error_propagate(errp, local_err);
1577 }
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001578 return ret;
1579}
1580
Kevin Wolff3930ed2015-04-08 13:43:47 +02001581int bdrv_open(BlockDriverState **pbs, const char *filename,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02001582 const char *reference, QDict *options, int flags, Error **errp)
Kevin Wolff3930ed2015-04-08 13:43:47 +02001583{
1584 return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
Max Reitzce343772015-08-26 19:47:50 +02001585 NULL, errp);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001586}
1587
Jeff Codye971aa12012-09-20 15:13:19 -04001588typedef struct BlockReopenQueueEntry {
1589 bool prepared;
1590 BDRVReopenState state;
1591 QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
1592} BlockReopenQueueEntry;
1593
1594/*
1595 * Adds a BlockDriverState to a simple queue for an atomic, transactional
1596 * reopen of multiple devices.
1597 *
1598 * bs_queue can either be an existing BlockReopenQueue that has had QSIMPLE_INIT
1599 * already performed, or alternatively may be NULL a new BlockReopenQueue will
1600 * be created and initialized. This newly created BlockReopenQueue should be
1601 * passed back in for subsequent calls that are intended to be of the same
1602 * atomic 'set'.
1603 *
1604 * bs is the BlockDriverState to add to the reopen queue.
1605 *
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001606 * options contains the changed options for the associated bs
1607 * (the BlockReopenQueue takes ownership)
1608 *
Jeff Codye971aa12012-09-20 15:13:19 -04001609 * flags contains the open flags for the associated bs
1610 *
1611 * returns a pointer to bs_queue, which is either the newly allocated
1612 * bs_queue, or the existing bs_queue being used.
1613 *
1614 */
1615BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001616 BlockDriverState *bs,
1617 QDict *options, int flags)
Jeff Codye971aa12012-09-20 15:13:19 -04001618{
1619 assert(bs != NULL);
1620
1621 BlockReopenQueueEntry *bs_entry;
Kevin Wolf67251a32015-04-09 18:54:04 +02001622 BdrvChild *child;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001623 QDict *old_options;
Kevin Wolf67251a32015-04-09 18:54:04 +02001624
Jeff Codye971aa12012-09-20 15:13:19 -04001625 if (bs_queue == NULL) {
1626 bs_queue = g_new0(BlockReopenQueue, 1);
1627 QSIMPLEQ_INIT(bs_queue);
1628 }
1629
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001630 if (!options) {
1631 options = qdict_new();
1632 }
1633
1634 old_options = qdict_clone_shallow(bs->options);
1635 qdict_join(options, old_options, false);
1636 QDECREF(old_options);
1637
Kevin Wolff1f25a22014-04-25 19:04:55 +02001638 /* bdrv_open() masks this flag out */
1639 flags &= ~BDRV_O_PROTOCOL;
1640
Kevin Wolf67251a32015-04-09 18:54:04 +02001641 QLIST_FOREACH(child, &bs->children, next) {
1642 int child_flags;
1643
1644 if (child->bs->inherits_from != bs) {
1645 continue;
1646 }
1647
1648 child_flags = child->role->inherit_flags(flags);
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001649 /* TODO Pass down child flags (backing.*, extents.*, ...) */
1650 bdrv_reopen_queue(bs_queue, child->bs, NULL, child_flags);
Jeff Codye971aa12012-09-20 15:13:19 -04001651 }
1652
1653 bs_entry = g_new0(BlockReopenQueueEntry, 1);
1654 QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1655
1656 bs_entry->state.bs = bs;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001657 bs_entry->state.options = options;
Jeff Codye971aa12012-09-20 15:13:19 -04001658 bs_entry->state.flags = flags;
1659
1660 return bs_queue;
1661}
1662
1663/*
1664 * Reopen multiple BlockDriverStates atomically & transactionally.
1665 *
1666 * The queue passed in (bs_queue) must have been built up previous
1667 * via bdrv_reopen_queue().
1668 *
1669 * Reopens all BDS specified in the queue, with the appropriate
1670 * flags. All devices are prepared for reopen, and failure of any
1671 * device will cause all device changes to be abandonded, and intermediate
1672 * data cleaned up.
1673 *
1674 * If all devices prepare successfully, then the changes are committed
1675 * to all devices.
1676 *
1677 */
1678int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1679{
1680 int ret = -1;
1681 BlockReopenQueueEntry *bs_entry, *next;
1682 Error *local_err = NULL;
1683
1684 assert(bs_queue != NULL);
1685
1686 bdrv_drain_all();
1687
1688 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1689 if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1690 error_propagate(errp, local_err);
1691 goto cleanup;
1692 }
1693 bs_entry->prepared = true;
1694 }
1695
1696 /* If we reach this point, we have success and just need to apply the
1697 * changes
1698 */
1699 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1700 bdrv_reopen_commit(&bs_entry->state);
1701 }
1702
1703 ret = 0;
1704
1705cleanup:
1706 QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1707 if (ret && bs_entry->prepared) {
1708 bdrv_reopen_abort(&bs_entry->state);
1709 }
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001710 QDECREF(bs_entry->state.options);
Jeff Codye971aa12012-09-20 15:13:19 -04001711 g_free(bs_entry);
1712 }
1713 g_free(bs_queue);
1714 return ret;
1715}
1716
1717
1718/* Reopen a single BlockDriverState with the specified flags. */
1719int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1720{
1721 int ret = -1;
1722 Error *local_err = NULL;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001723 BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
Jeff Codye971aa12012-09-20 15:13:19 -04001724
1725 ret = bdrv_reopen_multiple(queue, &local_err);
1726 if (local_err != NULL) {
1727 error_propagate(errp, local_err);
1728 }
1729 return ret;
1730}
1731
1732
1733/*
1734 * Prepares a BlockDriverState for reopen. All changes are staged in the
1735 * 'opaque' field of the BDRVReopenState, which is used and allocated by
1736 * the block driver layer .bdrv_reopen_prepare()
1737 *
1738 * bs is the BlockDriverState to reopen
1739 * flags are the new open flags
1740 * queue is the reopen queue
1741 *
1742 * Returns 0 on success, non-zero on error. On error errp will be set
1743 * as well.
1744 *
1745 * On failure, bdrv_reopen_abort() will be called to clean up any data.
1746 * It is the responsibility of the caller to then call the abort() or
1747 * commit() for any other BDS that have been left in a prepare() state
1748 *
1749 */
1750int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1751 Error **errp)
1752{
1753 int ret = -1;
1754 Error *local_err = NULL;
1755 BlockDriver *drv;
1756
1757 assert(reopen_state != NULL);
1758 assert(reopen_state->bs->drv != NULL);
1759 drv = reopen_state->bs->drv;
1760
1761 /* if we are to stay read-only, do not allow permission change
1762 * to r/w */
1763 if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
1764 reopen_state->flags & BDRV_O_RDWR) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03001765 error_setg(errp, "Node '%s' is read only",
1766 bdrv_get_device_or_node_name(reopen_state->bs));
Jeff Codye971aa12012-09-20 15:13:19 -04001767 goto error;
1768 }
1769
1770
1771 ret = bdrv_flush(reopen_state->bs);
1772 if (ret) {
1773 error_set(errp, ERROR_CLASS_GENERIC_ERROR, "Error (%s) flushing drive",
1774 strerror(-ret));
1775 goto error;
1776 }
1777
1778 if (drv->bdrv_reopen_prepare) {
1779 ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
1780 if (ret) {
1781 if (local_err != NULL) {
1782 error_propagate(errp, local_err);
1783 } else {
Luiz Capitulinod8b68952013-06-10 11:29:27 -04001784 error_setg(errp, "failed while preparing to reopen image '%s'",
1785 reopen_state->bs->filename);
Jeff Codye971aa12012-09-20 15:13:19 -04001786 }
1787 goto error;
1788 }
1789 } else {
1790 /* It is currently mandatory to have a bdrv_reopen_prepare()
1791 * handler for each supported drv. */
Alberto Garcia81e5f782015-04-08 12:29:19 +03001792 error_setg(errp, "Block format '%s' used by node '%s' "
1793 "does not support reopening files", drv->format_name,
1794 bdrv_get_device_or_node_name(reopen_state->bs));
Jeff Codye971aa12012-09-20 15:13:19 -04001795 ret = -1;
1796 goto error;
1797 }
1798
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001799 /* Options that are not handled are only okay if they are unchanged
1800 * compared to the old state. It is expected that some options are only
1801 * used for the initial open, but not reopen (e.g. filename) */
1802 if (qdict_size(reopen_state->options)) {
1803 const QDictEntry *entry = qdict_first(reopen_state->options);
1804
1805 do {
1806 QString *new_obj = qobject_to_qstring(entry->value);
1807 const char *new = qstring_get_str(new_obj);
1808 const char *old = qdict_get_try_str(reopen_state->bs->options,
1809 entry->key);
1810
1811 if (!old || strcmp(new, old)) {
1812 error_setg(errp, "Cannot change the option '%s'", entry->key);
1813 ret = -EINVAL;
1814 goto error;
1815 }
1816 } while ((entry = qdict_next(reopen_state->options, entry)));
1817 }
1818
Jeff Codye971aa12012-09-20 15:13:19 -04001819 ret = 0;
1820
1821error:
1822 return ret;
1823}
1824
1825/*
1826 * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
1827 * makes them final by swapping the staging BlockDriverState contents into
1828 * the active BlockDriverState contents.
1829 */
1830void bdrv_reopen_commit(BDRVReopenState *reopen_state)
1831{
1832 BlockDriver *drv;
1833
1834 assert(reopen_state != NULL);
1835 drv = reopen_state->bs->drv;
1836 assert(drv != NULL);
1837
1838 /* If there are any driver level actions to take */
1839 if (drv->bdrv_reopen_commit) {
1840 drv->bdrv_reopen_commit(reopen_state);
1841 }
1842
1843 /* set BDS specific flags now */
1844 reopen_state->bs->open_flags = reopen_state->flags;
1845 reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
1846 BDRV_O_CACHE_WB);
1847 reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
Kevin Wolf355ef4a2013-12-11 20:14:09 +01001848
Kevin Wolf3baca892014-07-16 17:48:16 +02001849 bdrv_refresh_limits(reopen_state->bs, NULL);
Jeff Codye971aa12012-09-20 15:13:19 -04001850}
1851
1852/*
1853 * Abort the reopen, and delete and free the staged changes in
1854 * reopen_state
1855 */
1856void bdrv_reopen_abort(BDRVReopenState *reopen_state)
1857{
1858 BlockDriver *drv;
1859
1860 assert(reopen_state != NULL);
1861 drv = reopen_state->bs->drv;
1862 assert(drv != NULL);
1863
1864 if (drv->bdrv_reopen_abort) {
1865 drv->bdrv_reopen_abort(reopen_state);
1866 }
1867}
1868
1869
bellardfc01f7e2003-06-30 10:03:06 +00001870void bdrv_close(BlockDriverState *bs)
1871{
Max Reitz33384422014-06-20 21:57:33 +02001872 BdrvAioNotifier *ban, *ban_next;
1873
Paolo Bonzini3cbc0022012-10-19 11:36:48 +02001874 if (bs->job) {
1875 block_job_cancel_sync(bs->job);
1876 }
Alberto Garcia99b7e772015-09-25 16:41:44 +03001877
1878 /* Disable I/O limits and drain all pending throttled requests */
1879 if (bs->io_limits_enabled) {
1880 bdrv_io_limits_disable(bs);
1881 }
1882
Fam Zheng53ec73e2015-05-29 18:53:14 +08001883 bdrv_drain(bs); /* complete I/O */
Stefan Hajnoczi58fda172013-07-02 15:36:25 +02001884 bdrv_flush(bs);
Fam Zheng53ec73e2015-05-29 18:53:14 +08001885 bdrv_drain(bs); /* in case flush left pending I/O */
Paolo Bonzinid7d512f2012-08-23 11:20:36 +02001886 notifier_list_notify(&bs->close_notifiers, bs);
Kevin Wolf7094f122012-04-11 11:06:37 +02001887
Paolo Bonzini3cbc0022012-10-19 11:36:48 +02001888 if (bs->drv) {
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001889 BdrvChild *child, *next;
1890
Kevin Wolf9a7dedb2015-06-16 10:58:20 +02001891 bs->drv->bdrv_close(bs);
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001892 bs->drv = NULL;
Kevin Wolf9a7dedb2015-06-16 10:58:20 +02001893
Kevin Wolf760e0062015-06-17 14:55:21 +02001894 if (bs->backing) {
1895 BlockDriverState *backing_hd = bs->backing->bs;
Kevin Wolf9a7dedb2015-06-16 10:58:20 +02001896 bdrv_set_backing_hd(bs, NULL);
1897 bdrv_unref(backing_hd);
1898 }
1899
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001900 if (bs->file != NULL) {
1901 bdrv_unref_child(bs, bs->file);
1902 bs->file = NULL;
1903 }
1904
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001905 QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
Kevin Wolf33a60402015-06-15 13:51:04 +02001906 /* TODO Remove bdrv_unref() from drivers' close function and use
1907 * bdrv_unref_child() here */
Kevin Wolfbddcec32015-04-09 18:47:50 +02001908 if (child->bs->inherits_from == bs) {
1909 child->bs->inherits_from = NULL;
1910 }
Kevin Wolf33a60402015-06-15 13:51:04 +02001911 bdrv_detach_child(child);
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001912 }
1913
Anthony Liguori7267c092011-08-20 22:09:37 -05001914 g_free(bs->opaque);
bellardea2384d2004-08-01 21:59:26 +00001915 bs->opaque = NULL;
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +00001916 bs->copy_on_read = 0;
Paolo Bonzinia275fa42012-05-08 16:51:43 +02001917 bs->backing_file[0] = '\0';
1918 bs->backing_format[0] = '\0';
Paolo Bonzini64058752012-05-08 16:51:49 +02001919 bs->total_sectors = 0;
1920 bs->encrypted = 0;
1921 bs->valid_key = 0;
1922 bs->sg = 0;
Asias He0d51b4d2013-08-22 15:24:14 +08001923 bs->zero_beyond_eof = false;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001924 QDECREF(bs->options);
1925 bs->options = NULL;
Max Reitz91af7012014-07-18 20:24:56 +02001926 QDECREF(bs->full_open_options);
1927 bs->full_open_options = NULL;
bellardb3380822004-03-14 21:38:54 +00001928 }
Zhi Yong Wu98f90db2011-11-08 13:00:14 +08001929
Markus Armbrustera7f53e22014-10-07 13:59:25 +02001930 if (bs->blk) {
1931 blk_dev_change_media_cb(bs->blk, false);
1932 }
Pavel Hrdina9ca11152012-08-09 12:44:48 +02001933
Max Reitz33384422014-06-20 21:57:33 +02001934 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
1935 g_free(ban);
1936 }
1937 QLIST_INIT(&bs->aio_notifiers);
bellardb3380822004-03-14 21:38:54 +00001938}
1939
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001940void bdrv_close_all(void)
1941{
1942 BlockDriverState *bs;
1943
Benoît Canetdc364f42014-01-23 21:31:32 +01001944 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02001945 AioContext *aio_context = bdrv_get_aio_context(bs);
1946
1947 aio_context_acquire(aio_context);
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001948 bdrv_close(bs);
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02001949 aio_context_release(aio_context);
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001950 }
1951}
1952
Benoît Canetdc364f42014-01-23 21:31:32 +01001953/* make a BlockDriverState anonymous by removing from bdrv_state and
1954 * graph_bdrv_state list.
Ryan Harperd22b2f42011-03-29 20:51:47 -05001955 Also, NULL terminate the device_name to prevent double remove */
1956void bdrv_make_anon(BlockDriverState *bs)
1957{
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02001958 /*
1959 * Take care to remove bs from bdrv_states only when it's actually
1960 * in it. Note that bs->device_list.tqe_prev is initially null,
1961 * and gets set to non-null by QTAILQ_INSERT_TAIL(). Establish
1962 * the useful invariant "bs in bdrv_states iff bs->tqe_prev" by
1963 * resetting it to null on remove.
1964 */
1965 if (bs->device_list.tqe_prev) {
Benoît Canetdc364f42014-01-23 21:31:32 +01001966 QTAILQ_REMOVE(&bdrv_states, bs, device_list);
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02001967 bs->device_list.tqe_prev = NULL;
Ryan Harperd22b2f42011-03-29 20:51:47 -05001968 }
Benoît Canetdc364f42014-01-23 21:31:32 +01001969 if (bs->node_name[0] != '\0') {
1970 QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
1971 }
1972 bs->node_name[0] = '\0';
Ryan Harperd22b2f42011-03-29 20:51:47 -05001973}
1974
Paolo Bonzinie023b2e2012-05-08 16:51:41 +02001975static void bdrv_rebind(BlockDriverState *bs)
1976{
1977 if (bs->drv && bs->drv->bdrv_rebind) {
1978 bs->drv->bdrv_rebind(bs);
1979 }
1980}
1981
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02001982static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
1983 BlockDriverState *bs_src)
1984{
1985 /* move some fields that need to stay attached to the device */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02001986
1987 /* dev info */
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01001988 bs_dest->guest_block_size = bs_src->guest_block_size;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02001989 bs_dest->copy_on_read = bs_src->copy_on_read;
1990
1991 bs_dest->enable_write_cache = bs_src->enable_write_cache;
1992
Benoît Canetcc0681c2013-09-02 14:14:39 +02001993 /* i/o throttled req */
Alberto Garcia76f4afb2015-06-08 18:17:44 +02001994 bs_dest->throttle_state = bs_src->throttle_state,
1995 bs_dest->io_limits_enabled = bs_src->io_limits_enabled;
1996 bs_dest->pending_reqs[0] = bs_src->pending_reqs[0];
1997 bs_dest->pending_reqs[1] = bs_src->pending_reqs[1];
1998 bs_dest->throttled_reqs[0] = bs_src->throttled_reqs[0];
1999 bs_dest->throttled_reqs[1] = bs_src->throttled_reqs[1];
2000 memcpy(&bs_dest->round_robin,
2001 &bs_src->round_robin,
2002 sizeof(bs_dest->round_robin));
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002003 memcpy(&bs_dest->throttle_timers,
2004 &bs_src->throttle_timers,
2005 sizeof(ThrottleTimers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002006
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002007 /* r/w error */
2008 bs_dest->on_read_error = bs_src->on_read_error;
2009 bs_dest->on_write_error = bs_src->on_write_error;
2010
2011 /* i/o status */
2012 bs_dest->iostatus_enabled = bs_src->iostatus_enabled;
2013 bs_dest->iostatus = bs_src->iostatus;
2014
2015 /* dirty bitmap */
Fam Zhenge4654d22013-11-13 18:29:43 +08002016 bs_dest->dirty_bitmaps = bs_src->dirty_bitmaps;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002017
Fam Zheng9fcb0252013-08-23 09:14:46 +08002018 /* reference count */
2019 bs_dest->refcnt = bs_src->refcnt;
2020
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002021 /* job */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002022 bs_dest->job = bs_src->job;
2023
2024 /* keep the same entry in bdrv_states */
Benoît Canetdc364f42014-01-23 21:31:32 +01002025 bs_dest->device_list = bs_src->device_list;
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002026 bs_dest->blk = bs_src->blk;
2027
Fam Zhengfbe40ff2014-05-23 21:29:42 +08002028 memcpy(bs_dest->op_blockers, bs_src->op_blockers,
2029 sizeof(bs_dest->op_blockers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002030}
2031
2032/*
2033 * Swap bs contents for two image chains while they are live,
2034 * while keeping required fields on the BlockDriverState that is
2035 * actually attached to a device.
2036 *
2037 * This will modify the BlockDriverState fields, and swap contents
2038 * between bs_new and bs_old. Both bs_new and bs_old are modified.
2039 *
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002040 * bs_new must not be attached to a BlockBackend.
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002041 *
2042 * This function does not create any image files.
2043 */
2044void bdrv_swap(BlockDriverState *bs_new, BlockDriverState *bs_old)
2045{
2046 BlockDriverState tmp;
Kevin Wolfbddcec32015-04-09 18:47:50 +02002047 BdrvChild *child;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002048
Kevin Wolf6ee4ce12015-06-10 13:33:17 +02002049 bdrv_drain(bs_new);
2050 bdrv_drain(bs_old);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002051
Benoît Canet90ce8a02014-03-05 23:48:29 +01002052 /* The code needs to swap the node_name but simply swapping node_list won't
2053 * work so first remove the nodes from the graph list, do the swap then
2054 * insert them back if needed.
2055 */
2056 if (bs_new->node_name[0] != '\0') {
2057 QTAILQ_REMOVE(&graph_bdrv_states, bs_new, node_list);
2058 }
2059 if (bs_old->node_name[0] != '\0') {
2060 QTAILQ_REMOVE(&graph_bdrv_states, bs_old, node_list);
2061 }
2062
Alberto Garciadb628332015-06-08 18:17:45 +02002063 /* If the BlockDriverState is part of a throttling group acquire
2064 * its lock since we're going to mess with the protected fields.
2065 * Otherwise there's no need to worry since no one else can touch
2066 * them. */
2067 if (bs_old->throttle_state) {
2068 throttle_group_lock(bs_old);
2069 }
2070
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002071 /* bs_new must be unattached and shouldn't have anything fancy enabled */
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002072 assert(!bs_new->blk);
Fam Zhenge4654d22013-11-13 18:29:43 +08002073 assert(QLIST_EMPTY(&bs_new->dirty_bitmaps));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002074 assert(bs_new->job == NULL);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002075 assert(bs_new->io_limits_enabled == false);
Alberto Garciadb628332015-06-08 18:17:45 +02002076 assert(bs_new->throttle_state == NULL);
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002077 assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002078
2079 tmp = *bs_new;
2080 *bs_new = *bs_old;
2081 *bs_old = tmp;
2082
2083 /* there are some fields that should not be swapped, move them back */
2084 bdrv_move_feature_fields(&tmp, bs_old);
2085 bdrv_move_feature_fields(bs_old, bs_new);
2086 bdrv_move_feature_fields(bs_new, &tmp);
2087
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002088 /* bs_new must remain unattached */
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002089 assert(!bs_new->blk);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002090
2091 /* Check a few fields that should remain attached to the device */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002092 assert(bs_new->job == NULL);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002093 assert(bs_new->io_limits_enabled == false);
Alberto Garciadb628332015-06-08 18:17:45 +02002094 assert(bs_new->throttle_state == NULL);
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002095 assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002096
Alberto Garciadb628332015-06-08 18:17:45 +02002097 /* Release the ThrottleGroup lock */
2098 if (bs_old->throttle_state) {
2099 throttle_group_unlock(bs_old);
2100 }
2101
Benoît Canet90ce8a02014-03-05 23:48:29 +01002102 /* insert the nodes back into the graph node list if needed */
2103 if (bs_new->node_name[0] != '\0') {
2104 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_new, node_list);
2105 }
2106 if (bs_old->node_name[0] != '\0') {
2107 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_old, node_list);
2108 }
2109
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02002110 /*
2111 * Update lh_first.le_prev for non-empty lists.
2112 *
2113 * The head of the op blocker list doesn't change because it is moved back
2114 * in bdrv_move_feature_fields().
2115 */
Kevin Wolf6ee4ce12015-06-10 13:33:17 +02002116 assert(QLIST_EMPTY(&bs_old->tracked_requests));
2117 assert(QLIST_EMPTY(&bs_new->tracked_requests));
2118
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02002119 QLIST_FIX_HEAD_PTR(&bs_new->children, next);
2120 QLIST_FIX_HEAD_PTR(&bs_old->children, next);
2121
Kevin Wolfbddcec32015-04-09 18:47:50 +02002122 /* Update references in bs->opaque and children */
2123 QLIST_FOREACH(child, &bs_old->children, next) {
2124 if (child->bs->inherits_from == bs_new) {
2125 child->bs->inherits_from = bs_old;
2126 }
2127 }
2128 QLIST_FOREACH(child, &bs_new->children, next) {
2129 if (child->bs->inherits_from == bs_old) {
2130 child->bs->inherits_from = bs_new;
2131 }
2132 }
2133
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002134 bdrv_rebind(bs_new);
2135 bdrv_rebind(bs_old);
2136}
2137
Jeff Cody8802d1f2012-02-28 15:54:06 -05002138/*
2139 * Add new bs contents at the top of an image chain while the chain is
2140 * live, while keeping required fields on the top layer.
2141 *
2142 * This will modify the BlockDriverState fields, and swap contents
2143 * between bs_new and bs_top. Both bs_new and bs_top are modified.
2144 *
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002145 * bs_new must not be attached to a BlockBackend.
Jeff Codyf6801b82012-03-27 16:30:19 -04002146 *
Jeff Cody8802d1f2012-02-28 15:54:06 -05002147 * This function does not create any image files.
2148 */
2149void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
2150{
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002151 bdrv_swap(bs_new, bs_top);
Jeff Cody8802d1f2012-02-28 15:54:06 -05002152
2153 /* The contents of 'tmp' will become bs_top, as we are
2154 * swapping bs_new and bs_top contents. */
Fam Zheng8d24cce2014-05-23 21:29:45 +08002155 bdrv_set_backing_hd(bs_top, bs_new);
Jeff Cody8802d1f2012-02-28 15:54:06 -05002156}
2157
/*
 * Close and free @bs.
 *
 * The caller must guarantee that @bs has no job, no operation blockers,
 * a reference count of zero and no dirty bitmaps; each of these is
 * asserted before anything is torn down.
 */
static void bdrv_delete(BlockDriverState *bs)
{
    assert(!bs->job);
    assert(bdrv_op_blocker_is_empty(bs));
    assert(!bs->refcnt);
    assert(QLIST_EMPTY(&bs->dirty_bitmaps));

    bdrv_close(bs);

    /* remove from list, if necessary */
    bdrv_make_anon(bs);

    g_free(bs);
}
2172
aliguorie97fc192009-04-21 23:11:50 +00002173/*
2174 * Run consistency checks on an image
2175 *
Kevin Wolfe076f332010-06-29 11:43:13 +02002176 * Returns 0 if the check could be completed (it doesn't mean that the image is
Stefan Weila1c72732011-04-28 17:20:38 +02002177 * free of errors) or -errno when an internal error occurred. The results of the
Kevin Wolfe076f332010-06-29 11:43:13 +02002178 * check are stored in res.
aliguorie97fc192009-04-21 23:11:50 +00002179 */
Kevin Wolf4534ff52012-05-11 16:07:02 +02002180int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
aliguorie97fc192009-04-21 23:11:50 +00002181{
Max Reitz908bcd52014-08-07 22:47:55 +02002182 if (bs->drv == NULL) {
2183 return -ENOMEDIUM;
2184 }
aliguorie97fc192009-04-21 23:11:50 +00002185 if (bs->drv->bdrv_check == NULL) {
2186 return -ENOTSUP;
2187 }
2188
Kevin Wolfe076f332010-06-29 11:43:13 +02002189 memset(res, 0, sizeof(*res));
Kevin Wolf4534ff52012-05-11 16:07:02 +02002190 return bs->drv->bdrv_check(bs, res, fix);
aliguorie97fc192009-04-21 23:11:50 +00002191}
2192
/* Upper bound, in sectors, on how much data is copied per loop iteration */
#define COMMIT_BUF_SECTORS 2048

/*
 * commit COW file into the raw image
 *
 * Copies every range of @bs that bdrv_is_allocated() reports as allocated
 * into the backing image, growing the backing image first if @bs is larger.
 * If the backing image is read-only it is reopened read-write for the
 * duration of the copy and reopened without BDRV_O_RDWR on the way out.
 * When the driver provides bdrv_make_empty, @bs is emptied afterwards.
 *
 * Returns 0 on success, -ENOMEDIUM if @bs has no driver, -ENOTSUP if it has
 * no backing file, -EBUSY if the commit is blocked on either image, -EACCES
 * if the backing image cannot be reopened read-write, -ENOMEM if the bounce
 * buffer cannot be allocated, or the negative value returned by the failing
 * helper.
 */
int bdrv_commit(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    int64_t sector, total_sectors, length, backing_length;
    int n, ro, open_flags;
    int ret = 0;
    uint8_t *buf = NULL;

    if (!drv)
        return -ENOMEDIUM;

    if (!bs->backing) {
        return -ENOTSUP;
    }

    if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
        bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
        return -EBUSY;
    }

    /* Remember the backing image's original mode so it can be restored */
    ro = bs->backing->bs->read_only;
    open_flags = bs->backing->bs->open_flags;

    if (ro) {
        if (bdrv_reopen(bs->backing->bs, open_flags | BDRV_O_RDWR, NULL)) {
            return -EACCES;
        }
    }

    length = bdrv_getlength(bs);
    if (length < 0) {
        ret = length;
        goto ro_cleanup;
    }

    backing_length = bdrv_getlength(bs->backing->bs);
    if (backing_length < 0) {
        ret = backing_length;
        goto ro_cleanup;
    }

    /* If our top snapshot is larger than the backing file image,
     * grow the backing file image if possible.  If not possible,
     * we must return an error */
    if (length > backing_length) {
        ret = bdrv_truncate(bs->backing->bs, length);
        if (ret < 0) {
            goto ro_cleanup;
        }
    }

    total_sectors = length >> BDRV_SECTOR_BITS;

    /* qemu_try_blockalign() for bs will choose an alignment that works for
     * bs->backing->bs as well, so no need to compare the alignment manually. */
    buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
    if (buf == NULL) {
        ret = -ENOMEM;
        goto ro_cleanup;
    }

    /* Walk the image; n is set by bdrv_is_allocated() and is used both as
     * the copy size and as the step to the next range. */
    for (sector = 0; sector < total_sectors; sector += n) {
        ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
        if (ret < 0) {
            goto ro_cleanup;
        }
        if (ret) {
            /* Range is allocated in the top image: copy it down */
            ret = bdrv_read(bs, sector, buf, n);
            if (ret < 0) {
                goto ro_cleanup;
            }

            ret = bdrv_write(bs->backing->bs, sector, buf, n);
            if (ret < 0) {
                goto ro_cleanup;
            }
        }
    }

    if (drv->bdrv_make_empty) {
        ret = drv->bdrv_make_empty(bs);
        if (ret < 0) {
            goto ro_cleanup;
        }
        /* NOTE(review): the result of this flush is not checked */
        bdrv_flush(bs);
    }

    /*
     * Make sure all data we wrote to the backing device is actually
     * stable on disk.
     */
    if (bs->backing) {
        /* NOTE(review): the result of this flush is not checked either */
        bdrv_flush(bs->backing->bs);
    }

    ret = 0;
ro_cleanup:
    /* buf is still NULL here if we bailed out before the allocation */
    qemu_vfree(buf);

    if (ro) {
        /* ignoring error return here */
        bdrv_reopen(bs->backing->bs, open_flags & ~BDRV_O_RDWR, NULL);
    }

    return ret;
}
2302
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002303int bdrv_commit_all(void)
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002304{
2305 BlockDriverState *bs;
2306
Benoît Canetdc364f42014-01-23 21:31:32 +01002307 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002308 AioContext *aio_context = bdrv_get_aio_context(bs);
2309
2310 aio_context_acquire(aio_context);
Kevin Wolf760e0062015-06-17 14:55:21 +02002311 if (bs->drv && bs->backing) {
Jeff Cody272d2d82013-02-26 09:55:48 -05002312 int ret = bdrv_commit(bs);
2313 if (ret < 0) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002314 aio_context_release(aio_context);
Jeff Cody272d2d82013-02-26 09:55:48 -05002315 return ret;
2316 }
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002317 }
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002318 aio_context_release(aio_context);
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002319 }
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002320 return 0;
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002321}
2322
Kevin Wolf756e6732010-01-12 12:55:17 +01002323/*
2324 * Return values:
2325 * 0 - success
2326 * -EINVAL - backing format specified, but no file
2327 * -ENOSPC - can't update the backing file because no space is left in the
2328 * image file header
2329 * -ENOTSUP - format driver doesn't support changing the backing file
2330 */
2331int bdrv_change_backing_file(BlockDriverState *bs,
2332 const char *backing_file, const char *backing_fmt)
2333{
2334 BlockDriver *drv = bs->drv;
Paolo Bonzini469ef352012-04-12 14:01:02 +02002335 int ret;
Kevin Wolf756e6732010-01-12 12:55:17 +01002336
Paolo Bonzini5f377792012-04-12 14:01:01 +02002337 /* Backing file format doesn't make sense without a backing file */
2338 if (backing_fmt && !backing_file) {
2339 return -EINVAL;
2340 }
2341
Kevin Wolf756e6732010-01-12 12:55:17 +01002342 if (drv->bdrv_change_backing_file != NULL) {
Paolo Bonzini469ef352012-04-12 14:01:02 +02002343 ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
Kevin Wolf756e6732010-01-12 12:55:17 +01002344 } else {
Paolo Bonzini469ef352012-04-12 14:01:02 +02002345 ret = -ENOTSUP;
Kevin Wolf756e6732010-01-12 12:55:17 +01002346 }
Paolo Bonzini469ef352012-04-12 14:01:02 +02002347
2348 if (ret == 0) {
2349 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2350 pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2351 }
2352 return ret;
Kevin Wolf756e6732010-01-12 12:55:17 +01002353}
2354
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002355/*
2356 * Finds the image layer in the chain that has 'bs' as its backing file.
2357 *
2358 * active is the current topmost image.
2359 *
2360 * Returns NULL if bs is not found in active's image chain,
2361 * or if active == bs.
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002362 *
2363 * Returns the bottommost base image if bs == NULL.
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002364 */
2365BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
2366 BlockDriverState *bs)
2367{
Kevin Wolf760e0062015-06-17 14:55:21 +02002368 while (active && bs != backing_bs(active)) {
2369 active = backing_bs(active);
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002370 }
2371
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002372 return active;
2373}
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002374
/* Given a BDS, searches for the base layer.
 *
 * Implemented as a bdrv_find_overlay() lookup for NULL starting at @bs. */
BlockDriverState *bdrv_find_base(BlockDriverState *bs)
{
    return bdrv_find_overlay(bs, NULL);
}
2380
/* Queue element holding one BlockDriverState; bdrv_drop_intermediate()
 * uses a QSIMPLEQ of these to collect the images it is going to drop. */
typedef struct BlkIntermediateStates {
    BlockDriverState *bs;
    QSIMPLEQ_ENTRY(BlkIntermediateStates) entry;
} BlkIntermediateStates;
2385
2386
/*
 * Drops images above 'base' up to and including 'top', and sets the image
 * above 'top' to have base as its backing file.
 *
 * Requires that the overlay to 'top' is opened r/w, so that the backing file
 * information in 'bs' can be properly updated.
 *
 * E.g., this will convert the following chain:
 * bottom <- base <- intermediate <- top <- active
 *
 * to
 *
 * bottom <- base <- active
 *
 * It is allowed for bottom==base, in which case it converts:
 *
 * base <- intermediate <- top <- active
 *
 * to
 *
 * base <- active
 *
 * If backing_file_str is non-NULL, it will be used when modifying top's
 * overlay image metadata.
 *
 * Returns 0 on success. Returns -EIO if 'top' or 'base' has no driver, if no
 * overlay of 'top' is found below 'active', or if 'base' is not reached when
 * walking down from 'top'; otherwise returns the error reported by
 * bdrv_change_backing_file().
 *
 * Error conditions:
 *  if active == top, that is considered an error
 *
 */
int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
                           BlockDriverState *base, const char *backing_file_str)
{
    BlockDriverState *intermediate;
    BlockDriverState *base_bs = NULL;
    BlockDriverState *new_top_bs = NULL;
    BlkIntermediateStates *intermediate_state, *next;
    int ret = -EIO;

    QSIMPLEQ_HEAD(states_to_delete, BlkIntermediateStates) states_to_delete;
    QSIMPLEQ_INIT(&states_to_delete);

    if (!top->drv || !base->drv) {
        goto exit;
    }

    /* new_top_bs is the image directly above 'top'; it will end up
     * pointing at 'base' */
    new_top_bs = bdrv_find_overlay(active, top);

    if (new_top_bs == NULL) {
        /* we could not find the image above 'top', this is an error */
        goto exit;
    }

    /* special case of new_top_bs->backing->bs already pointing to base - nothing
     * to do, no intermediate images */
    if (backing_bs(new_top_bs) == base) {
        ret = 0;
        goto exit;
    }

    intermediate = top;

    /* now we will go down through the list, and add each BDS we find
     * into our deletion queue, until we hit the 'base'
     */
    while (intermediate) {
        intermediate_state = g_new0(BlkIntermediateStates, 1);
        intermediate_state->bs = intermediate;
        QSIMPLEQ_INSERT_TAIL(&states_to_delete, intermediate_state, entry);

        if (backing_bs(intermediate) == base) {
            base_bs = backing_bs(intermediate);
            break;
        }
        intermediate = backing_bs(intermediate);
    }
    if (base_bs == NULL) {
        /* something went wrong, we did not end at the base. safely
         * unravel everything, and exit with error */
        goto exit;
    }

    /* success - we can delete the intermediate states, and link top->base */
    backing_file_str = backing_file_str ? backing_file_str : base_bs->filename;
    ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
                                   base_bs->drv ? base_bs->drv->format_name : "");
    if (ret) {
        goto exit;
    }
    bdrv_set_backing_hd(new_top_bs, base_bs);

    QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
        /* so that bdrv_close() does not recursively close the chain */
        bdrv_set_backing_hd(intermediate_state->bs, NULL);
        bdrv_unref(intermediate_state->bs);
    }
    ret = 0;

exit:
    /* Free the queue elements themselves on every path, success or error */
    QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
        g_free(intermediate_state);
    }
    return ret;
}
2490
bellard83f64092006-08-01 16:21:11 +00002491/**
bellard83f64092006-08-01 16:21:11 +00002492 * Truncate file to 'offset' bytes (needed only for file protocols)
2493 */
2494int bdrv_truncate(BlockDriverState *bs, int64_t offset)
2495{
2496 BlockDriver *drv = bs->drv;
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002497 int ret;
bellard83f64092006-08-01 16:21:11 +00002498 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00002499 return -ENOMEDIUM;
bellard83f64092006-08-01 16:21:11 +00002500 if (!drv->bdrv_truncate)
2501 return -ENOTSUP;
Naphtali Sprei59f26892009-10-26 16:25:16 +02002502 if (bs->read_only)
2503 return -EACCES;
Jeff Cody9c75e162014-06-25 16:55:30 -04002504
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002505 ret = drv->bdrv_truncate(bs, offset);
2506 if (ret == 0) {
2507 ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
John Snowce1ffea2015-04-17 19:50:03 -04002508 bdrv_dirty_bitmap_truncate(bs);
Markus Armbrustera7f53e22014-10-07 13:59:25 +02002509 if (bs->blk) {
2510 blk_dev_resize_cb(bs->blk);
2511 }
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002512 }
2513 return ret;
bellard83f64092006-08-01 16:21:11 +00002514}
2515
2516/**
Fam Zheng4a1d5e12011-07-12 19:56:39 +08002517 * Length of a allocated file in bytes. Sparse files are counted by actual
2518 * allocated space. Return < 0 if error or unknown.
2519 */
2520int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
2521{
2522 BlockDriver *drv = bs->drv;
2523 if (!drv) {
2524 return -ENOMEDIUM;
2525 }
2526 if (drv->bdrv_get_allocated_file_size) {
2527 return drv->bdrv_get_allocated_file_size(bs);
2528 }
2529 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02002530 return bdrv_get_allocated_file_size(bs->file->bs);
Fam Zheng4a1d5e12011-07-12 19:56:39 +08002531 }
2532 return -ENOTSUP;
2533}
2534
2535/**
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002536 * Return number of sectors on success, -errno on error.
bellard83f64092006-08-01 16:21:11 +00002537 */
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002538int64_t bdrv_nb_sectors(BlockDriverState *bs)
bellard83f64092006-08-01 16:21:11 +00002539{
2540 BlockDriver *drv = bs->drv;
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002541
bellard83f64092006-08-01 16:21:11 +00002542 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00002543 return -ENOMEDIUM;
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002544
Kevin Wolfb94a2612013-10-29 12:18:58 +01002545 if (drv->has_variable_length) {
2546 int ret = refresh_total_sectors(bs, bs->total_sectors);
2547 if (ret < 0) {
2548 return ret;
Stefan Hajnoczi46a4e4e2011-03-29 20:04:41 +01002549 }
bellard83f64092006-08-01 16:21:11 +00002550 }
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002551 return bs->total_sectors;
2552}
2553
2554/**
2555 * Return length in bytes on success, -errno on error.
2556 * The length is always a multiple of BDRV_SECTOR_SIZE.
2557 */
2558int64_t bdrv_getlength(BlockDriverState *bs)
2559{
2560 int64_t ret = bdrv_nb_sectors(bs);
2561
Fam Zheng4a9c9ea2015-05-15 16:36:05 +08002562 ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002563 return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
bellardfc01f7e2003-06-30 10:03:06 +00002564}
2565
bellard19cb3732006-08-19 11:45:59 +00002566/* return 0 as number of sectors if no device present or error */
ths96b8f132007-12-17 01:35:20 +00002567void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
bellardfc01f7e2003-06-30 10:03:06 +00002568{
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002569 int64_t nb_sectors = bdrv_nb_sectors(bs);
2570
2571 *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
bellardfc01f7e2003-06-30 10:03:06 +00002572}
bellardcf989512004-02-16 21:56:36 +00002573
/* Record the error policies of @bs for read and for write errors. */
void bdrv_set_on_error(BlockDriverState *bs, BlockdevOnError on_read_error,
                       BlockdevOnError on_write_error)
{
    bs->on_read_error = on_read_error;
    bs->on_write_error = on_write_error;
}
2580
Paolo Bonzini1ceee0d2012-09-28 17:22:56 +02002581BlockdevOnError bdrv_get_on_error(BlockDriverState *bs, bool is_read)
Markus Armbrusterabd7f682010-06-02 18:55:17 +02002582{
2583 return is_read ? bs->on_read_error : bs->on_write_error;
2584}
2585
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002586BlockErrorAction bdrv_get_error_action(BlockDriverState *bs, bool is_read, int error)
2587{
2588 BlockdevOnError on_err = is_read ? bs->on_read_error : bs->on_write_error;
2589
2590 switch (on_err) {
2591 case BLOCKDEV_ON_ERROR_ENOSPC:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002592 return (error == ENOSPC) ?
2593 BLOCK_ERROR_ACTION_STOP : BLOCK_ERROR_ACTION_REPORT;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002594 case BLOCKDEV_ON_ERROR_STOP:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002595 return BLOCK_ERROR_ACTION_STOP;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002596 case BLOCKDEV_ON_ERROR_REPORT:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002597 return BLOCK_ERROR_ACTION_REPORT;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002598 case BLOCKDEV_ON_ERROR_IGNORE:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002599 return BLOCK_ERROR_ACTION_IGNORE;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002600 default:
2601 abort();
2602 }
2603}
2604
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002605static void send_qmp_error_event(BlockDriverState *bs,
2606 BlockErrorAction action,
2607 bool is_read, int error)
2608{
Peter Maydell573742a2014-10-10 20:33:03 +01002609 IoOperationType optype;
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002610
Peter Maydell573742a2014-10-10 20:33:03 +01002611 optype = is_read ? IO_OPERATION_TYPE_READ : IO_OPERATION_TYPE_WRITE;
2612 qapi_event_send_block_io_error(bdrv_get_device_name(bs), optype, action,
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002613 bdrv_iostatus_is_enabled(bs),
Luiz Capitulino624ff572014-09-11 10:25:48 -04002614 error == ENOSPC, strerror(error),
2615 &error_abort);
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002616}
2617
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002618/* This is done by device models because, while the block layer knows
2619 * about the error, it does not know whether an operation comes from
2620 * the device or the block layer (from a job, for example).
2621 */
2622void bdrv_error_action(BlockDriverState *bs, BlockErrorAction action,
2623 bool is_read, int error)
2624{
2625 assert(error >= 0);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002626
Wenchao Xiaa5895692014-06-18 08:43:30 +02002627 if (action == BLOCK_ERROR_ACTION_STOP) {
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002628 /* First set the iostatus, so that "info block" returns an iostatus
2629 * that matches the events raised so far (an additional error iostatus
2630 * is fine, but not a lost one).
2631 */
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002632 bdrv_iostatus_set_err(bs, error);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002633
2634 /* Then raise the request to stop the VM and the event.
2635 * qemu_system_vmstop_request_prepare has two effects. First,
2636 * it ensures that the STOP event always comes after the
2637 * BLOCK_IO_ERROR event. Second, it ensures that even if management
2638 * can observe the STOP event and do a "cont" before the STOP
2639 * event is issued, the VM will not stop. In this case, vm_start()
2640 * also ensures that the STOP/RESUME pair of events is emitted.
2641 */
2642 qemu_system_vmstop_request_prepare();
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002643 send_qmp_error_event(bs, action, is_read, error);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002644 qemu_system_vmstop_request(RUN_STATE_IO_ERROR);
2645 } else {
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002646 send_qmp_error_event(bs, action, is_read, error);
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002647 }
2648}
2649
/* Return the read_only field of @bs. */
int bdrv_is_read_only(BlockDriverState *bs)
{
    return bs->read_only;
}
2654
/* Return the sg field of @bs. */
int bdrv_is_sg(BlockDriverState *bs)
{
    return bs->sg;
}
2659
/* Return the current write cache setting of @bs (despite the name, this
 * only reads the setting and changes nothing). */
int bdrv_enable_write_cache(BlockDriverState *bs)
{
    return bs->enable_write_cache;
}
2664
Paolo Bonzini425b0142012-06-06 00:04:52 +02002665void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
2666{
2667 bs->enable_write_cache = wce;
Jeff Cody55b110f2012-09-20 15:13:18 -04002668
2669 /* so a reopen() will preserve wce */
2670 if (wce) {
2671 bs->open_flags |= BDRV_O_CACHE_WB;
2672 } else {
2673 bs->open_flags &= ~BDRV_O_CACHE_WB;
2674 }
Paolo Bonzini425b0142012-06-06 00:04:52 +02002675}
2676
bellardea2384d2004-08-01 21:59:26 +00002677int bdrv_is_encrypted(BlockDriverState *bs)
2678{
Kevin Wolf760e0062015-06-17 14:55:21 +02002679 if (bs->backing && bs->backing->bs->encrypted) {
bellardea2384d2004-08-01 21:59:26 +00002680 return 1;
Kevin Wolf760e0062015-06-17 14:55:21 +02002681 }
bellardea2384d2004-08-01 21:59:26 +00002682 return bs->encrypted;
2683}
2684
aliguoric0f4ce72009-03-05 23:01:01 +00002685int bdrv_key_required(BlockDriverState *bs)
2686{
Kevin Wolf760e0062015-06-17 14:55:21 +02002687 BdrvChild *backing = bs->backing;
aliguoric0f4ce72009-03-05 23:01:01 +00002688
Kevin Wolf760e0062015-06-17 14:55:21 +02002689 if (backing && backing->bs->encrypted && !backing->bs->valid_key) {
aliguoric0f4ce72009-03-05 23:01:01 +00002690 return 1;
Kevin Wolf760e0062015-06-17 14:55:21 +02002691 }
aliguoric0f4ce72009-03-05 23:01:01 +00002692 return (bs->encrypted && !bs->valid_key);
2693}
2694
bellardea2384d2004-08-01 21:59:26 +00002695int bdrv_set_key(BlockDriverState *bs, const char *key)
2696{
2697 int ret;
Kevin Wolf760e0062015-06-17 14:55:21 +02002698 if (bs->backing && bs->backing->bs->encrypted) {
2699 ret = bdrv_set_key(bs->backing->bs, key);
bellardea2384d2004-08-01 21:59:26 +00002700 if (ret < 0)
2701 return ret;
2702 if (!bs->encrypted)
2703 return 0;
2704 }
Shahar Havivifd04a2a2010-03-06 00:26:13 +02002705 if (!bs->encrypted) {
2706 return -EINVAL;
2707 } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2708 return -ENOMEDIUM;
2709 }
aliguoric0f4ce72009-03-05 23:01:01 +00002710 ret = bs->drv->bdrv_set_key(bs, key);
aliguoribb5fc202009-03-05 23:01:15 +00002711 if (ret < 0) {
2712 bs->valid_key = 0;
2713 } else if (!bs->valid_key) {
2714 bs->valid_key = 1;
Markus Armbrustera7f53e22014-10-07 13:59:25 +02002715 if (bs->blk) {
2716 /* call the change callback now, we skipped it on open */
2717 blk_dev_change_media_cb(bs->blk, true);
2718 }
aliguoribb5fc202009-03-05 23:01:15 +00002719 }
aliguoric0f4ce72009-03-05 23:01:01 +00002720 return ret;
bellardea2384d2004-08-01 21:59:26 +00002721}
2722
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002723/*
2724 * Provide an encryption key for @bs.
2725 * If @key is non-null:
2726 * If @bs is not encrypted, fail.
2727 * Else if the key is invalid, fail.
2728 * Else set @bs's key to @key, replacing the existing key, if any.
2729 * If @key is null:
2730 * If @bs is encrypted and still lacks a key, fail.
2731 * Else do nothing.
2732 * On failure, store an error object through @errp if non-null.
2733 */
2734void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
2735{
2736 if (key) {
2737 if (!bdrv_is_encrypted(bs)) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03002738 error_setg(errp, "Node '%s' is not encrypted",
2739 bdrv_get_device_or_node_name(bs));
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002740 } else if (bdrv_set_key(bs, key) < 0) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002741 error_setg(errp, QERR_INVALID_PASSWORD);
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002742 }
2743 } else {
2744 if (bdrv_key_required(bs)) {
Markus Armbrusterb1ca6392015-01-29 10:37:01 +01002745 error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2746 "'%s' (%s) is encrypted",
Alberto Garcia81e5f782015-04-08 12:29:19 +03002747 bdrv_get_device_or_node_name(bs),
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002748 bdrv_get_encrypted_filename(bs));
2749 }
2750 }
2751}
2752
Markus Armbrusterf8d6bba2012-06-13 10:11:48 +02002753const char *bdrv_get_format_name(BlockDriverState *bs)
bellardea2384d2004-08-01 21:59:26 +00002754{
Markus Armbrusterf8d6bba2012-06-13 10:11:48 +02002755 return bs->drv ? bs->drv->format_name : NULL;
bellardea2384d2004-08-01 21:59:26 +00002756}
2757
/*
 * qsort() comparator for an array of C strings (const char *).
 *
 * qsort() hands the comparator pointers to the array elements, so @a and @b
 * are really 'const char *const *' and must be dereferenced once to reach
 * the strings; passing them to strcmp() directly would compare the bytes of
 * the pointers themselves.
 *
 * Returns <0, 0 or >0 as strcmp() does.
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2762
ths5fafdf22007-09-16 21:08:06 +00002763void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
bellardea2384d2004-08-01 21:59:26 +00002764 void *opaque)
2765{
2766 BlockDriver *drv;
Jeff Codye855e4f2014-04-28 18:29:54 -04002767 int count = 0;
Stefan Hajnocziada42402014-08-27 12:08:55 +01002768 int i;
Jeff Codye855e4f2014-04-28 18:29:54 -04002769 const char **formats = NULL;
bellardea2384d2004-08-01 21:59:26 +00002770
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +01002771 QLIST_FOREACH(drv, &bdrv_drivers, list) {
Jeff Codye855e4f2014-04-28 18:29:54 -04002772 if (drv->format_name) {
2773 bool found = false;
2774 int i = count;
2775 while (formats && i && !found) {
2776 found = !strcmp(formats[--i], drv->format_name);
2777 }
2778
2779 if (!found) {
Markus Armbruster5839e532014-08-19 10:31:08 +02002780 formats = g_renew(const char *, formats, count + 1);
Jeff Codye855e4f2014-04-28 18:29:54 -04002781 formats[count++] = drv->format_name;
Jeff Codye855e4f2014-04-28 18:29:54 -04002782 }
2783 }
bellardea2384d2004-08-01 21:59:26 +00002784 }
Stefan Hajnocziada42402014-08-27 12:08:55 +01002785
2786 qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2787
2788 for (i = 0; i < count; i++) {
2789 it(opaque, formats[i]);
2790 }
2791
Jeff Codye855e4f2014-04-28 18:29:54 -04002792 g_free(formats);
bellardea2384d2004-08-01 21:59:26 +00002793}
2794
Benoît Canetdc364f42014-01-23 21:31:32 +01002795/* This function is to find a node in the bs graph */
2796BlockDriverState *bdrv_find_node(const char *node_name)
2797{
2798 BlockDriverState *bs;
2799
2800 assert(node_name);
2801
2802 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2803 if (!strcmp(node_name, bs->node_name)) {
2804 return bs;
2805 }
2806 }
2807 return NULL;
2808}
2809
Benoît Canetc13163f2014-01-23 21:31:34 +01002810/* Put this QMP function here so it can access the static graph_bdrv_states. */
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002811BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
Benoît Canetc13163f2014-01-23 21:31:34 +01002812{
2813 BlockDeviceInfoList *list, *entry;
2814 BlockDriverState *bs;
2815
2816 list = NULL;
2817 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002818 BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
2819 if (!info) {
2820 qapi_free_BlockDeviceInfoList(list);
2821 return NULL;
2822 }
Benoît Canetc13163f2014-01-23 21:31:34 +01002823 entry = g_malloc0(sizeof(*entry));
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002824 entry->value = info;
Benoît Canetc13163f2014-01-23 21:31:34 +01002825 entry->next = list;
2826 list = entry;
2827 }
2828
2829 return list;
2830}
2831
Benoît Canet12d3ba82014-01-23 21:31:35 +01002832BlockDriverState *bdrv_lookup_bs(const char *device,
2833 const char *node_name,
2834 Error **errp)
2835{
Markus Armbruster7f06d472014-10-07 13:59:12 +02002836 BlockBackend *blk;
2837 BlockDriverState *bs;
Benoît Canet12d3ba82014-01-23 21:31:35 +01002838
Benoît Canet12d3ba82014-01-23 21:31:35 +01002839 if (device) {
Markus Armbruster7f06d472014-10-07 13:59:12 +02002840 blk = blk_by_name(device);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002841
Markus Armbruster7f06d472014-10-07 13:59:12 +02002842 if (blk) {
2843 return blk_bs(blk);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002844 }
Benoît Canet12d3ba82014-01-23 21:31:35 +01002845 }
2846
Benoît Canetdd67fa52014-02-12 17:15:06 +01002847 if (node_name) {
2848 bs = bdrv_find_node(node_name);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002849
Benoît Canetdd67fa52014-02-12 17:15:06 +01002850 if (bs) {
2851 return bs;
2852 }
Benoît Canet12d3ba82014-01-23 21:31:35 +01002853 }
2854
Benoît Canetdd67fa52014-02-12 17:15:06 +01002855 error_setg(errp, "Cannot find device=%s nor node_name=%s",
2856 device ? device : "",
2857 node_name ? node_name : "");
2858 return NULL;
Benoît Canet12d3ba82014-01-23 21:31:35 +01002859}
2860
Jeff Cody5a6684d2014-06-25 15:40:09 -04002861/* If 'base' is in the same chain as 'top', return true. Otherwise,
2862 * return false. If either argument is NULL, return false. */
2863bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
2864{
2865 while (top && top != base) {
Kevin Wolf760e0062015-06-17 14:55:21 +02002866 top = backing_bs(top);
Jeff Cody5a6684d2014-06-25 15:40:09 -04002867 }
2868
2869 return top != NULL;
2870}
2871
Fam Zheng04df7652014-10-31 11:32:54 +08002872BlockDriverState *bdrv_next_node(BlockDriverState *bs)
2873{
2874 if (!bs) {
2875 return QTAILQ_FIRST(&graph_bdrv_states);
2876 }
2877 return QTAILQ_NEXT(bs, node_list);
2878}
2879
Markus Armbruster2f399b02010-06-02 18:55:20 +02002880BlockDriverState *bdrv_next(BlockDriverState *bs)
2881{
2882 if (!bs) {
2883 return QTAILQ_FIRST(&bdrv_states);
2884 }
Benoît Canetdc364f42014-01-23 21:31:32 +01002885 return QTAILQ_NEXT(bs, device_list);
Markus Armbruster2f399b02010-06-02 18:55:20 +02002886}
2887
/* Return the node name stored in @bs. */
const char *bdrv_get_node_name(const BlockDriverState *bs)
{
    return bs->node_name;
}
2892
Markus Armbruster7f06d472014-10-07 13:59:12 +02002893/* TODO check what callers really want: bs->node_name or blk_name() */
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002894const char *bdrv_get_device_name(const BlockDriverState *bs)
bellardea2384d2004-08-01 21:59:26 +00002895{
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002896 return bs->blk ? blk_name(bs->blk) : "";
bellardea2384d2004-08-01 21:59:26 +00002897}
2898
Alberto Garcia9b2aa842015-04-08 12:29:18 +03002899/* This can be used to identify nodes that might not have a device
2900 * name associated. Since node and device names live in the same
2901 * namespace, the result is unambiguous. The exception is if both are
2902 * absent, then this returns an empty (non-null) string. */
2903const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
2904{
2905 return bs->blk ? blk_name(bs->blk) : bs->node_name;
2906}
2907
Markus Armbrusterc8433282012-06-05 16:49:24 +02002908int bdrv_get_flags(BlockDriverState *bs)
2909{
2910 return bs->open_flags;
2911}
2912
Peter Lieven3ac21622013-06-28 12:47:42 +02002913int bdrv_has_zero_init_1(BlockDriverState *bs)
2914{
2915 return 1;
2916}
2917
Kevin Wolff2feebb2010-04-14 17:30:35 +02002918int bdrv_has_zero_init(BlockDriverState *bs)
2919{
2920 assert(bs->drv);
2921
Paolo Bonzini11212d82013-09-04 19:00:27 +02002922 /* If BS is a copy on write image, it is initialized to
2923 the contents of the base image, which may not be zeroes. */
Kevin Wolf760e0062015-06-17 14:55:21 +02002924 if (bs->backing) {
Paolo Bonzini11212d82013-09-04 19:00:27 +02002925 return 0;
2926 }
Kevin Wolf336c1c12010-07-28 11:26:29 +02002927 if (bs->drv->bdrv_has_zero_init) {
2928 return bs->drv->bdrv_has_zero_init(bs);
Kevin Wolff2feebb2010-04-14 17:30:35 +02002929 }
2930
Peter Lieven3ac21622013-06-28 12:47:42 +02002931 /* safe default */
2932 return 0;
Kevin Wolff2feebb2010-04-14 17:30:35 +02002933}
2934
Peter Lieven4ce78692013-10-24 12:06:54 +02002935bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
2936{
2937 BlockDriverInfo bdi;
2938
Kevin Wolf760e0062015-06-17 14:55:21 +02002939 if (bs->backing) {
Peter Lieven4ce78692013-10-24 12:06:54 +02002940 return false;
2941 }
2942
2943 if (bdrv_get_info(bs, &bdi) == 0) {
2944 return bdi.unallocated_blocks_are_zero;
2945 }
2946
2947 return false;
2948}
2949
2950bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
2951{
2952 BlockDriverInfo bdi;
2953
Kevin Wolf760e0062015-06-17 14:55:21 +02002954 if (bs->backing || !(bs->open_flags & BDRV_O_UNMAP)) {
Peter Lieven4ce78692013-10-24 12:06:54 +02002955 return false;
2956 }
2957
2958 if (bdrv_get_info(bs, &bdi) == 0) {
2959 return bdi.can_write_zeroes_with_unmap;
2960 }
2961
2962 return false;
2963}
2964
aliguori045df332009-03-05 23:00:48 +00002965const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
2966{
Kevin Wolf760e0062015-06-17 14:55:21 +02002967 if (bs->backing && bs->backing->bs->encrypted)
aliguori045df332009-03-05 23:00:48 +00002968 return bs->backing_file;
2969 else if (bs->encrypted)
2970 return bs->filename;
2971 else
2972 return NULL;
2973}
2974
ths5fafdf22007-09-16 21:08:06 +00002975void bdrv_get_backing_filename(BlockDriverState *bs,
bellard83f64092006-08-01 16:21:11 +00002976 char *filename, int filename_size)
bellardea2384d2004-08-01 21:59:26 +00002977{
Kevin Wolf3574c602011-10-26 11:02:11 +02002978 pstrcpy(filename, filename_size, bs->backing_file);
bellardea2384d2004-08-01 21:59:26 +00002979}
2980
bellardfaea38e2006-08-05 21:31:00 +00002981int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
2982{
2983 BlockDriver *drv = bs->drv;
2984 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00002985 return -ENOMEDIUM;
bellardfaea38e2006-08-05 21:31:00 +00002986 if (!drv->bdrv_get_info)
2987 return -ENOTSUP;
2988 memset(bdi, 0, sizeof(*bdi));
2989 return drv->bdrv_get_info(bs, bdi);
2990}
2991
Max Reitzeae041f2013-10-09 10:46:16 +02002992ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
2993{
2994 BlockDriver *drv = bs->drv;
2995 if (drv && drv->bdrv_get_specific_info) {
2996 return drv->bdrv_get_specific_info(bs);
2997 }
2998 return NULL;
2999}
3000
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003001void bdrv_debug_event(BlockDriverState *bs, BlkDebugEvent event)
3002{
Kevin Wolfbf736fe2013-06-05 15:17:55 +02003003 if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003004 return;
3005 }
3006
Kevin Wolfbf736fe2013-06-05 15:17:55 +02003007 bs->drv->bdrv_debug_event(bs, event);
Kevin Wolf41c695c2012-12-06 14:32:58 +01003008}
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003009
Kevin Wolf41c695c2012-12-06 14:32:58 +01003010int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
3011 const char *tag)
3012{
3013 while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003014 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003015 }
3016
3017 if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
3018 return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
3019 }
3020
3021 return -ENOTSUP;
3022}
3023
Fam Zheng4cc70e92013-11-20 10:01:54 +08003024int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
3025{
3026 while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003027 bs = bs->file ? bs->file->bs : NULL;
Fam Zheng4cc70e92013-11-20 10:01:54 +08003028 }
3029
3030 if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
3031 return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
3032 }
3033
3034 return -ENOTSUP;
3035}
3036
Kevin Wolf41c695c2012-12-06 14:32:58 +01003037int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
3038{
Max Reitz938789e2014-03-10 23:44:08 +01003039 while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003040 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003041 }
3042
3043 if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
3044 return bs->drv->bdrv_debug_resume(bs, tag);
3045 }
3046
3047 return -ENOTSUP;
3048}
3049
3050bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
3051{
3052 while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003053 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003054 }
3055
3056 if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
3057 return bs->drv->bdrv_debug_is_suspended(bs, tag);
3058 }
3059
3060 return false;
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003061}
3062
Blue Swirl199630b2010-07-25 20:49:34 +00003063int bdrv_is_snapshot(BlockDriverState *bs)
3064{
3065 return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3066}
3067
Jeff Codyb1b1d782012-10-16 15:49:09 -04003068/* backing_file can either be relative, or absolute, or a protocol. If it is
3069 * relative, it must be relative to the chain. So, passing in bs->filename
3070 * from a BDS as backing_file should not be done, as that may be relative to
3071 * the CWD rather than the chain. */
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003072BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3073 const char *backing_file)
3074{
Jeff Codyb1b1d782012-10-16 15:49:09 -04003075 char *filename_full = NULL;
3076 char *backing_file_full = NULL;
3077 char *filename_tmp = NULL;
3078 int is_protocol = 0;
3079 BlockDriverState *curr_bs = NULL;
3080 BlockDriverState *retval = NULL;
3081
3082 if (!bs || !bs->drv || !backing_file) {
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003083 return NULL;
3084 }
3085
Jeff Codyb1b1d782012-10-16 15:49:09 -04003086 filename_full = g_malloc(PATH_MAX);
3087 backing_file_full = g_malloc(PATH_MAX);
3088 filename_tmp = g_malloc(PATH_MAX);
3089
3090 is_protocol = path_has_protocol(backing_file);
3091
Kevin Wolf760e0062015-06-17 14:55:21 +02003092 for (curr_bs = bs; curr_bs->backing; curr_bs = curr_bs->backing->bs) {
Jeff Codyb1b1d782012-10-16 15:49:09 -04003093
3094 /* If either of the filename paths is actually a protocol, then
3095 * compare unmodified paths; otherwise make paths relative */
3096 if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3097 if (strcmp(backing_file, curr_bs->backing_file) == 0) {
Kevin Wolf760e0062015-06-17 14:55:21 +02003098 retval = curr_bs->backing->bs;
Jeff Codyb1b1d782012-10-16 15:49:09 -04003099 break;
3100 }
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003101 } else {
Jeff Codyb1b1d782012-10-16 15:49:09 -04003102 /* If not an absolute filename path, make it relative to the current
3103 * image's filename path */
3104 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3105 backing_file);
3106
3107 /* We are going to compare absolute pathnames */
3108 if (!realpath(filename_tmp, filename_full)) {
3109 continue;
3110 }
3111
3112 /* We need to make sure the backing filename we are comparing against
3113 * is relative to the current image filename (or absolute) */
3114 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3115 curr_bs->backing_file);
3116
3117 if (!realpath(filename_tmp, backing_file_full)) {
3118 continue;
3119 }
3120
3121 if (strcmp(backing_file_full, filename_full) == 0) {
Kevin Wolf760e0062015-06-17 14:55:21 +02003122 retval = curr_bs->backing->bs;
Jeff Codyb1b1d782012-10-16 15:49:09 -04003123 break;
3124 }
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003125 }
3126 }
3127
Jeff Codyb1b1d782012-10-16 15:49:09 -04003128 g_free(filename_full);
3129 g_free(backing_file_full);
3130 g_free(filename_tmp);
3131 return retval;
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003132}
3133
Benoît Canetf198fd12012-08-02 10:22:47 +02003134int bdrv_get_backing_file_depth(BlockDriverState *bs)
3135{
3136 if (!bs->drv) {
3137 return 0;
3138 }
3139
Kevin Wolf760e0062015-06-17 14:55:21 +02003140 if (!bs->backing) {
Benoît Canetf198fd12012-08-02 10:22:47 +02003141 return 0;
3142 }
3143
Kevin Wolf760e0062015-06-17 14:55:21 +02003144 return 1 + bdrv_get_backing_file_depth(bs->backing->bs);
Benoît Canetf198fd12012-08-02 10:22:47 +02003145}
3146
bellardea2384d2004-08-01 21:59:26 +00003147void bdrv_init(void)
3148{
Anthony Liguori5efa9d52009-05-09 17:03:42 -05003149 module_call_init(MODULE_INIT_BLOCK);
bellardea2384d2004-08-01 21:59:26 +00003150}
pbrookce1a14d2006-08-07 02:38:06 +00003151
Markus Armbrustereb852012009-10-27 18:41:44 +01003152void bdrv_init_with_whitelist(void)
3153{
3154 use_bdrv_whitelist = 1;
3155 bdrv_init();
3156}
3157
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003158void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
Anthony Liguori0f154232011-11-14 15:09:45 -06003159{
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003160 Error *local_err = NULL;
3161 int ret;
3162
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003163 if (!bs->drv) {
3164 return;
Anthony Liguori0f154232011-11-14 15:09:45 -06003165 }
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003166
Alexey Kardashevskiy7ea2d262014-10-09 13:50:46 +11003167 if (!(bs->open_flags & BDRV_O_INCOMING)) {
3168 return;
3169 }
3170 bs->open_flags &= ~BDRV_O_INCOMING;
3171
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003172 if (bs->drv->bdrv_invalidate_cache) {
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003173 bs->drv->bdrv_invalidate_cache(bs, &local_err);
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003174 } else if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003175 bdrv_invalidate_cache(bs->file->bs, &local_err);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003176 }
3177 if (local_err) {
3178 error_propagate(errp, local_err);
3179 return;
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003180 }
3181
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003182 ret = refresh_total_sectors(bs, bs->total_sectors);
3183 if (ret < 0) {
3184 error_setg_errno(errp, -ret, "Could not refresh total sector count");
3185 return;
3186 }
Anthony Liguori0f154232011-11-14 15:09:45 -06003187}
3188
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003189void bdrv_invalidate_cache_all(Error **errp)
Anthony Liguori0f154232011-11-14 15:09:45 -06003190{
3191 BlockDriverState *bs;
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003192 Error *local_err = NULL;
Anthony Liguori0f154232011-11-14 15:09:45 -06003193
Benoît Canetdc364f42014-01-23 21:31:32 +01003194 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02003195 AioContext *aio_context = bdrv_get_aio_context(bs);
3196
3197 aio_context_acquire(aio_context);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003198 bdrv_invalidate_cache(bs, &local_err);
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02003199 aio_context_release(aio_context);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003200 if (local_err) {
3201 error_propagate(errp, local_err);
3202 return;
3203 }
Anthony Liguori0f154232011-11-14 15:09:45 -06003204 }
3205}
3206
Kevin Wolff9f05dc2011-07-15 13:50:26 +02003207/**************************************************************/
bellard19cb3732006-08-19 11:45:59 +00003208/* removable device support */
3209
3210/**
3211 * Return TRUE if the media is present
3212 */
3213int bdrv_is_inserted(BlockDriverState *bs)
3214{
3215 BlockDriver *drv = bs->drv;
Markus Armbrustera1aff5b2011-09-06 18:58:41 +02003216
bellard19cb3732006-08-19 11:45:59 +00003217 if (!drv)
3218 return 0;
3219 if (!drv->bdrv_is_inserted)
Markus Armbrustera1aff5b2011-09-06 18:58:41 +02003220 return 1;
3221 return drv->bdrv_is_inserted(bs);
bellard19cb3732006-08-19 11:45:59 +00003222}
3223
3224/**
Markus Armbruster8e49ca42011-08-03 15:08:08 +02003225 * Return whether the media changed since the last call to this
3226 * function, or -ENOTSUP if we don't know. Most drivers don't know.
bellard19cb3732006-08-19 11:45:59 +00003227 */
3228int bdrv_media_changed(BlockDriverState *bs)
3229{
3230 BlockDriver *drv = bs->drv;
bellard19cb3732006-08-19 11:45:59 +00003231
Markus Armbruster8e49ca42011-08-03 15:08:08 +02003232 if (drv && drv->bdrv_media_changed) {
3233 return drv->bdrv_media_changed(bs);
3234 }
3235 return -ENOTSUP;
bellard19cb3732006-08-19 11:45:59 +00003236}
3237
3238/**
3239 * If eject_flag is TRUE, eject the media. Otherwise, close the tray
3240 */
Luiz Capitulinof36f3942012-02-03 16:24:53 -02003241void bdrv_eject(BlockDriverState *bs, bool eject_flag)
bellard19cb3732006-08-19 11:45:59 +00003242{
3243 BlockDriver *drv = bs->drv;
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003244 const char *device_name;
bellard19cb3732006-08-19 11:45:59 +00003245
Markus Armbruster822e1cd2011-07-20 18:23:42 +02003246 if (drv && drv->bdrv_eject) {
3247 drv->bdrv_eject(bs, eject_flag);
bellard19cb3732006-08-19 11:45:59 +00003248 }
Luiz Capitulino6f382ed2012-02-14 13:41:13 -02003249
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003250 device_name = bdrv_get_device_name(bs);
3251 if (device_name[0] != '\0') {
3252 qapi_event_send_device_tray_moved(device_name,
Wenchao Xiaa5ee7bd2014-06-18 08:43:44 +02003253 eject_flag, &error_abort);
Luiz Capitulino6f382ed2012-02-14 13:41:13 -02003254 }
bellard19cb3732006-08-19 11:45:59 +00003255}
3256
bellard19cb3732006-08-19 11:45:59 +00003257/**
3258 * Lock or unlock the media (if it is locked, the user won't be able
3259 * to eject it manually).
3260 */
Markus Armbruster025e8492011-09-06 18:58:47 +02003261void bdrv_lock_medium(BlockDriverState *bs, bool locked)
bellard19cb3732006-08-19 11:45:59 +00003262{
3263 BlockDriver *drv = bs->drv;
3264
Markus Armbruster025e8492011-09-06 18:58:47 +02003265 trace_bdrv_lock_medium(bs, locked);
Stefan Hajnoczib8c6d092011-03-29 20:04:40 +01003266
Markus Armbruster025e8492011-09-06 18:58:47 +02003267 if (drv && drv->bdrv_lock_medium) {
3268 drv->bdrv_lock_medium(bs, locked);
bellard19cb3732006-08-19 11:45:59 +00003269 }
3270}
ths985a03b2007-12-24 16:10:43 +00003271
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01003272void bdrv_set_guest_block_size(BlockDriverState *bs, int align)
Markus Armbruster7b6f9302011-09-06 18:58:56 +02003273{
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01003274 bs->guest_block_size = align;
Markus Armbruster7b6f9302011-09-06 18:58:56 +02003275}
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003276
Fam Zheng0db6e542015-04-17 19:49:50 -04003277BdrvDirtyBitmap *bdrv_find_dirty_bitmap(BlockDriverState *bs, const char *name)
3278{
3279 BdrvDirtyBitmap *bm;
3280
3281 assert(name);
3282 QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
3283 if (bm->name && !strcmp(name, bm->name)) {
3284 return bm;
3285 }
3286 }
3287 return NULL;
3288}
3289
John Snow20dca812015-04-17 19:50:02 -04003290void bdrv_dirty_bitmap_make_anon(BdrvDirtyBitmap *bitmap)
Fam Zheng0db6e542015-04-17 19:49:50 -04003291{
John Snow9bd2b082015-04-17 19:49:57 -04003292 assert(!bdrv_dirty_bitmap_frozen(bitmap));
Fam Zheng0db6e542015-04-17 19:49:50 -04003293 g_free(bitmap->name);
3294 bitmap->name = NULL;
3295}
3296
3297BdrvDirtyBitmap *bdrv_create_dirty_bitmap(BlockDriverState *bs,
John Snow5fba6c02015-04-17 19:49:51 -04003298 uint32_t granularity,
Fam Zheng0db6e542015-04-17 19:49:50 -04003299 const char *name,
Fam Zhengb8afb522014-04-16 09:34:30 +08003300 Error **errp)
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003301{
3302 int64_t bitmap_size;
Fam Zhenge4654d22013-11-13 18:29:43 +08003303 BdrvDirtyBitmap *bitmap;
John Snow5fba6c02015-04-17 19:49:51 -04003304 uint32_t sector_granularity;
Jan Kiszkaa55eb922009-11-30 18:21:19 +01003305
Paolo Bonzini50717e92013-01-21 17:09:45 +01003306 assert((granularity & (granularity - 1)) == 0);
3307
Fam Zheng0db6e542015-04-17 19:49:50 -04003308 if (name && bdrv_find_dirty_bitmap(bs, name)) {
3309 error_setg(errp, "Bitmap already exists: %s", name);
3310 return NULL;
3311 }
John Snow5fba6c02015-04-17 19:49:51 -04003312 sector_granularity = granularity >> BDRV_SECTOR_BITS;
3313 assert(sector_granularity);
Markus Armbruster57322b72014-06-26 13:23:22 +02003314 bitmap_size = bdrv_nb_sectors(bs);
Fam Zhengb8afb522014-04-16 09:34:30 +08003315 if (bitmap_size < 0) {
3316 error_setg_errno(errp, -bitmap_size, "could not get length of device");
3317 errno = -bitmap_size;
3318 return NULL;
3319 }
Markus Armbruster5839e532014-08-19 10:31:08 +02003320 bitmap = g_new0(BdrvDirtyBitmap, 1);
John Snow5fba6c02015-04-17 19:49:51 -04003321 bitmap->bitmap = hbitmap_alloc(bitmap_size, ctz32(sector_granularity));
John Snowe74e6b72015-04-17 19:49:59 -04003322 bitmap->size = bitmap_size;
Fam Zheng0db6e542015-04-17 19:49:50 -04003323 bitmap->name = g_strdup(name);
John Snowb8e6fb72015-04-17 19:49:56 -04003324 bitmap->disabled = false;
Fam Zhenge4654d22013-11-13 18:29:43 +08003325 QLIST_INSERT_HEAD(&bs->dirty_bitmaps, bitmap, list);
3326 return bitmap;
3327}
3328
John Snow9bd2b082015-04-17 19:49:57 -04003329bool bdrv_dirty_bitmap_frozen(BdrvDirtyBitmap *bitmap)
3330{
3331 return bitmap->successor;
3332}
3333
John Snowb8e6fb72015-04-17 19:49:56 -04003334bool bdrv_dirty_bitmap_enabled(BdrvDirtyBitmap *bitmap)
3335{
John Snow9bd2b082015-04-17 19:49:57 -04003336 return !(bitmap->disabled || bitmap->successor);
3337}
3338
John Snow9abe3bd2015-05-12 15:53:01 -04003339DirtyBitmapStatus bdrv_dirty_bitmap_status(BdrvDirtyBitmap *bitmap)
3340{
3341 if (bdrv_dirty_bitmap_frozen(bitmap)) {
3342 return DIRTY_BITMAP_STATUS_FROZEN;
3343 } else if (!bdrv_dirty_bitmap_enabled(bitmap)) {
3344 return DIRTY_BITMAP_STATUS_DISABLED;
3345 } else {
3346 return DIRTY_BITMAP_STATUS_ACTIVE;
3347 }
3348}
3349
John Snow9bd2b082015-04-17 19:49:57 -04003350/**
3351 * Create a successor bitmap destined to replace this bitmap after an operation.
3352 * Requires that the bitmap is not frozen and has no successor.
3353 */
3354int bdrv_dirty_bitmap_create_successor(BlockDriverState *bs,
3355 BdrvDirtyBitmap *bitmap, Error **errp)
3356{
3357 uint64_t granularity;
3358 BdrvDirtyBitmap *child;
3359
3360 if (bdrv_dirty_bitmap_frozen(bitmap)) {
3361 error_setg(errp, "Cannot create a successor for a bitmap that is "
3362 "currently frozen");
3363 return -1;
3364 }
3365 assert(!bitmap->successor);
3366
3367 /* Create an anonymous successor */
3368 granularity = bdrv_dirty_bitmap_granularity(bitmap);
3369 child = bdrv_create_dirty_bitmap(bs, granularity, NULL, errp);
3370 if (!child) {
3371 return -1;
3372 }
3373
3374 /* Successor will be on or off based on our current state. */
3375 child->disabled = bitmap->disabled;
3376
3377 /* Install the successor and freeze the parent */
3378 bitmap->successor = child;
3379 return 0;
3380}
3381
3382/**
3383 * For a bitmap with a successor, yield our name to the successor,
3384 * delete the old bitmap, and return a handle to the new bitmap.
3385 */
3386BdrvDirtyBitmap *bdrv_dirty_bitmap_abdicate(BlockDriverState *bs,
3387 BdrvDirtyBitmap *bitmap,
3388 Error **errp)
3389{
3390 char *name;
3391 BdrvDirtyBitmap *successor = bitmap->successor;
3392
3393 if (successor == NULL) {
3394 error_setg(errp, "Cannot relinquish control if "
3395 "there's no successor present");
3396 return NULL;
3397 }
3398
3399 name = bitmap->name;
3400 bitmap->name = NULL;
3401 successor->name = name;
3402 bitmap->successor = NULL;
3403 bdrv_release_dirty_bitmap(bs, bitmap);
3404
3405 return successor;
3406}
3407
3408/**
3409 * In cases of failure where we can no longer safely delete the parent,
3410 * we may wish to re-join the parent and child/successor.
3411 * The merged parent will be un-frozen, but not explicitly re-enabled.
3412 */
3413BdrvDirtyBitmap *bdrv_reclaim_dirty_bitmap(BlockDriverState *bs,
3414 BdrvDirtyBitmap *parent,
3415 Error **errp)
3416{
3417 BdrvDirtyBitmap *successor = parent->successor;
3418
3419 if (!successor) {
3420 error_setg(errp, "Cannot reclaim a successor when none is present");
3421 return NULL;
3422 }
3423
3424 if (!hbitmap_merge(parent->bitmap, successor->bitmap)) {
3425 error_setg(errp, "Merging of parent and successor bitmap failed");
3426 return NULL;
3427 }
3428 bdrv_release_dirty_bitmap(bs, successor);
3429 parent->successor = NULL;
3430
3431 return parent;
John Snowb8e6fb72015-04-17 19:49:56 -04003432}
3433
John Snowce1ffea2015-04-17 19:50:03 -04003434/**
3435 * Truncates _all_ bitmaps attached to a BDS.
3436 */
3437static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs)
3438{
3439 BdrvDirtyBitmap *bitmap;
3440 uint64_t size = bdrv_nb_sectors(bs);
3441
3442 QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
John Snow06207b02015-06-10 13:24:54 -04003443 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowce1ffea2015-04-17 19:50:03 -04003444 hbitmap_truncate(bitmap->bitmap, size);
John Snow5270b6a2015-06-08 16:49:15 -04003445 bitmap->size = size;
John Snowce1ffea2015-04-17 19:50:03 -04003446 }
3447}
3448
Fam Zhenge4654d22013-11-13 18:29:43 +08003449void bdrv_release_dirty_bitmap(BlockDriverState *bs, BdrvDirtyBitmap *bitmap)
3450{
3451 BdrvDirtyBitmap *bm, *next;
3452 QLIST_FOREACH_SAFE(bm, &bs->dirty_bitmaps, list, next) {
3453 if (bm == bitmap) {
John Snow9bd2b082015-04-17 19:49:57 -04003454 assert(!bdrv_dirty_bitmap_frozen(bm));
Fam Zhenge4654d22013-11-13 18:29:43 +08003455 QLIST_REMOVE(bitmap, list);
3456 hbitmap_free(bitmap->bitmap);
Fam Zheng0db6e542015-04-17 19:49:50 -04003457 g_free(bitmap->name);
Fam Zhenge4654d22013-11-13 18:29:43 +08003458 g_free(bitmap);
3459 return;
Jan Kiszkaa55eb922009-11-30 18:21:19 +01003460 }
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003461 }
3462}
3463
John Snowb8e6fb72015-04-17 19:49:56 -04003464void bdrv_disable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3465{
John Snow9bd2b082015-04-17 19:49:57 -04003466 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowb8e6fb72015-04-17 19:49:56 -04003467 bitmap->disabled = true;
3468}
3469
3470void bdrv_enable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3471{
John Snow9bd2b082015-04-17 19:49:57 -04003472 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowb8e6fb72015-04-17 19:49:56 -04003473 bitmap->disabled = false;
3474}
3475
Fam Zheng21b56832013-11-13 18:29:44 +08003476BlockDirtyInfoList *bdrv_query_dirty_bitmaps(BlockDriverState *bs)
3477{
3478 BdrvDirtyBitmap *bm;
3479 BlockDirtyInfoList *list = NULL;
3480 BlockDirtyInfoList **plist = &list;
3481
3482 QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
Markus Armbruster5839e532014-08-19 10:31:08 +02003483 BlockDirtyInfo *info = g_new0(BlockDirtyInfo, 1);
3484 BlockDirtyInfoList *entry = g_new0(BlockDirtyInfoList, 1);
John Snow20dca812015-04-17 19:50:02 -04003485 info->count = bdrv_get_dirty_count(bm);
John Snow592fdd02015-04-17 19:49:53 -04003486 info->granularity = bdrv_dirty_bitmap_granularity(bm);
Fam Zheng0db6e542015-04-17 19:49:50 -04003487 info->has_name = !!bm->name;
3488 info->name = g_strdup(bm->name);
John Snow9abe3bd2015-05-12 15:53:01 -04003489 info->status = bdrv_dirty_bitmap_status(bm);
Fam Zheng21b56832013-11-13 18:29:44 +08003490 entry->value = info;
3491 *plist = entry;
3492 plist = &entry->next;
3493 }
3494
3495 return list;
3496}
3497
Fam Zhenge4654d22013-11-13 18:29:43 +08003498int bdrv_get_dirty(BlockDriverState *bs, BdrvDirtyBitmap *bitmap, int64_t sector)
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003499{
Fam Zhenge4654d22013-11-13 18:29:43 +08003500 if (bitmap) {
3501 return hbitmap_get(bitmap->bitmap, sector);
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003502 } else {
3503 return 0;
3504 }
3505}
3506
John Snow341ebc22015-04-17 19:49:52 -04003507/**
3508 * Chooses a default granularity based on the existing cluster size,
3509 * but clamped between [4K, 64K]. Defaults to 64K in the case that there
3510 * is no cluster size information available.
3511 */
3512uint32_t bdrv_get_default_bitmap_granularity(BlockDriverState *bs)
3513{
3514 BlockDriverInfo bdi;
3515 uint32_t granularity;
3516
3517 if (bdrv_get_info(bs, &bdi) >= 0 && bdi.cluster_size > 0) {
3518 granularity = MAX(4096, bdi.cluster_size);
3519 granularity = MIN(65536, granularity);
3520 } else {
3521 granularity = 65536;
3522 }
3523
3524 return granularity;
3525}
3526
John Snow592fdd02015-04-17 19:49:53 -04003527uint32_t bdrv_dirty_bitmap_granularity(BdrvDirtyBitmap *bitmap)
3528{
3529 return BDRV_SECTOR_SIZE << hbitmap_granularity(bitmap->bitmap);
3530}
3531
John Snow20dca812015-04-17 19:50:02 -04003532void bdrv_dirty_iter_init(BdrvDirtyBitmap *bitmap, HBitmapIter *hbi)
Paolo Bonzini1755da12012-10-18 16:49:18 +02003533{
Fam Zhenge4654d22013-11-13 18:29:43 +08003534 hbitmap_iter_init(hbi, bitmap->bitmap, 0);
Paolo Bonzini1755da12012-10-18 16:49:18 +02003535}
3536
John Snow20dca812015-04-17 19:50:02 -04003537void bdrv_set_dirty_bitmap(BdrvDirtyBitmap *bitmap,
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003538 int64_t cur_sector, int nr_sectors)
3539{
John Snowb8e6fb72015-04-17 19:49:56 -04003540 assert(bdrv_dirty_bitmap_enabled(bitmap));
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003541 hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
3542}
3543
John Snow20dca812015-04-17 19:50:02 -04003544void bdrv_reset_dirty_bitmap(BdrvDirtyBitmap *bitmap,
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003545 int64_t cur_sector, int nr_sectors)
3546{
John Snowb8e6fb72015-04-17 19:49:56 -04003547 assert(bdrv_dirty_bitmap_enabled(bitmap));
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003548 hbitmap_reset(bitmap->bitmap, cur_sector, nr_sectors);
3549}
3550
John Snowe74e6b72015-04-17 19:49:59 -04003551void bdrv_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3552{
3553 assert(bdrv_dirty_bitmap_enabled(bitmap));
Wen Congyangc6a8c322015-05-22 09:29:46 +08003554 hbitmap_reset_all(bitmap->bitmap);
John Snowe74e6b72015-04-17 19:49:59 -04003555}
3556
Stefan Hajnoczie0c47b62015-04-28 14:27:50 +01003557void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector,
3558 int nr_sectors)
Paolo Bonzini1755da12012-10-18 16:49:18 +02003559{
Fam Zhenge4654d22013-11-13 18:29:43 +08003560 BdrvDirtyBitmap *bitmap;
3561 QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
John Snowb8e6fb72015-04-17 19:49:56 -04003562 if (!bdrv_dirty_bitmap_enabled(bitmap)) {
3563 continue;
3564 }
Fam Zhenge4654d22013-11-13 18:29:43 +08003565 hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
Paolo Bonzini8f0720e2013-01-21 17:09:41 +01003566 }
Liran Schouraaa0eb72010-01-26 10:31:48 +02003567}
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003568
John Snowd58d8452015-04-17 19:49:58 -04003569/**
3570 * Advance an HBitmapIter to an arbitrary offset.
3571 */
3572void bdrv_set_dirty_iter(HBitmapIter *hbi, int64_t offset)
3573{
3574 assert(hbi->hb);
3575 hbitmap_iter_init(hbi, hbi->hb, offset);
3576}
3577
John Snow20dca812015-04-17 19:50:02 -04003578int64_t bdrv_get_dirty_count(BdrvDirtyBitmap *bitmap)
Fam Zhenge4654d22013-11-13 18:29:43 +08003579{
3580 return hbitmap_count(bitmap->bitmap);
3581}
3582
Fam Zheng9fcb0252013-08-23 09:14:46 +08003583/* Get a reference to bs */
3584void bdrv_ref(BlockDriverState *bs)
3585{
3586 bs->refcnt++;
3587}
3588
3589/* Release a previously grabbed reference to bs.
3590 * If after releasing, reference count is zero, the BlockDriverState is
3591 * deleted. */
3592void bdrv_unref(BlockDriverState *bs)
3593{
Jeff Cody9a4d5ca2014-07-23 17:22:57 -04003594 if (!bs) {
3595 return;
3596 }
Fam Zheng9fcb0252013-08-23 09:14:46 +08003597 assert(bs->refcnt > 0);
3598 if (--bs->refcnt == 0) {
3599 bdrv_delete(bs);
3600 }
3601}
3602
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003603struct BdrvOpBlocker {
3604 Error *reason;
3605 QLIST_ENTRY(BdrvOpBlocker) list;
3606};
3607
3608bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3609{
3610 BdrvOpBlocker *blocker;
3611 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3612 if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3613 blocker = QLIST_FIRST(&bs->op_blockers[op]);
3614 if (errp) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03003615 error_setg(errp, "Node '%s' is busy: %s",
3616 bdrv_get_device_or_node_name(bs),
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003617 error_get_pretty(blocker->reason));
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003618 }
3619 return true;
3620 }
3621 return false;
3622}
3623
3624void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3625{
3626 BdrvOpBlocker *blocker;
3627 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3628
Markus Armbruster5839e532014-08-19 10:31:08 +02003629 blocker = g_new0(BdrvOpBlocker, 1);
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003630 blocker->reason = reason;
3631 QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3632}
3633
3634void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3635{
3636 BdrvOpBlocker *blocker, *next;
3637 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3638 QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3639 if (blocker->reason == reason) {
3640 QLIST_REMOVE(blocker, list);
3641 g_free(blocker);
3642 }
3643 }
3644}
3645
3646void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3647{
3648 int i;
3649 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3650 bdrv_op_block(bs, i, reason);
3651 }
3652}
3653
3654void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3655{
3656 int i;
3657 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3658 bdrv_op_unblock(bs, i, reason);
3659 }
3660}
3661
3662bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3663{
3664 int i;
3665
3666 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3667 if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3668 return false;
3669 }
3670 }
3671 return true;
3672}
3673
Luiz Capitulino28a72822011-09-26 17:43:50 -03003674void bdrv_iostatus_enable(BlockDriverState *bs)
3675{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003676 bs->iostatus_enabled = true;
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003677 bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003678}
3679
3680/* The I/O status is only enabled if the drive explicitly
3681 * enables it _and_ the VM is configured to stop on errors */
3682bool bdrv_iostatus_is_enabled(const BlockDriverState *bs)
3683{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003684 return (bs->iostatus_enabled &&
Paolo Bonzini92aa5c62012-09-28 17:22:55 +02003685 (bs->on_write_error == BLOCKDEV_ON_ERROR_ENOSPC ||
3686 bs->on_write_error == BLOCKDEV_ON_ERROR_STOP ||
3687 bs->on_read_error == BLOCKDEV_ON_ERROR_STOP));
Luiz Capitulino28a72822011-09-26 17:43:50 -03003688}
3689
3690void bdrv_iostatus_disable(BlockDriverState *bs)
3691{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003692 bs->iostatus_enabled = false;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003693}
3694
3695void bdrv_iostatus_reset(BlockDriverState *bs)
3696{
3697 if (bdrv_iostatus_is_enabled(bs)) {
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003698 bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
Paolo Bonzini3bd293c2012-10-18 16:49:27 +02003699 if (bs->job) {
3700 block_job_iostatus_reset(bs->job);
3701 }
Luiz Capitulino28a72822011-09-26 17:43:50 -03003702 }
3703}
3704
Luiz Capitulino28a72822011-09-26 17:43:50 -03003705void bdrv_iostatus_set_err(BlockDriverState *bs, int error)
3706{
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02003707 assert(bdrv_iostatus_is_enabled(bs));
3708 if (bs->iostatus == BLOCK_DEVICE_IO_STATUS_OK) {
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003709 bs->iostatus = error == ENOSPC ? BLOCK_DEVICE_IO_STATUS_NOSPACE :
3710 BLOCK_DEVICE_IO_STATUS_FAILED;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003711 }
3712}
3713
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003714void bdrv_img_create(const char *filename, const char *fmt,
3715 const char *base_filename, const char *base_fmt,
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003716 char *options, uint64_t img_size, int flags,
3717 Error **errp, bool quiet)
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003718{
Chunyan Liu83d05212014-06-05 17:20:51 +08003719 QemuOptsList *create_opts = NULL;
3720 QemuOpts *opts = NULL;
3721 const char *backing_fmt, *backing_file;
3722 int64_t size;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003723 BlockDriver *drv, *proto_drv;
Max Reitzcc84d902013-09-06 17:14:26 +02003724 Error *local_err = NULL;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003725 int ret = 0;
3726
3727 /* Find driver and parse its options */
3728 drv = bdrv_find_format(fmt);
3729 if (!drv) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003730 error_setg(errp, "Unknown file format '%s'", fmt);
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003731 return;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003732 }
3733
Max Reitzb65a5e12015-02-05 13:58:12 -05003734 proto_drv = bdrv_find_protocol(filename, true, errp);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003735 if (!proto_drv) {
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003736 return;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003737 }
3738
Max Reitzc6149722014-12-02 18:32:45 +01003739 if (!drv->create_opts) {
3740 error_setg(errp, "Format driver '%s' does not support image creation",
3741 drv->format_name);
3742 return;
3743 }
3744
3745 if (!proto_drv->create_opts) {
3746 error_setg(errp, "Protocol driver '%s' does not support image creation",
3747 proto_drv->format_name);
3748 return;
3749 }
3750
Chunyan Liuc282e1f2014-06-05 17:21:11 +08003751 create_opts = qemu_opts_append(create_opts, drv->create_opts);
3752 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003753
3754 /* Create parameter list with default values */
Chunyan Liu83d05212014-06-05 17:20:51 +08003755 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
Markus Armbruster39101f22015-02-12 16:46:36 +01003756 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003757
3758 /* Parse -o options */
3759 if (options) {
Markus Armbrusterdc523cd342015-02-12 18:37:11 +01003760 qemu_opts_do_parse(opts, options, NULL, &local_err);
3761 if (local_err) {
3762 error_report_err(local_err);
3763 local_err = NULL;
Chunyan Liu83d05212014-06-05 17:20:51 +08003764 error_setg(errp, "Invalid options for file format '%s'", fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003765 goto out;
3766 }
3767 }
3768
3769 if (base_filename) {
Markus Armbrusterf43e47d2015-02-12 17:52:20 +01003770 qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
Markus Armbruster6be41942015-02-12 17:49:02 +01003771 if (local_err) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003772 error_setg(errp, "Backing file not supported for file format '%s'",
3773 fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003774 goto out;
3775 }
3776 }
3777
3778 if (base_fmt) {
Markus Armbrusterf43e47d2015-02-12 17:52:20 +01003779 qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
Markus Armbruster6be41942015-02-12 17:49:02 +01003780 if (local_err) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003781 error_setg(errp, "Backing file format not supported for file "
3782 "format '%s'", fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003783 goto out;
3784 }
3785 }
3786
Chunyan Liu83d05212014-06-05 17:20:51 +08003787 backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
3788 if (backing_file) {
3789 if (!strcmp(filename, backing_file)) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003790 error_setg(errp, "Error: Trying to create an image with the "
3791 "same filename as the backing file");
Jes Sorensen792da932010-12-16 13:52:17 +01003792 goto out;
3793 }
3794 }
3795
Chunyan Liu83d05212014-06-05 17:20:51 +08003796 backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003797
3798 // The size for the image must always be specified, with one exception:
3799 // If we are using a backing file, we can obtain the size from there
Chunyan Liu83d05212014-06-05 17:20:51 +08003800 size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
3801 if (size == -1) {
3802 if (backing_file) {
Max Reitz66f6b812013-12-03 14:57:52 +01003803 BlockDriverState *bs;
Max Reitz29168012014-11-26 17:20:27 +01003804 char *full_backing = g_new0(char, PATH_MAX);
Markus Armbruster52bf1e72014-06-26 13:23:25 +02003805 int64_t size;
Paolo Bonzini63090da2012-04-12 14:01:03 +02003806 int back_flags;
Max Reitze6641712015-08-26 19:47:48 +02003807 QDict *backing_options = NULL;
Paolo Bonzini63090da2012-04-12 14:01:03 +02003808
Max Reitz29168012014-11-26 17:20:27 +01003809 bdrv_get_full_backing_filename_from_filename(filename, backing_file,
3810 full_backing, PATH_MAX,
3811 &local_err);
3812 if (local_err) {
3813 g_free(full_backing);
3814 goto out;
3815 }
3816
Paolo Bonzini63090da2012-04-12 14:01:03 +02003817 /* backing files always opened read-only */
3818 back_flags =
3819 flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003820
Max Reitze6641712015-08-26 19:47:48 +02003821 if (backing_fmt) {
3822 backing_options = qdict_new();
3823 qdict_put(backing_options, "driver",
3824 qstring_from_str(backing_fmt));
3825 }
3826
Max Reitzf67503e2014-02-18 18:33:05 +01003827 bs = NULL;
Max Reitze6641712015-08-26 19:47:48 +02003828 ret = bdrv_open(&bs, full_backing, NULL, backing_options,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02003829 back_flags, &local_err);
Max Reitz29168012014-11-26 17:20:27 +01003830 g_free(full_backing);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003831 if (ret < 0) {
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003832 goto out;
3833 }
Markus Armbruster52bf1e72014-06-26 13:23:25 +02003834 size = bdrv_getlength(bs);
3835 if (size < 0) {
3836 error_setg_errno(errp, -size, "Could not get size of '%s'",
3837 backing_file);
3838 bdrv_unref(bs);
3839 goto out;
3840 }
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003841
Markus Armbruster39101f22015-02-12 16:46:36 +01003842 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
Max Reitz66f6b812013-12-03 14:57:52 +01003843
3844 bdrv_unref(bs);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003845 } else {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003846 error_setg(errp, "Image creation needs a size parameter");
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003847 goto out;
3848 }
3849 }
3850
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003851 if (!quiet) {
Kővágó, Zoltánfe646692015-07-07 16:42:10 +02003852 printf("Formatting '%s', fmt=%s ", filename, fmt);
Fam Zheng43c5d8f2014-12-09 15:38:04 +08003853 qemu_opts_print(opts, " ");
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003854 puts("");
3855 }
Chunyan Liu83d05212014-06-05 17:20:51 +08003856
Chunyan Liuc282e1f2014-06-05 17:21:11 +08003857 ret = bdrv_create(drv, filename, opts, &local_err);
Chunyan Liu83d05212014-06-05 17:20:51 +08003858
Max Reitzcc84d902013-09-06 17:14:26 +02003859 if (ret == -EFBIG) {
3860 /* This is generally a better message than whatever the driver would
3861 * deliver (especially because of the cluster_size_hint), since that
3862 * is most probably not much different from "image too large". */
3863 const char *cluster_size_hint = "";
Chunyan Liu83d05212014-06-05 17:20:51 +08003864 if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
Max Reitzcc84d902013-09-06 17:14:26 +02003865 cluster_size_hint = " (try using a larger cluster size)";
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003866 }
Max Reitzcc84d902013-09-06 17:14:26 +02003867 error_setg(errp, "The image size is too large for file format '%s'"
3868 "%s", fmt, cluster_size_hint);
3869 error_free(local_err);
3870 local_err = NULL;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003871 }
3872
3873out:
Chunyan Liu83d05212014-06-05 17:20:51 +08003874 qemu_opts_del(opts);
3875 qemu_opts_free(create_opts);
Markus Armbruster84d18f02014-01-30 15:07:28 +01003876 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +02003877 error_propagate(errp, local_err);
3878 }
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003879}
Stefan Hajnoczi85d126f2013-03-07 13:41:48 +01003880
3881AioContext *bdrv_get_aio_context(BlockDriverState *bs)
3882{
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003883 return bs->aio_context;
3884}
3885
3886void bdrv_detach_aio_context(BlockDriverState *bs)
3887{
Max Reitz33384422014-06-20 21:57:33 +02003888 BdrvAioNotifier *baf;
3889
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003890 if (!bs->drv) {
3891 return;
3892 }
3893
Max Reitz33384422014-06-20 21:57:33 +02003894 QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
3895 baf->detach_aio_context(baf->opaque);
3896 }
3897
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003898 if (bs->io_limits_enabled) {
Benoît Canet0e5b0a22015-06-08 18:17:41 +02003899 throttle_timers_detach_aio_context(&bs->throttle_timers);
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003900 }
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003901 if (bs->drv->bdrv_detach_aio_context) {
3902 bs->drv->bdrv_detach_aio_context(bs);
3903 }
3904 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003905 bdrv_detach_aio_context(bs->file->bs);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003906 }
Kevin Wolf760e0062015-06-17 14:55:21 +02003907 if (bs->backing) {
3908 bdrv_detach_aio_context(bs->backing->bs);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003909 }
3910
3911 bs->aio_context = NULL;
3912}
3913
3914void bdrv_attach_aio_context(BlockDriverState *bs,
3915 AioContext *new_context)
3916{
Max Reitz33384422014-06-20 21:57:33 +02003917 BdrvAioNotifier *ban;
3918
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003919 if (!bs->drv) {
3920 return;
3921 }
3922
3923 bs->aio_context = new_context;
3924
Kevin Wolf760e0062015-06-17 14:55:21 +02003925 if (bs->backing) {
3926 bdrv_attach_aio_context(bs->backing->bs, new_context);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003927 }
3928 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003929 bdrv_attach_aio_context(bs->file->bs, new_context);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003930 }
3931 if (bs->drv->bdrv_attach_aio_context) {
3932 bs->drv->bdrv_attach_aio_context(bs, new_context);
3933 }
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003934 if (bs->io_limits_enabled) {
Benoît Canet0e5b0a22015-06-08 18:17:41 +02003935 throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003936 }
Max Reitz33384422014-06-20 21:57:33 +02003937
3938 QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
3939 ban->attached_aio_context(new_context, ban->opaque);
3940 }
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003941}
3942
3943void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3944{
Fam Zheng53ec73e2015-05-29 18:53:14 +08003945 bdrv_drain(bs); /* ensure there are no in-flight requests */
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003946
3947 bdrv_detach_aio_context(bs);
3948
3949 /* This function executes in the old AioContext so acquire the new one in
3950 * case it runs in a different thread.
3951 */
3952 aio_context_acquire(new_context);
3953 bdrv_attach_aio_context(bs, new_context);
3954 aio_context_release(new_context);
Stefan Hajnoczi85d126f2013-03-07 13:41:48 +01003955}
Stefan Hajnoczid616b222013-06-24 17:13:10 +02003956
Max Reitz33384422014-06-20 21:57:33 +02003957void bdrv_add_aio_context_notifier(BlockDriverState *bs,
3958 void (*attached_aio_context)(AioContext *new_context, void *opaque),
3959 void (*detach_aio_context)(void *opaque), void *opaque)
3960{
3961 BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
3962 *ban = (BdrvAioNotifier){
3963 .attached_aio_context = attached_aio_context,
3964 .detach_aio_context = detach_aio_context,
3965 .opaque = opaque
3966 };
3967
3968 QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
3969}
3970
3971void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
3972 void (*attached_aio_context)(AioContext *,
3973 void *),
3974 void (*detach_aio_context)(void *),
3975 void *opaque)
3976{
3977 BdrvAioNotifier *ban, *ban_next;
3978
3979 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
3980 if (ban->attached_aio_context == attached_aio_context &&
3981 ban->detach_aio_context == detach_aio_context &&
3982 ban->opaque == opaque)
3983 {
3984 QLIST_REMOVE(ban, list);
3985 g_free(ban);
3986
3987 return;
3988 }
3989 }
3990
3991 abort();
3992}
3993
Max Reitz77485432014-10-27 11:12:50 +01003994int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
3995 BlockDriverAmendStatusCB *status_cb)
Max Reitz6f176b42013-09-03 10:09:50 +02003996{
Chunyan Liuc282e1f2014-06-05 17:21:11 +08003997 if (!bs->drv->bdrv_amend_options) {
Max Reitz6f176b42013-09-03 10:09:50 +02003998 return -ENOTSUP;
3999 }
Max Reitz77485432014-10-27 11:12:50 +01004000 return bs->drv->bdrv_amend_options(bs, opts, status_cb);
Max Reitz6f176b42013-09-03 10:09:50 +02004001}
Benoît Canetf6186f42013-10-02 14:33:48 +02004002
Benoît Canetb5042a32014-03-03 19:11:34 +01004003/* This function will be called by the bdrv_recurse_is_first_non_filter method
4004 * of block filter and by bdrv_is_first_non_filter.
4005 * It is used to test if the given bs is the candidate or recurse more in the
4006 * node graph.
Benoît Canet212a5a82014-01-23 21:31:36 +01004007 */
Benoît Canet212a5a82014-01-23 21:31:36 +01004008bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
4009 BlockDriverState *candidate)
Benoît Canetf6186f42013-10-02 14:33:48 +02004010{
Benoît Canetb5042a32014-03-03 19:11:34 +01004011 /* return false if basic checks fails */
4012 if (!bs || !bs->drv) {
4013 return false;
4014 }
4015
4016 /* the code reached a non block filter driver -> check if the bs is
4017 * the same as the candidate. It's the recursion termination condition.
4018 */
4019 if (!bs->drv->is_filter) {
4020 return bs == candidate;
4021 }
4022 /* Down this path the driver is a block filter driver */
4023
4024 /* If the block filter recursion method is defined use it to recurse down
4025 * the node graph.
4026 */
4027 if (bs->drv->bdrv_recurse_is_first_non_filter) {
Benoît Canet212a5a82014-01-23 21:31:36 +01004028 return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
4029 }
4030
Benoît Canetb5042a32014-03-03 19:11:34 +01004031 /* the driver is a block filter but don't allow to recurse -> return false
4032 */
4033 return false;
Benoît Canet212a5a82014-01-23 21:31:36 +01004034}
4035
4036/* This function checks if the candidate is the first non filter bs down it's
4037 * bs chain. Since we don't have pointers to parents it explore all bs chains
4038 * from the top. Some filters can choose not to pass down the recursion.
4039 */
4040bool bdrv_is_first_non_filter(BlockDriverState *candidate)
4041{
4042 BlockDriverState *bs;
4043
4044 /* walk down the bs forest recursively */
4045 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
4046 bool perm;
4047
Benoît Canetb5042a32014-03-03 19:11:34 +01004048 /* try to recurse in this top level bs */
Kevin Wolfe6dc8a12014-02-04 11:45:31 +01004049 perm = bdrv_recurse_is_first_non_filter(bs, candidate);
Benoît Canet212a5a82014-01-23 21:31:36 +01004050
4051 /* candidate is the first non filter */
4052 if (perm) {
4053 return true;
4054 }
4055 }
4056
4057 return false;
Benoît Canetf6186f42013-10-02 14:33:48 +02004058}
Benoît Canet09158f02014-06-27 18:25:25 +02004059
Wen Congyange12f3782015-07-17 10:12:22 +08004060BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
4061 const char *node_name, Error **errp)
Benoît Canet09158f02014-06-27 18:25:25 +02004062{
4063 BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004064 AioContext *aio_context;
4065
Benoît Canet09158f02014-06-27 18:25:25 +02004066 if (!to_replace_bs) {
4067 error_setg(errp, "Node name '%s' not found", node_name);
4068 return NULL;
4069 }
4070
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004071 aio_context = bdrv_get_aio_context(to_replace_bs);
4072 aio_context_acquire(aio_context);
4073
Benoît Canet09158f02014-06-27 18:25:25 +02004074 if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004075 to_replace_bs = NULL;
4076 goto out;
Benoît Canet09158f02014-06-27 18:25:25 +02004077 }
4078
4079 /* We don't want arbitrary node of the BDS chain to be replaced only the top
4080 * most non filter in order to prevent data corruption.
4081 * Another benefit is that this tests exclude backing files which are
4082 * blocked by the backing blockers.
4083 */
Wen Congyange12f3782015-07-17 10:12:22 +08004084 if (!bdrv_recurse_is_first_non_filter(parent_bs, to_replace_bs)) {
Benoît Canet09158f02014-06-27 18:25:25 +02004085 error_setg(errp, "Only top most non filter can be replaced");
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004086 to_replace_bs = NULL;
4087 goto out;
Benoît Canet09158f02014-06-27 18:25:25 +02004088 }
4089
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004090out:
4091 aio_context_release(aio_context);
Benoît Canet09158f02014-06-27 18:25:25 +02004092 return to_replace_bs;
4093}
Ming Lei448ad912014-07-04 18:04:33 +08004094
Max Reitz91af7012014-07-18 20:24:56 +02004095static bool append_open_options(QDict *d, BlockDriverState *bs)
4096{
4097 const QDictEntry *entry;
4098 bool found_any = false;
4099
4100 for (entry = qdict_first(bs->options); entry;
4101 entry = qdict_next(bs->options, entry))
4102 {
4103 /* Only take options for this level and exclude all non-driver-specific
4104 * options */
4105 if (!strchr(qdict_entry_key(entry), '.') &&
4106 strcmp(qdict_entry_key(entry), "node-name"))
4107 {
4108 qobject_incref(qdict_entry_value(entry));
4109 qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
4110 found_any = true;
4111 }
4112 }
4113
4114 return found_any;
4115}
4116
4117/* Updates the following BDS fields:
4118 * - exact_filename: A filename which may be used for opening a block device
4119 * which (mostly) equals the given BDS (even without any
4120 * other options; so reading and writing must return the same
4121 * results, but caching etc. may be different)
4122 * - full_open_options: Options which, when given when opening a block device
4123 * (without a filename), result in a BDS (mostly)
4124 * equalling the given one
4125 * - filename: If exact_filename is set, it is copied here. Otherwise,
4126 * full_open_options is converted to a JSON object, prefixed with
4127 * "json:" (for use through the JSON pseudo protocol) and put here.
4128 */
4129void bdrv_refresh_filename(BlockDriverState *bs)
4130{
4131 BlockDriver *drv = bs->drv;
4132 QDict *opts;
4133
4134 if (!drv) {
4135 return;
4136 }
4137
4138 /* This BDS's file name will most probably depend on its file's name, so
4139 * refresh that first */
4140 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004141 bdrv_refresh_filename(bs->file->bs);
Max Reitz91af7012014-07-18 20:24:56 +02004142 }
4143
4144 if (drv->bdrv_refresh_filename) {
4145 /* Obsolete information is of no use here, so drop the old file name
4146 * information before refreshing it */
4147 bs->exact_filename[0] = '\0';
4148 if (bs->full_open_options) {
4149 QDECREF(bs->full_open_options);
4150 bs->full_open_options = NULL;
4151 }
4152
4153 drv->bdrv_refresh_filename(bs);
4154 } else if (bs->file) {
4155 /* Try to reconstruct valid information from the underlying file */
4156 bool has_open_options;
4157
4158 bs->exact_filename[0] = '\0';
4159 if (bs->full_open_options) {
4160 QDECREF(bs->full_open_options);
4161 bs->full_open_options = NULL;
4162 }
4163
4164 opts = qdict_new();
4165 has_open_options = append_open_options(opts, bs);
4166
4167 /* If no specific options have been given for this BDS, the filename of
4168 * the underlying file should suffice for this one as well */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004169 if (bs->file->bs->exact_filename[0] && !has_open_options) {
4170 strcpy(bs->exact_filename, bs->file->bs->exact_filename);
Max Reitz91af7012014-07-18 20:24:56 +02004171 }
4172 /* Reconstructing the full options QDict is simple for most format block
4173 * drivers, as long as the full options are known for the underlying
4174 * file BDS. The full options QDict of that file BDS should somehow
4175 * contain a representation of the filename, therefore the following
4176 * suffices without querying the (exact_)filename of this BDS. */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004177 if (bs->file->bs->full_open_options) {
Max Reitz91af7012014-07-18 20:24:56 +02004178 qdict_put_obj(opts, "driver",
4179 QOBJECT(qstring_from_str(drv->format_name)));
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004180 QINCREF(bs->file->bs->full_open_options);
4181 qdict_put_obj(opts, "file",
4182 QOBJECT(bs->file->bs->full_open_options));
Max Reitz91af7012014-07-18 20:24:56 +02004183
4184 bs->full_open_options = opts;
4185 } else {
4186 QDECREF(opts);
4187 }
4188 } else if (!bs->full_open_options && qdict_size(bs->options)) {
4189 /* There is no underlying file BDS (at least referenced by BDS.file),
4190 * so the full options QDict should be equal to the options given
4191 * specifically for this block device when it was opened (plus the
4192 * driver specification).
4193 * Because those options don't change, there is no need to update
4194 * full_open_options when it's already set. */
4195
4196 opts = qdict_new();
4197 append_open_options(opts, bs);
4198 qdict_put_obj(opts, "driver",
4199 QOBJECT(qstring_from_str(drv->format_name)));
4200
4201 if (bs->exact_filename[0]) {
4202 /* This may not work for all block protocol drivers (some may
4203 * require this filename to be parsed), but we have to find some
4204 * default solution here, so just include it. If some block driver
4205 * does not support pure options without any filename at all or
4206 * needs some special format of the options QDict, it needs to
4207 * implement the driver-specific bdrv_refresh_filename() function.
4208 */
4209 qdict_put_obj(opts, "filename",
4210 QOBJECT(qstring_from_str(bs->exact_filename)));
4211 }
4212
4213 bs->full_open_options = opts;
4214 }
4215
4216 if (bs->exact_filename[0]) {
4217 pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
4218 } else if (bs->full_open_options) {
4219 QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
4220 snprintf(bs->filename, sizeof(bs->filename), "json:%s",
4221 qstring_get_str(json));
4222 QDECREF(json);
4223 }
4224}
Benoît Canet5366d0c2014-09-05 15:46:18 +02004225
4226/* This accessor function purpose is to allow the device models to access the
4227 * BlockAcctStats structure embedded inside a BlockDriverState without being
4228 * aware of the BlockDriverState structure layout.
4229 * It will go away when the BlockAcctStats structure will be moved inside
4230 * the device models.
4231 */
4232BlockAcctStats *bdrv_get_stats(BlockDriverState *bs)
4233{
4234 return &bs->stats;
4235}