blob: 8fd345bb4f8068df45d3ff919a0d4958edd34993 [file] [log] [blame]
bellardfc01f7e2003-06-30 10:03:06 +00001/*
2 * QEMU System Emulator block driver
ths5fafdf22007-09-16 21:08:06 +00003 *
bellardfc01f7e2003-06-30 10:03:06 +00004 * Copyright (c) 2003 Fabrice Bellard
ths5fafdf22007-09-16 21:08:06 +00005 *
bellardfc01f7e2003-06-30 10:03:06 +00006 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
blueswir13990d092008-12-05 17:53:21 +000024#include "config-host.h"
pbrookfaf07962007-11-11 02:51:17 +000025#include "qemu-common.h"
Stefan Hajnoczi6d519a52010-05-22 18:15:08 +010026#include "trace.h"
Paolo Bonzini737e1502012-12-17 18:19:44 +010027#include "block/block_int.h"
28#include "block/blockjob.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010029#include "qemu/error-report.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010030#include "qemu/module.h"
Markus Armbrustercc7a8ea2015-03-17 17:22:46 +010031#include "qapi/qmp/qerror.h"
Paolo Bonzini7b1b5d12012-12-17 18:19:43 +010032#include "qapi/qmp/qjson.h"
Markus Armbrusterbfb197e2014-10-07 13:59:11 +020033#include "sysemu/block-backend.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010034#include "sysemu/sysemu.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010035#include "qemu/notify.h"
Paolo Bonzini737e1502012-12-17 18:19:44 +010036#include "block/coroutine.h"
Benoît Canetc13163f2014-01-23 21:31:34 +010037#include "block/qapi.h"
Luiz Capitulinob2023812011-09-21 17:16:47 -030038#include "qmp-commands.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010039#include "qemu/timer.h"
Wenchao Xiaa5ee7bd2014-06-18 08:43:44 +020040#include "qapi-event.h"
Alberto Garciadb628332015-06-08 18:17:45 +020041#include "block/throttle-groups.h"
bellardfc01f7e2003-06-30 10:03:06 +000042
Juan Quintela71e72a12009-07-27 16:12:56 +020043#ifdef CONFIG_BSD
bellard7674e7b2005-04-26 21:59:26 +000044#include <sys/types.h>
45#include <sys/stat.h>
46#include <sys/ioctl.h>
Blue Swirl72cf2d42009-09-12 07:36:22 +000047#include <sys/queue.h>
blueswir1c5e97232009-03-07 20:06:23 +000048#ifndef __DragonFly__
bellard7674e7b2005-04-26 21:59:26 +000049#include <sys/disk.h>
50#endif
blueswir1c5e97232009-03-07 20:06:23 +000051#endif
bellard7674e7b2005-04-26 21:59:26 +000052
aliguori49dc7682009-03-08 16:26:59 +000053#ifdef _WIN32
54#include <windows.h>
55#endif
56
John Snow9bd2b082015-04-17 19:49:57 -040057/**
58 * A BdrvDirtyBitmap can be in three possible states:
59 * (1) successor is NULL and disabled is false: full r/w mode
60 * (2) successor is NULL and disabled is true: read only mode ("disabled")
61 * (3) successor is set: frozen mode.
62 * A frozen bitmap cannot be renamed, deleted, anonymized, cleared, set,
63 * or enabled. A frozen bitmap can only abdicate() or reclaim().
64 */
Fam Zhenge4654d22013-11-13 18:29:43 +080065struct BdrvDirtyBitmap {
John Snowaa0c7ca2015-04-17 19:50:01 -040066 HBitmap *bitmap; /* Dirty sector bitmap implementation */
67 BdrvDirtyBitmap *successor; /* Anonymous child; implies frozen status */
68 char *name; /* Optional non-empty unique ID */
69 int64_t size; /* Size of the bitmap (Number of sectors) */
70 bool disabled; /* Bitmap is read-only */
Fam Zhenge4654d22013-11-13 18:29:43 +080071 QLIST_ENTRY(BdrvDirtyBitmap) list;
72};
73
Stefan Hajnoczi1c9805a2011-10-13 13:08:22 +010074#define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
75
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +010076static QTAILQ_HEAD(, BlockDriverState) bdrv_states =
77 QTAILQ_HEAD_INITIALIZER(bdrv_states);
blueswir17ee930d2008-09-17 19:04:14 +000078
Benoît Canetdc364f42014-01-23 21:31:32 +010079static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
80 QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
81
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +010082static QLIST_HEAD(, BlockDriver) bdrv_drivers =
83 QLIST_HEAD_INITIALIZER(bdrv_drivers);
bellardea2384d2004-08-01 21:59:26 +000084
Kevin Wolff3930ed2015-04-08 13:43:47 +020085static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
86 const char *reference, QDict *options, int flags,
87 BlockDriverState *parent,
Max Reitzce343772015-08-26 19:47:50 +020088 const BdrvChildRole *child_role, Error **errp);
Kevin Wolff3930ed2015-04-08 13:43:47 +020089
John Snowce1ffea2015-04-17 19:50:03 -040090static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs);
Markus Armbrustereb852012009-10-27 18:41:44 +010091/* If non-zero, use only whitelisted block drivers */
92static int use_bdrv_whitelist;
93
#ifdef _WIN32
/*
 * Return non-zero if @filename starts with an ASCII letter immediately
 * followed by a colon (e.g. "c:"), zero otherwise.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    int starts_with_letter = (letter >= 'a' && letter <= 'z') ||
                             (letter >= 'A' && letter <= 'Z');

    return starts_with_letter && filename[1] == ':';
}

/*
 * Return 1 if @filename is exactly a drive specification ("d:") or starts
 * with one of the prefixes "\\.\" or "//./"; return 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    /* Exactly a drive letter and a colon, with nothing after it */
    if (is_windows_drive_prefix(filename) && filename[2] == '\0') {
        return 1;
    }

    return strstart(filename, "\\\\.\\", NULL) ||
           strstart(filename, "//./", NULL);
}
#endif
113
Kevin Wolf339064d2013-11-28 10:23:32 +0100114size_t bdrv_opt_mem_align(BlockDriverState *bs)
115{
116 if (!bs || !bs->drv) {
Denis V. Lunev459b4e62015-05-12 17:30:56 +0300117 /* page size or 4k (hdd sector size) should be on the safe side */
118 return MAX(4096, getpagesize());
Kevin Wolf339064d2013-11-28 10:23:32 +0100119 }
120
121 return bs->bl.opt_mem_alignment;
122}
123
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300124size_t bdrv_min_mem_align(BlockDriverState *bs)
125{
126 if (!bs || !bs->drv) {
Denis V. Lunev459b4e62015-05-12 17:30:56 +0300127 /* page size or 4k (hdd sector size) should be on the safe side */
128 return MAX(4096, getpagesize());
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300129 }
130
131 return bs->bl.min_mem_alignment;
132}
133
/*
 * Check if the path starts with "<protocol>:".
 *
 * The path is scanned up to the first ':' or path separator; the result is
 * 1 only when that first stop character is a ':'.  On Windows, drive
 * specifications are never treated as protocols and '\\' also counts as a
 * path separator.
 */
int path_has_protocol(const char *path)
{
#ifdef _WIN32
    static const char stop_chars[] = ":/\\";

    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    static const char stop_chars[] = ":/";
#endif

    return path[strcspn(path, stop_chars)] == ':';
}
151
/*
 * Return non-zero if @path is absolute: it starts with '/', or, on Windows,
 * it starts with '\\' or is/starts with a drive specification.
 */
int path_is_absolute(const char *path)
{
#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (path[0] == '\\') {
        return 1;
    }
#endif
    return path[0] == '/';
}
164
/*
 * Build in @dest (of @dest_size bytes) the path of @filename relative to
 * @base_path.
 *
 * If @filename is absolute it is simply copied.  Otherwise the leading part
 * of @base_path, up to and including its last path separator or its first
 * ':' (whichever ends later), is copied and @filename is appended to it.
 * URLs are supported.  Nothing is written when @dest_size is not positive;
 * the copied prefix is clamped to @dest_size - 1 bytes.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *after_colon, *after_sep, *prefix_end;
    int prefix_len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* Position just past the first ':' of the base, if there is one */
    after_colon = strchr(base_path, ':');
    after_colon = after_colon ? after_colon + 1 : base_path;

    /* Position just past the last path separator of the base, if any */
    after_sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');
        if (!after_sep || backslash > after_sep) {
            after_sep = backslash;
        }
    }
#endif
    after_sep = after_sep ? after_sep + 1 : base_path;

    /* Keep whichever prefix is longer */
    prefix_end = after_sep > after_colon ? after_sep : after_colon;
    prefix_len = prefix_end - base_path;
    if (prefix_len > dest_size - 1) {
        prefix_len = dest_size - 1;
    }

    memcpy(dest, base_path, prefix_len);
    dest[prefix_len] = '\0';
    pstrcat(dest, dest_size, filename);
}
208
Max Reitz0a828552014-11-26 17:20:25 +0100209void bdrv_get_full_backing_filename_from_filename(const char *backed,
210 const char *backing,
Max Reitz9f074292014-11-26 17:20:26 +0100211 char *dest, size_t sz,
212 Error **errp)
Max Reitz0a828552014-11-26 17:20:25 +0100213{
Max Reitz9f074292014-11-26 17:20:26 +0100214 if (backing[0] == '\0' || path_has_protocol(backing) ||
215 path_is_absolute(backing))
216 {
Max Reitz0a828552014-11-26 17:20:25 +0100217 pstrcpy(dest, sz, backing);
Max Reitz9f074292014-11-26 17:20:26 +0100218 } else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
219 error_setg(errp, "Cannot use relative backing file names for '%s'",
220 backed);
Max Reitz0a828552014-11-26 17:20:25 +0100221 } else {
222 path_combine(dest, sz, backed, backing);
223 }
224}
225
Max Reitz9f074292014-11-26 17:20:26 +0100226void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
227 Error **errp)
Paolo Bonzinidc5a1372012-05-08 16:51:50 +0200228{
Max Reitz9f074292014-11-26 17:20:26 +0100229 char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
230
231 bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
232 dest, sz, errp);
Paolo Bonzinidc5a1372012-05-08 16:51:50 +0200233}
234
Stefan Hajnoczi0eb72172015-04-28 14:27:51 +0100235void bdrv_register(BlockDriver *bdrv)
236{
237 bdrv_setup_io_funcs(bdrv);
Christoph Hellwigb2e12bc2009-09-04 19:01:49 +0200238
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100239 QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
bellardea2384d2004-08-01 21:59:26 +0000240}
bellardb3380822004-03-14 21:38:54 +0000241
Markus Armbruster7f06d472014-10-07 13:59:12 +0200242BlockDriverState *bdrv_new_root(void)
bellardfc01f7e2003-06-30 10:03:06 +0000243{
Markus Armbruster7f06d472014-10-07 13:59:12 +0200244 BlockDriverState *bs = bdrv_new();
Markus Armbrustere4e99862014-10-07 13:59:03 +0200245
Markus Armbrustere4e99862014-10-07 13:59:03 +0200246 QTAILQ_INSERT_TAIL(&bdrv_states, bs, device_list);
Markus Armbrustere4e99862014-10-07 13:59:03 +0200247 return bs;
248}
249
250BlockDriverState *bdrv_new(void)
251{
252 BlockDriverState *bs;
253 int i;
254
Markus Armbruster5839e532014-08-19 10:31:08 +0200255 bs = g_new0(BlockDriverState, 1);
Fam Zhenge4654d22013-11-13 18:29:43 +0800256 QLIST_INIT(&bs->dirty_bitmaps);
Fam Zhengfbe40ff2014-05-23 21:29:42 +0800257 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
258 QLIST_INIT(&bs->op_blockers[i]);
259 }
Luiz Capitulino28a72822011-09-26 17:43:50 -0300260 bdrv_iostatus_disable(bs);
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200261 notifier_list_init(&bs->close_notifiers);
Stefan Hajnoczid616b222013-06-24 17:13:10 +0200262 notifier_with_return_list_init(&bs->before_write_notifiers);
Benoît Canetcc0681c2013-09-02 14:14:39 +0200263 qemu_co_queue_init(&bs->throttled_reqs[0]);
264 qemu_co_queue_init(&bs->throttled_reqs[1]);
Fam Zheng9fcb0252013-08-23 09:14:46 +0800265 bs->refcnt = 1;
Stefan Hajnoczidcd04222014-05-08 16:34:37 +0200266 bs->aio_context = qemu_get_aio_context();
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200267
bellardb3380822004-03-14 21:38:54 +0000268 return bs;
269}
270
Paolo Bonzinid7d512f2012-08-23 11:20:36 +0200271void bdrv_add_close_notifier(BlockDriverState *bs, Notifier *notify)
272{
273 notifier_list_add(&bs->close_notifiers, notify);
274}
275
bellardea2384d2004-08-01 21:59:26 +0000276BlockDriver *bdrv_find_format(const char *format_name)
277{
278 BlockDriver *drv1;
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100279 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
280 if (!strcmp(drv1->format_name, format_name)) {
bellardea2384d2004-08-01 21:59:26 +0000281 return drv1;
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100282 }
bellardea2384d2004-08-01 21:59:26 +0000283 }
284 return NULL;
285}
286
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800287static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
Markus Armbrustereb852012009-10-27 18:41:44 +0100288{
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800289 static const char *whitelist_rw[] = {
290 CONFIG_BDRV_RW_WHITELIST
291 };
292 static const char *whitelist_ro[] = {
293 CONFIG_BDRV_RO_WHITELIST
Markus Armbrustereb852012009-10-27 18:41:44 +0100294 };
295 const char **p;
296
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800297 if (!whitelist_rw[0] && !whitelist_ro[0]) {
Markus Armbrustereb852012009-10-27 18:41:44 +0100298 return 1; /* no whitelist, anything goes */
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800299 }
Markus Armbrustereb852012009-10-27 18:41:44 +0100300
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800301 for (p = whitelist_rw; *p; p++) {
Markus Armbrustereb852012009-10-27 18:41:44 +0100302 if (!strcmp(drv->format_name, *p)) {
303 return 1;
304 }
305 }
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800306 if (read_only) {
307 for (p = whitelist_ro; *p; p++) {
308 if (!strcmp(drv->format_name, *p)) {
309 return 1;
310 }
311 }
312 }
Markus Armbrustereb852012009-10-27 18:41:44 +0100313 return 0;
314}
315
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800316typedef struct CreateCo {
317 BlockDriver *drv;
318 char *filename;
Chunyan Liu83d05212014-06-05 17:20:51 +0800319 QemuOpts *opts;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800320 int ret;
Max Reitzcc84d902013-09-06 17:14:26 +0200321 Error *err;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800322} CreateCo;
323
324static void coroutine_fn bdrv_create_co_entry(void *opaque)
325{
Max Reitzcc84d902013-09-06 17:14:26 +0200326 Error *local_err = NULL;
327 int ret;
328
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800329 CreateCo *cco = opaque;
330 assert(cco->drv);
331
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800332 ret = cco->drv->bdrv_create(cco->filename, cco->opts, &local_err);
Markus Armbruster84d18f02014-01-30 15:07:28 +0100333 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200334 error_propagate(&cco->err, local_err);
335 }
336 cco->ret = ret;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800337}
338
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200339int bdrv_create(BlockDriver *drv, const char* filename,
Chunyan Liu83d05212014-06-05 17:20:51 +0800340 QemuOpts *opts, Error **errp)
bellardea2384d2004-08-01 21:59:26 +0000341{
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800342 int ret;
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200343
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800344 Coroutine *co;
345 CreateCo cco = {
346 .drv = drv,
347 .filename = g_strdup(filename),
Chunyan Liu83d05212014-06-05 17:20:51 +0800348 .opts = opts,
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800349 .ret = NOT_DONE,
Max Reitzcc84d902013-09-06 17:14:26 +0200350 .err = NULL,
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800351 };
352
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800353 if (!drv->bdrv_create) {
Max Reitzcc84d902013-09-06 17:14:26 +0200354 error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
Luiz Capitulino80168bf2012-10-17 16:45:25 -0300355 ret = -ENOTSUP;
356 goto out;
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800357 }
358
359 if (qemu_in_coroutine()) {
360 /* Fast-path if already in coroutine context */
361 bdrv_create_co_entry(&cco);
362 } else {
363 co = qemu_coroutine_create(bdrv_create_co_entry);
364 qemu_coroutine_enter(co, &cco);
365 while (cco.ret == NOT_DONE) {
Paolo Bonzinib47ec2c2014-07-07 15:18:01 +0200366 aio_poll(qemu_get_aio_context(), true);
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800367 }
368 }
369
370 ret = cco.ret;
Max Reitzcc84d902013-09-06 17:14:26 +0200371 if (ret < 0) {
Markus Armbruster84d18f02014-01-30 15:07:28 +0100372 if (cco.err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200373 error_propagate(errp, cco.err);
374 } else {
375 error_setg_errno(errp, -ret, "Could not create image");
376 }
377 }
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800378
Luiz Capitulino80168bf2012-10-17 16:45:25 -0300379out:
380 g_free(cco.filename);
Zhi Yong Wu5b7e1542012-05-07 16:50:42 +0800381 return ret;
bellardea2384d2004-08-01 21:59:26 +0000382}
383
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800384int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200385{
386 BlockDriver *drv;
Max Reitzcc84d902013-09-06 17:14:26 +0200387 Error *local_err = NULL;
388 int ret;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200389
Max Reitzb65a5e12015-02-05 13:58:12 -0500390 drv = bdrv_find_protocol(filename, true, errp);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200391 if (drv == NULL) {
Stefan Hajnoczi16905d72010-11-30 15:14:14 +0000392 return -ENOENT;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200393 }
394
Chunyan Liuc282e1f2014-06-05 17:21:11 +0800395 ret = bdrv_create(drv, filename, opts, &local_err);
Markus Armbruster84d18f02014-01-30 15:07:28 +0100396 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +0200397 error_propagate(errp, local_err);
398 }
399 return ret;
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200400}
401
Ekaterina Tumanova892b7de2015-02-16 12:47:54 +0100402/**
403 * Try to get @bs's logical and physical block size.
404 * On success, store them in @bsz struct and return 0.
405 * On failure return -errno.
406 * @bs must not be empty.
407 */
408int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
409{
410 BlockDriver *drv = bs->drv;
411
412 if (drv && drv->bdrv_probe_blocksizes) {
413 return drv->bdrv_probe_blocksizes(bs, bsz);
414 }
415
416 return -ENOTSUP;
417}
418
419/**
420 * Try to get @bs's geometry (cyls, heads, sectors).
421 * On success, store them in @geo struct and return 0.
422 * On failure return -errno.
423 * @bs must not be empty.
424 */
425int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
426{
427 BlockDriver *drv = bs->drv;
428
429 if (drv && drv->bdrv_probe_geometry) {
430 return drv->bdrv_probe_geometry(bs, geo);
431 }
432
433 return -ENOTSUP;
434}
435
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename receives the name of the created file; @size is the size of
 * that buffer in bytes.
 *
 * Return 0 upon success, otherwise a negative errno value.  On POSIX hosts
 * -EOVERFLOW is returned when the generated name does not fit in @size
 * bytes; the directory is taken from $TMPDIR, falling back to "/var/tmp".
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    /* NOTE(review): GetLastError() yields a Win32 error code rather than an
       errno value -- confirm callers only test for a negative result.  */
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    int close_errno;
    const char *tmpdir;

    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }
    if (snprintf(filename, size, "%s/vl.XXXXXX", tmpdir) >= size) {
        return -EOVERFLOW;
    }
    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /* Save errno first: unlink() may overwrite it, and the caller
           must see why close() failed.  */
        close_errno = errno;
        unlink(filename);
        return -close_errno;
    }
    return 0;
#endif
}
bellardea2384d2004-08-01 21:59:26 +0000471
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200472/*
473 * Detect host devices. By convention, /dev/cdrom[N] is always
474 * recognized as a host CDROM.
475 */
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200476static BlockDriver *find_hdev_driver(const char *filename)
477{
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200478 int score_max = 0, score;
479 BlockDriver *drv = NULL, *d;
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200480
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100481 QLIST_FOREACH(d, &bdrv_drivers, list) {
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200482 if (d->bdrv_probe_device) {
483 score = d->bdrv_probe_device(filename);
484 if (score > score_max) {
485 score_max = score;
486 drv = d;
487 }
488 }
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200489 }
490
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200491 return drv;
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200492}
Christoph Hellwigf3a5d3f2009-06-15 13:55:19 +0200493
Kevin Wolf98289622013-07-10 15:47:39 +0200494BlockDriver *bdrv_find_protocol(const char *filename,
Max Reitzb65a5e12015-02-05 13:58:12 -0500495 bool allow_protocol_prefix,
496 Error **errp)
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200497{
498 BlockDriver *drv1;
499 char protocol[128];
500 int len;
501 const char *p;
502
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200503 /* TODO Drivers without bdrv_file_open must be specified explicitly */
504
Christoph Hellwig39508e72010-06-23 12:25:17 +0200505 /*
506 * XXX(hch): we really should not let host device detection
507 * override an explicit protocol specification, but moving this
508 * later breaks access to device names with colons in them.
509 * Thanks to the brain-dead persistent naming schemes on udev-
510 * based Linux systems those actually are quite common.
511 */
512 drv1 = find_hdev_driver(filename);
513 if (drv1) {
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200514 return drv1;
515 }
Christoph Hellwig39508e72010-06-23 12:25:17 +0200516
Kevin Wolf98289622013-07-10 15:47:39 +0200517 if (!path_has_protocol(filename) || !allow_protocol_prefix) {
Max Reitzef810432014-12-02 18:32:42 +0100518 return &bdrv_file;
Christoph Hellwig39508e72010-06-23 12:25:17 +0200519 }
Kevin Wolf98289622013-07-10 15:47:39 +0200520
Stefan Hajnoczi9e0b22f2010-12-09 11:53:00 +0000521 p = strchr(filename, ':');
522 assert(p != NULL);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200523 len = p - filename;
524 if (len > sizeof(protocol) - 1)
525 len = sizeof(protocol) - 1;
526 memcpy(protocol, filename, len);
527 protocol[len] = '\0';
528 QLIST_FOREACH(drv1, &bdrv_drivers, list) {
529 if (drv1->protocol_name &&
530 !strcmp(drv1->protocol_name, protocol)) {
531 return drv1;
532 }
533 }
Max Reitzb65a5e12015-02-05 13:58:12 -0500534
535 error_setg(errp, "Unknown protocol '%s'", protocol);
Christoph Hellwig84a12e62010-04-07 22:30:24 +0200536 return NULL;
537}
538
Markus Armbrusterc6684242014-11-20 16:27:10 +0100539/*
540 * Guess image format by probing its contents.
541 * This is not a good idea when your image is raw (CVE-2008-2004), but
542 * we do it anyway for backward compatibility.
543 *
544 * @buf contains the image's first @buf_size bytes.
Kevin Wolf7cddd372014-11-20 16:27:11 +0100545 * @buf_size is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
546 * but can be smaller if the image file is smaller)
Markus Armbrusterc6684242014-11-20 16:27:10 +0100547 * @filename is its filename.
548 *
549 * For all block drivers, call the bdrv_probe() method to get its
550 * probing score.
551 * Return the first block driver with the highest probing score.
552 */
Kevin Wolf38f3ef52014-11-20 16:27:12 +0100553BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
554 const char *filename)
Markus Armbrusterc6684242014-11-20 16:27:10 +0100555{
556 int score_max = 0, score;
557 BlockDriver *drv = NULL, *d;
558
559 QLIST_FOREACH(d, &bdrv_drivers, list) {
560 if (d->bdrv_probe) {
561 score = d->bdrv_probe(buf, buf_size, filename);
562 if (score > score_max) {
563 score_max = score;
564 drv = d;
565 }
566 }
567 }
568
569 return drv;
570}
571
Kevin Wolff500a6d2012-11-12 17:35:27 +0100572static int find_image_format(BlockDriverState *bs, const char *filename,
Max Reitz34b5d2c2013-09-05 14:45:29 +0200573 BlockDriver **pdrv, Error **errp)
bellardea2384d2004-08-01 21:59:26 +0000574{
Markus Armbrusterc6684242014-11-20 16:27:10 +0100575 BlockDriver *drv;
Kevin Wolf7cddd372014-11-20 16:27:11 +0100576 uint8_t buf[BLOCK_PROBE_BUF_SIZE];
Kevin Wolff500a6d2012-11-12 17:35:27 +0100577 int ret = 0;
Nicholas Bellingerf8ea0b02010-05-17 09:45:57 -0700578
Kevin Wolf08a00552010-06-01 18:37:31 +0200579 /* Return the raw BlockDriver * to scsi-generic devices or empty drives */
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300580 if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
Max Reitzef810432014-12-02 18:32:42 +0100581 *pdrv = &bdrv_raw;
Stefan Weilc98ac352010-07-21 21:51:51 +0200582 return ret;
Nicholas A. Bellinger1a396852010-05-27 08:56:28 -0700583 }
Nicholas Bellingerf8ea0b02010-05-17 09:45:57 -0700584
bellard83f64092006-08-01 16:21:11 +0000585 ret = bdrv_pread(bs, 0, buf, sizeof(buf));
bellard83f64092006-08-01 16:21:11 +0000586 if (ret < 0) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200587 error_setg_errno(errp, -ret, "Could not read image for determining its "
588 "format");
Stefan Weilc98ac352010-07-21 21:51:51 +0200589 *pdrv = NULL;
590 return ret;
bellard83f64092006-08-01 16:21:11 +0000591 }
592
Markus Armbrusterc6684242014-11-20 16:27:10 +0100593 drv = bdrv_probe_all(buf, ret, filename);
Stefan Weilc98ac352010-07-21 21:51:51 +0200594 if (!drv) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200595 error_setg(errp, "Could not determine image format: No compatible "
596 "driver found");
Stefan Weilc98ac352010-07-21 21:51:51 +0200597 ret = -ENOENT;
598 }
599 *pdrv = drv;
600 return ret;
bellardea2384d2004-08-01 21:59:26 +0000601}
602
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100603/**
604 * Set the current 'total_sectors' value
Markus Armbruster65a9bb22014-06-26 13:23:17 +0200605 * Return 0 on success, -errno on error.
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100606 */
607static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
608{
609 BlockDriver *drv = bs->drv;
610
Nicholas Bellinger396759a2010-05-17 09:46:04 -0700611 /* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300612 if (bdrv_is_sg(bs))
Nicholas Bellinger396759a2010-05-17 09:46:04 -0700613 return 0;
614
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100615 /* query actual device if possible, otherwise just trust the hint */
616 if (drv->bdrv_getlength) {
617 int64_t length = drv->bdrv_getlength(bs);
618 if (length < 0) {
619 return length;
620 }
Fam Zheng7e382002013-11-06 19:48:06 +0800621 hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100622 }
623
624 bs->total_sectors = hint;
625 return 0;
626}
627
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100628/**
Paolo Bonzini9e8f1832013-02-08 14:06:11 +0100629 * Set open flags for a given discard mode
630 *
631 * Return 0 on success, -1 if the discard mode was invalid.
632 */
633int bdrv_parse_discard_flags(const char *mode, int *flags)
634{
635 *flags &= ~BDRV_O_UNMAP;
636
637 if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
638 /* do nothing */
639 } else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
640 *flags |= BDRV_O_UNMAP;
641 } else {
642 return -1;
643 }
644
645 return 0;
646}
647
648/**
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100649 * Set open flags for a given cache mode
650 *
651 * Return 0 on success, -1 if the cache mode was invalid.
652 */
653int bdrv_parse_cache_flags(const char *mode, int *flags)
654{
655 *flags &= ~BDRV_O_CACHE_MASK;
656
657 if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
658 *flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
Stefan Hajnoczi92196b22011-08-04 12:26:52 +0100659 } else if (!strcmp(mode, "directsync")) {
660 *flags |= BDRV_O_NOCACHE;
Stefan Hajnoczic3993cd2011-08-04 12:26:51 +0100661 } else if (!strcmp(mode, "writeback")) {
662 *flags |= BDRV_O_CACHE_WB;
663 } else if (!strcmp(mode, "unsafe")) {
664 *flags |= BDRV_O_CACHE_WB;
665 *flags |= BDRV_O_NO_FLUSH;
666 } else if (!strcmp(mode, "writethrough")) {
667 /* this is the default */
668 } else {
669 return -1;
670 }
671
672 return 0;
673}
674
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200675/*
Kevin Wolfb1e6fc02014-05-06 12:11:42 +0200676 * Returns the flags that a temporary snapshot should get, based on the
677 * originally requested flags (the originally requested image will have flags
678 * like a backing file)
679 */
680static int bdrv_temp_snapshot_flags(int flags)
681{
682 return (flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
683}
684
685/*
Kevin Wolff3930ed2015-04-08 13:43:47 +0200686 * Returns the flags that bs->file should get if a protocol driver is expected,
687 * based on the given flags for the parent BDS
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200688 */
689static int bdrv_inherited_flags(int flags)
690{
691 /* Enable protocol handling, disable format probing for bs->file */
692 flags |= BDRV_O_PROTOCOL;
693
694 /* Our block drivers take care to send flushes and respect unmap policy,
695 * so we can enable both unconditionally on lower layers. */
696 flags |= BDRV_O_CACHE_WB | BDRV_O_UNMAP;
697
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200698 /* Clear flags that only apply to the top layer */
Kevin Wolf5669b442014-04-11 21:36:45 +0200699 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
Kevin Wolf0b50cc82014-04-11 21:29:52 +0200700
701 return flags;
702}
703
Kevin Wolff3930ed2015-04-08 13:43:47 +0200704const BdrvChildRole child_file = {
705 .inherit_flags = bdrv_inherited_flags,
706};
707
708/*
709 * Returns the flags that bs->file should get if the use of formats (and not
710 * only protocols) is permitted for it, based on the given flags for the parent
711 * BDS
712 */
713static int bdrv_inherited_fmt_flags(int parent_flags)
714{
715 int flags = child_file.inherit_flags(parent_flags);
716 return flags & ~BDRV_O_PROTOCOL;
717}
718
719const BdrvChildRole child_format = {
720 .inherit_flags = bdrv_inherited_fmt_flags,
721};
722
Kevin Wolf317fc442014-04-25 13:27:34 +0200723/*
724 * Returns the flags that bs->backing_hd should get, based on the given flags
725 * for the parent BDS
726 */
727static int bdrv_backing_flags(int flags)
728{
729 /* backing files always opened read-only */
730 flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
731
732 /* snapshot=on is handled on the top layer */
Kevin Wolf8bfea152014-04-11 19:16:36 +0200733 flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
Kevin Wolf317fc442014-04-25 13:27:34 +0200734
735 return flags;
736}
737
Kevin Wolff3930ed2015-04-08 13:43:47 +0200738static const BdrvChildRole child_backing = {
739 .inherit_flags = bdrv_backing_flags,
740};
741
Kevin Wolf7b272452012-11-12 17:05:39 +0100742static int bdrv_open_flags(BlockDriverState *bs, int flags)
743{
744 int open_flags = flags | BDRV_O_CACHE_WB;
745
746 /*
747 * Clear flags that are internal to the block layer before opening the
748 * image.
749 */
Kevin Wolf20cca272014-06-04 14:33:27 +0200750 open_flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL);
Kevin Wolf7b272452012-11-12 17:05:39 +0100751
752 /*
753 * Snapshots should be writable.
754 */
Kevin Wolf8bfea152014-04-11 19:16:36 +0200755 if (flags & BDRV_O_TEMPORARY) {
Kevin Wolf7b272452012-11-12 17:05:39 +0100756 open_flags |= BDRV_O_RDWR;
757 }
758
759 return open_flags;
760}
761
Kevin Wolf636ea372014-01-24 14:11:52 +0100762static void bdrv_assign_node_name(BlockDriverState *bs,
763 const char *node_name,
764 Error **errp)
Benoît Canet6913c0c2014-01-23 21:31:33 +0100765{
766 if (!node_name) {
Kevin Wolf636ea372014-01-24 14:11:52 +0100767 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100768 }
769
Kevin Wolf9aebf3b2014-09-25 09:54:02 +0200770 /* Check for empty string or invalid characters */
Markus Armbrusterf5bebbb2014-09-30 13:59:30 +0200771 if (!id_wellformed(node_name)) {
Kevin Wolf9aebf3b2014-09-25 09:54:02 +0200772 error_setg(errp, "Invalid node name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100773 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100774 }
775
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100776 /* takes care of avoiding namespaces collisions */
Markus Armbruster7f06d472014-10-07 13:59:12 +0200777 if (blk_by_name(node_name)) {
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100778 error_setg(errp, "node-name=%s is conflicting with a device id",
779 node_name);
Kevin Wolf636ea372014-01-24 14:11:52 +0100780 return;
Benoît Canet0c5e94e2014-02-12 17:15:07 +0100781 }
782
Benoît Canet6913c0c2014-01-23 21:31:33 +0100783 /* takes care of avoiding duplicates node names */
784 if (bdrv_find_node(node_name)) {
785 error_setg(errp, "Duplicate node name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100786 return;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100787 }
788
789 /* copy node name into the bs and insert it into the graph list */
790 pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
791 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
Benoît Canet6913c0c2014-01-23 21:31:33 +0100792}
793
Kevin Wolf18edf282015-04-07 17:12:56 +0200794static QemuOptsList bdrv_runtime_opts = {
795 .name = "bdrv_common",
796 .head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
797 .desc = {
798 {
799 .name = "node-name",
800 .type = QEMU_OPT_STRING,
801 .help = "Node name of the block device node",
802 },
803 { /* end of list */ }
804 },
805};
806
Kevin Wolfb6ce07a2010-04-12 16:37:13 +0200807/*
Kevin Wolf57915332010-04-14 15:24:50 +0200808 * Common part for opening disk images and files
Kevin Wolfb6ad4912013-03-15 10:35:04 +0100809 *
810 * Removes all processed options from *options.
Kevin Wolf57915332010-04-14 15:24:50 +0200811 */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +0200812static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
Max Reitz34b5d2c2013-09-05 14:45:29 +0200813 QDict *options, int flags, BlockDriver *drv, Error **errp)
Kevin Wolf57915332010-04-14 15:24:50 +0200814{
815 int ret, open_flags;
Kevin Wolf035fccd2013-04-09 14:34:19 +0200816 const char *filename;
Benoît Canet6913c0c2014-01-23 21:31:33 +0100817 const char *node_name = NULL;
Kevin Wolf18edf282015-04-07 17:12:56 +0200818 QemuOpts *opts;
Max Reitz34b5d2c2013-09-05 14:45:29 +0200819 Error *local_err = NULL;
Kevin Wolf57915332010-04-14 15:24:50 +0200820
821 assert(drv != NULL);
Paolo Bonzini64058752012-05-08 16:51:49 +0200822 assert(bs->file == NULL);
Kevin Wolf707ff822013-03-06 12:20:31 +0100823 assert(options != NULL && bs->options != options);
Kevin Wolf57915332010-04-14 15:24:50 +0200824
Kevin Wolf45673672013-04-22 17:48:40 +0200825 if (file != NULL) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +0200826 filename = file->bs->filename;
Kevin Wolf45673672013-04-22 17:48:40 +0200827 } else {
828 filename = qdict_get_try_str(options, "filename");
829 }
830
Kevin Wolf765003d2014-02-03 14:49:42 +0100831 if (drv->bdrv_needs_filename && !filename) {
832 error_setg(errp, "The '%s' block driver requires a file name",
833 drv->format_name);
834 return -EINVAL;
835 }
836
Kevin Wolf45673672013-04-22 17:48:40 +0200837 trace_bdrv_open_common(bs, filename ?: "", flags, drv->format_name);
Stefan Hajnoczi28dcee12011-09-22 20:14:12 +0100838
Kevin Wolf18edf282015-04-07 17:12:56 +0200839 opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
840 qemu_opts_absorb_qdict(opts, options, &local_err);
841 if (local_err) {
842 error_propagate(errp, local_err);
843 ret = -EINVAL;
844 goto fail_opts;
845 }
846
847 node_name = qemu_opt_get(opts, "node-name");
Kevin Wolf636ea372014-01-24 14:11:52 +0100848 bdrv_assign_node_name(bs, node_name, &local_err);
Markus Armbruster0fb63952014-04-25 16:50:31 +0200849 if (local_err) {
Kevin Wolf636ea372014-01-24 14:11:52 +0100850 error_propagate(errp, local_err);
Kevin Wolf18edf282015-04-07 17:12:56 +0200851 ret = -EINVAL;
852 goto fail_opts;
Kevin Wolf5d186eb2013-03-27 17:28:18 +0100853 }
854
Paolo Bonzini1b7fd722011-11-29 11:35:47 +0100855 bs->guest_block_size = 512;
Paolo Bonzinic25f53b2011-11-29 12:42:20 +0100856 bs->request_alignment = 512;
Asias He0d51b4d2013-08-22 15:24:14 +0800857 bs->zero_beyond_eof = true;
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800858 open_flags = bdrv_open_flags(bs, flags);
859 bs->read_only = !(open_flags & BDRV_O_RDWR);
860
861 if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
Kevin Wolf8f94a6e2013-10-10 11:45:55 +0200862 error_setg(errp,
863 !bs->read_only && bdrv_is_whitelisted(drv, true)
864 ? "Driver '%s' can only be used for read-only devices"
865 : "Driver '%s' is not whitelisted",
866 drv->format_name);
Kevin Wolf18edf282015-04-07 17:12:56 +0200867 ret = -ENOTSUP;
868 goto fail_opts;
Fam Zhengb64ec4e2013-05-29 19:35:40 +0800869 }
Kevin Wolf57915332010-04-14 15:24:50 +0200870
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000871 assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
Kevin Wolf0ebd24e2013-09-19 15:12:18 +0200872 if (flags & BDRV_O_COPY_ON_READ) {
873 if (!bs->read_only) {
874 bdrv_enable_copy_on_read(bs);
875 } else {
876 error_setg(errp, "Can't use copy-on-read on read-only device");
Kevin Wolf18edf282015-04-07 17:12:56 +0200877 ret = -EINVAL;
878 goto fail_opts;
Kevin Wolf0ebd24e2013-09-19 15:12:18 +0200879 }
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000880 }
881
Kevin Wolfc2ad1b02013-03-18 16:40:51 +0100882 if (filename != NULL) {
883 pstrcpy(bs->filename, sizeof(bs->filename), filename);
884 } else {
885 bs->filename[0] = '\0';
886 }
Max Reitz91af7012014-07-18 20:24:56 +0200887 pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
Kevin Wolf57915332010-04-14 15:24:50 +0200888
Kevin Wolf57915332010-04-14 15:24:50 +0200889 bs->drv = drv;
Anthony Liguori7267c092011-08-20 22:09:37 -0500890 bs->opaque = g_malloc0(drv->instance_size);
Kevin Wolf57915332010-04-14 15:24:50 +0200891
Stefan Hajnoczi03f541b2011-10-27 10:54:28 +0100892 bs->enable_write_cache = !!(flags & BDRV_O_CACHE_WB);
Stefan Hajnoczie7c63792011-10-27 10:54:27 +0100893
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200894 /* Open the image, either directly or using a protocol */
895 if (drv->bdrv_file_open) {
Kevin Wolf5d186eb2013-03-27 17:28:18 +0100896 assert(file == NULL);
Benoît Canet030be322013-09-24 17:07:04 +0200897 assert(!drv->bdrv_needs_filename || filename != NULL);
Max Reitz34b5d2c2013-09-05 14:45:29 +0200898 ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
Kevin Wolff500a6d2012-11-12 17:35:27 +0100899 } else {
Kevin Wolf2af5ef72013-04-09 13:19:18 +0200900 if (file == NULL) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200901 error_setg(errp, "Can't use '%s' as a block driver for the "
902 "protocol level", drv->format_name);
Kevin Wolf2af5ef72013-04-09 13:19:18 +0200903 ret = -EINVAL;
904 goto free_and_fail;
905 }
Kevin Wolff500a6d2012-11-12 17:35:27 +0100906 bs->file = file;
Max Reitz34b5d2c2013-09-05 14:45:29 +0200907 ret = drv->bdrv_open(bs, options, open_flags, &local_err);
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200908 }
909
Kevin Wolf57915332010-04-14 15:24:50 +0200910 if (ret < 0) {
Markus Armbruster84d18f02014-01-30 15:07:28 +0100911 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200912 error_propagate(errp, local_err);
Dunrong Huang2fa9aa52013-09-24 18:14:01 +0800913 } else if (bs->filename[0]) {
914 error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
Max Reitz34b5d2c2013-09-05 14:45:29 +0200915 } else {
916 error_setg_errno(errp, -ret, "Could not open image");
917 }
Kevin Wolf57915332010-04-14 15:24:50 +0200918 goto free_and_fail;
919 }
920
Markus Armbrustera1f688f2015-03-13 21:09:40 +0100921 if (bs->encrypted) {
922 error_report("Encrypted images are deprecated");
923 error_printf("Support for them will be removed in a future release.\n"
924 "You can use 'qemu-img convert' to convert your image"
925 " to an unencrypted one.\n");
926 }
927
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100928 ret = refresh_total_sectors(bs, bs->total_sectors);
929 if (ret < 0) {
Max Reitz34b5d2c2013-09-05 14:45:29 +0200930 error_setg_errno(errp, -ret, "Could not refresh total sector count");
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100931 goto free_and_fail;
Kevin Wolf57915332010-04-14 15:24:50 +0200932 }
Stefan Hajnoczi51762282010-04-19 16:56:41 +0100933
Kevin Wolf3baca892014-07-16 17:48:16 +0200934 bdrv_refresh_limits(bs, &local_err);
935 if (local_err) {
936 error_propagate(errp, local_err);
937 ret = -EINVAL;
938 goto free_and_fail;
939 }
940
Paolo Bonzinic25f53b2011-11-29 12:42:20 +0100941 assert(bdrv_opt_mem_align(bs) != 0);
Denis V. Lunev4196d2f2015-05-12 17:30:55 +0300942 assert(bdrv_min_mem_align(bs) != 0);
Dimitris Aragiorgisb192af82015-06-23 13:44:56 +0300943 assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
Kevin Wolf18edf282015-04-07 17:12:56 +0200944
945 qemu_opts_del(opts);
Kevin Wolf57915332010-04-14 15:24:50 +0200946 return 0;
947
948free_and_fail:
Kevin Wolff500a6d2012-11-12 17:35:27 +0100949 bs->file = NULL;
Anthony Liguori7267c092011-08-20 22:09:37 -0500950 g_free(bs->opaque);
Kevin Wolf57915332010-04-14 15:24:50 +0200951 bs->opaque = NULL;
952 bs->drv = NULL;
Kevin Wolf18edf282015-04-07 17:12:56 +0200953fail_opts:
954 qemu_opts_del(opts);
Kevin Wolf57915332010-04-14 15:24:50 +0200955 return ret;
956}
957
Kevin Wolf5e5c4f62014-05-26 11:45:08 +0200958static QDict *parse_json_filename(const char *filename, Error **errp)
959{
960 QObject *options_obj;
961 QDict *options;
962 int ret;
963
964 ret = strstart(filename, "json:", &filename);
965 assert(ret);
966
967 options_obj = qobject_from_json(filename);
968 if (!options_obj) {
969 error_setg(errp, "Could not parse the JSON options");
970 return NULL;
971 }
972
973 if (qobject_type(options_obj) != QTYPE_QDICT) {
974 qobject_decref(options_obj);
975 error_setg(errp, "Invalid JSON object given");
976 return NULL;
977 }
978
979 options = qobject_to_qdict(options_obj);
980 qdict_flatten(options);
981
982 return options;
983}
984
Kevin Wolf57915332010-04-14 15:24:50 +0200985/*
Kevin Wolff54120f2014-05-26 11:09:59 +0200986 * Fills in default options for opening images and converts the legacy
987 * filename/flags pair to option QDict entries.
Max Reitz53a29512015-03-19 14:53:16 -0400988 * The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
989 * block driver has been specified explicitly.
Kevin Wolff54120f2014-05-26 11:09:59 +0200990 */
Max Reitz53a29512015-03-19 14:53:16 -0400991static int bdrv_fill_options(QDict **options, const char **pfilename,
Max Reitz053e1572015-08-26 19:47:51 +0200992 int *flags, Error **errp)
Kevin Wolff54120f2014-05-26 11:09:59 +0200993{
Kevin Wolf5e5c4f62014-05-26 11:45:08 +0200994 const char *filename = *pfilename;
Kevin Wolff54120f2014-05-26 11:09:59 +0200995 const char *drvname;
Max Reitz53a29512015-03-19 14:53:16 -0400996 bool protocol = *flags & BDRV_O_PROTOCOL;
Kevin Wolff54120f2014-05-26 11:09:59 +0200997 bool parse_filename = false;
Max Reitz053e1572015-08-26 19:47:51 +0200998 BlockDriver *drv = NULL;
Kevin Wolff54120f2014-05-26 11:09:59 +0200999 Error *local_err = NULL;
Kevin Wolff54120f2014-05-26 11:09:59 +02001000
Kevin Wolf5e5c4f62014-05-26 11:45:08 +02001001 /* Parse json: pseudo-protocol */
1002 if (filename && g_str_has_prefix(filename, "json:")) {
1003 QDict *json_options = parse_json_filename(filename, &local_err);
1004 if (local_err) {
1005 error_propagate(errp, local_err);
1006 return -EINVAL;
1007 }
1008
1009 /* Options given in the filename have lower priority than options
1010 * specified directly */
1011 qdict_join(*options, json_options, false);
1012 QDECREF(json_options);
1013 *pfilename = filename = NULL;
1014 }
1015
Max Reitz53a29512015-03-19 14:53:16 -04001016 drvname = qdict_get_try_str(*options, "driver");
Max Reitz053e1572015-08-26 19:47:51 +02001017 if (drvname) {
1018 drv = bdrv_find_format(drvname);
1019 if (!drv) {
1020 error_setg(errp, "Unknown driver '%s'", drvname);
1021 return -ENOENT;
1022 }
1023 /* If the user has explicitly specified the driver, this choice should
1024 * override the BDRV_O_PROTOCOL flag */
1025 protocol = drv->bdrv_file_open;
Max Reitz53a29512015-03-19 14:53:16 -04001026 }
1027
1028 if (protocol) {
1029 *flags |= BDRV_O_PROTOCOL;
1030 } else {
1031 *flags &= ~BDRV_O_PROTOCOL;
1032 }
1033
Kevin Wolff54120f2014-05-26 11:09:59 +02001034 /* Fetch the file name from the options QDict if necessary */
Kevin Wolf17b005f2014-05-27 10:50:29 +02001035 if (protocol && filename) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001036 if (!qdict_haskey(*options, "filename")) {
1037 qdict_put(*options, "filename", qstring_from_str(filename));
1038 parse_filename = true;
1039 } else {
1040 error_setg(errp, "Can't specify 'file' and 'filename' options at "
1041 "the same time");
1042 return -EINVAL;
1043 }
1044 }
1045
1046 /* Find the right block driver */
1047 filename = qdict_get_try_str(*options, "filename");
Kevin Wolff54120f2014-05-26 11:09:59 +02001048
Max Reitz053e1572015-08-26 19:47:51 +02001049 if (!drvname && protocol) {
1050 if (filename) {
1051 drv = bdrv_find_protocol(filename, parse_filename, errp);
1052 if (!drv) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001053 return -EINVAL;
1054 }
Max Reitz053e1572015-08-26 19:47:51 +02001055
1056 drvname = drv->format_name;
1057 qdict_put(*options, "driver", qstring_from_str(drvname));
1058 } else {
1059 error_setg(errp, "Must specify either driver or file");
1060 return -EINVAL;
Kevin Wolff54120f2014-05-26 11:09:59 +02001061 }
1062 }
1063
Kevin Wolf17b005f2014-05-27 10:50:29 +02001064 assert(drv || !protocol);
Kevin Wolff54120f2014-05-26 11:09:59 +02001065
1066 /* Driver-specific filename parsing */
Kevin Wolf17b005f2014-05-27 10:50:29 +02001067 if (drv && drv->bdrv_parse_filename && parse_filename) {
Kevin Wolff54120f2014-05-26 11:09:59 +02001068 drv->bdrv_parse_filename(filename, *options, &local_err);
1069 if (local_err) {
1070 error_propagate(errp, local_err);
1071 return -EINVAL;
1072 }
1073
1074 if (!drv->bdrv_needs_filename) {
1075 qdict_del(*options, "filename");
1076 }
1077 }
1078
1079 return 0;
1080}
1081
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001082static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
1083 BlockDriverState *child_bs,
1084 const BdrvChildRole *child_role)
Kevin Wolfdf581792015-06-15 11:53:47 +02001085{
1086 BdrvChild *child = g_new(BdrvChild, 1);
1087 *child = (BdrvChild) {
1088 .bs = child_bs,
1089 .role = child_role,
1090 };
1091
1092 QLIST_INSERT_HEAD(&parent_bs->children, child, next);
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001093
1094 return child;
Kevin Wolfdf581792015-06-15 11:53:47 +02001095}
1096
Kevin Wolf33a60402015-06-15 13:51:04 +02001097static void bdrv_detach_child(BdrvChild *child)
1098{
1099 QLIST_REMOVE(child, next);
1100 g_free(child);
1101}
1102
1103void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
1104{
1105 BlockDriverState *child_bs = child->bs;
1106
1107 if (child->bs->inherits_from == parent) {
1108 child->bs->inherits_from = NULL;
1109 }
1110
1111 bdrv_detach_child(child);
1112 bdrv_unref(child_bs);
1113}
1114
Fam Zheng8d24cce2014-05-23 21:29:45 +08001115void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
1116{
1117
Fam Zheng826b6ca2014-05-23 21:29:47 +08001118 if (bs->backing_hd) {
1119 assert(bs->backing_blocker);
1120 bdrv_op_unblock_all(bs->backing_hd, bs->backing_blocker);
Kevin Wolf80a1e132015-06-17 15:52:09 +02001121 bdrv_detach_child(bs->backing_child);
Fam Zheng826b6ca2014-05-23 21:29:47 +08001122 } else if (backing_hd) {
1123 error_setg(&bs->backing_blocker,
Alberto Garcia81e5f782015-04-08 12:29:19 +03001124 "node is used as backing hd of '%s'",
1125 bdrv_get_device_or_node_name(bs));
Fam Zheng826b6ca2014-05-23 21:29:47 +08001126 }
1127
Fam Zheng8d24cce2014-05-23 21:29:45 +08001128 bs->backing_hd = backing_hd;
1129 if (!backing_hd) {
Fam Zheng826b6ca2014-05-23 21:29:47 +08001130 error_free(bs->backing_blocker);
1131 bs->backing_blocker = NULL;
Kevin Wolf80a1e132015-06-17 15:52:09 +02001132 bs->backing_child = NULL;
Fam Zheng8d24cce2014-05-23 21:29:45 +08001133 goto out;
1134 }
Kevin Wolf80a1e132015-06-17 15:52:09 +02001135 bs->backing_child = bdrv_attach_child(bs, backing_hd, &child_backing);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001136 bs->open_flags &= ~BDRV_O_NO_BACKING;
1137 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
1138 pstrcpy(bs->backing_format, sizeof(bs->backing_format),
1139 backing_hd->drv ? backing_hd->drv->format_name : "");
Fam Zheng826b6ca2014-05-23 21:29:47 +08001140
1141 bdrv_op_block_all(bs->backing_hd, bs->backing_blocker);
1142 /* Otherwise we won't be able to commit due to check in bdrv_commit */
Fam Zhengbb000212014-09-11 13:14:00 +08001143 bdrv_op_unblock(bs->backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
Fam Zheng826b6ca2014-05-23 21:29:47 +08001144 bs->backing_blocker);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001145out:
Kevin Wolf3baca892014-07-16 17:48:16 +02001146 bdrv_refresh_limits(bs, NULL);
Fam Zheng8d24cce2014-05-23 21:29:45 +08001147}
1148
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001149/*
1150 * Opens the backing file for a BlockDriverState if not yet open
1151 *
1152 * options is a QDict of options to pass to the block drivers, or NULL for an
1153 * empty set of options. The reference to the QDict is transferred to this
1154 * function (even on failure), so if the caller intends to reuse the dictionary,
1155 * it needs to use QINCREF() before calling bdrv_file_open.
1156 */
Max Reitz34b5d2c2013-09-05 14:45:29 +02001157int bdrv_open_backing_file(BlockDriverState *bs, QDict *options, Error **errp)
Paolo Bonzini9156df12012-10-18 16:49:17 +02001158{
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001159 char *backing_filename = g_malloc0(PATH_MAX);
Kevin Wolf317fc442014-04-25 13:27:34 +02001160 int ret = 0;
Fam Zheng8d24cce2014-05-23 21:29:45 +08001161 BlockDriverState *backing_hd;
Max Reitz34b5d2c2013-09-05 14:45:29 +02001162 Error *local_err = NULL;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001163
1164 if (bs->backing_hd != NULL) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001165 QDECREF(options);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001166 goto free_exit;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001167 }
1168
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001169 /* NULL means an empty set of options */
1170 if (options == NULL) {
1171 options = qdict_new();
1172 }
1173
Paolo Bonzini9156df12012-10-18 16:49:17 +02001174 bs->open_flags &= ~BDRV_O_NO_BACKING;
Kevin Wolf1cb6f502013-04-12 20:27:07 +02001175 if (qdict_haskey(options, "file.filename")) {
1176 backing_filename[0] = '\0';
1177 } else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001178 QDECREF(options);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001179 goto free_exit;
Fam Zhengdbecebd2013-09-22 20:05:06 +08001180 } else {
Max Reitz9f074292014-11-26 17:20:26 +01001181 bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
1182 &local_err);
1183 if (local_err) {
1184 ret = -EINVAL;
1185 error_propagate(errp, local_err);
1186 QDECREF(options);
1187 goto free_exit;
1188 }
Paolo Bonzini9156df12012-10-18 16:49:17 +02001189 }
1190
Kevin Wolf8ee79e72014-06-04 15:09:35 +02001191 if (!bs->drv || !bs->drv->supports_backing) {
1192 ret = -EINVAL;
1193 error_setg(errp, "Driver doesn't support backing files");
1194 QDECREF(options);
1195 goto free_exit;
1196 }
1197
Markus Armbrustere4e99862014-10-07 13:59:03 +02001198 backing_hd = bdrv_new();
Fam Zheng8d24cce2014-05-23 21:29:45 +08001199
Kevin Wolfc5f6e492014-11-25 18:12:42 +01001200 if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
1201 qdict_put(options, "driver", qstring_from_str(bs->backing_format));
Paolo Bonzini9156df12012-10-18 16:49:17 +02001202 }
1203
Max Reitzf67503e2014-02-18 18:33:05 +01001204 assert(bs->backing_hd == NULL);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001205 ret = bdrv_open_inherit(&backing_hd,
1206 *backing_filename ? backing_filename : NULL,
Max Reitzce343772015-08-26 19:47:50 +02001207 NULL, options, 0, bs, &child_backing, &local_err);
Paolo Bonzini9156df12012-10-18 16:49:17 +02001208 if (ret < 0) {
Fam Zheng8d24cce2014-05-23 21:29:45 +08001209 bdrv_unref(backing_hd);
1210 backing_hd = NULL;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001211 bs->open_flags |= BDRV_O_NO_BACKING;
Fam Zhengb04b6b62013-11-08 11:26:49 +08001212 error_setg(errp, "Could not open backing file: %s",
1213 error_get_pretty(local_err));
1214 error_free(local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001215 goto free_exit;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001216 }
Kevin Wolfdf581792015-06-15 11:53:47 +02001217
Fam Zheng8d24cce2014-05-23 21:29:45 +08001218 bdrv_set_backing_hd(bs, backing_hd);
Peter Feinerd80ac652014-01-08 19:43:25 +00001219
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001220free_exit:
1221 g_free(backing_filename);
1222 return ret;
Paolo Bonzini9156df12012-10-18 16:49:17 +02001223}
1224
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001225/*
Max Reitzda557aa2013-12-20 19:28:11 +01001226 * Opens a disk image whose options are given as BlockdevRef in another block
1227 * device's options.
1228 *
Max Reitzda557aa2013-12-20 19:28:11 +01001229 * If allow_none is true, no image will be opened if filename is false and no
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001230 * BlockdevRef is given. NULL will be returned, but errp remains unset.
Max Reitzda557aa2013-12-20 19:28:11 +01001231 *
1232 * bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
1233 * That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
1234 * itself, all options starting with "${bdref_key}." are considered part of the
1235 * BlockdevRef.
1236 *
1237 * The BlockdevRef will be removed from the options QDict.
1238 */
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001239BdrvChild *bdrv_open_child(const char *filename,
1240 QDict *options, const char *bdref_key,
1241 BlockDriverState* parent,
1242 const BdrvChildRole *child_role,
1243 bool allow_none, Error **errp)
Max Reitzda557aa2013-12-20 19:28:11 +01001244{
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001245 BdrvChild *c = NULL;
1246 BlockDriverState *bs;
Max Reitzda557aa2013-12-20 19:28:11 +01001247 QDict *image_options;
1248 int ret;
1249 char *bdref_key_dot;
1250 const char *reference;
1251
Kevin Wolfdf581792015-06-15 11:53:47 +02001252 assert(child_role != NULL);
Max Reitzf67503e2014-02-18 18:33:05 +01001253
Max Reitzda557aa2013-12-20 19:28:11 +01001254 bdref_key_dot = g_strdup_printf("%s.", bdref_key);
1255 qdict_extract_subqdict(options, &image_options, bdref_key_dot);
1256 g_free(bdref_key_dot);
1257
1258 reference = qdict_get_try_str(options, bdref_key);
1259 if (!filename && !reference && !qdict_size(image_options)) {
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001260 if (!allow_none) {
Max Reitzda557aa2013-12-20 19:28:11 +01001261 error_setg(errp, "A block device must be specified for \"%s\"",
1262 bdref_key);
Max Reitzda557aa2013-12-20 19:28:11 +01001263 }
Markus Armbrusterb20e61e2014-05-28 11:16:57 +02001264 QDECREF(image_options);
Max Reitzda557aa2013-12-20 19:28:11 +01001265 goto done;
1266 }
1267
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001268 bs = NULL;
1269 ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
Max Reitzce343772015-08-26 19:47:50 +02001270 parent, child_role, errp);
Kevin Wolfdf581792015-06-15 11:53:47 +02001271 if (ret < 0) {
1272 goto done;
1273 }
1274
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001275 c = bdrv_attach_child(parent, bs, child_role);
Max Reitzda557aa2013-12-20 19:28:11 +01001276
1277done:
1278 qdict_del(options, bdref_key);
Kevin Wolfb4b059f2015-06-15 13:24:19 +02001279 return c;
1280}
1281
1282/*
1283 * This is a version of bdrv_open_child() that returns 0/-EINVAL instead of
1284 * a BdrvChild object.
1285 *
1286 * If allow_none is true, no image will be opened if filename is false and no
1287 * BlockdevRef is given. *pbs will remain unchanged and 0 will be returned.
1288 *
1289 * To conform with the behavior of bdrv_open(), *pbs has to be NULL.
1290 */
1291int bdrv_open_image(BlockDriverState **pbs, const char *filename,
1292 QDict *options, const char *bdref_key,
1293 BlockDriverState* parent, const BdrvChildRole *child_role,
1294 bool allow_none, Error **errp)
1295{
1296 Error *local_err = NULL;
1297 BdrvChild *c;
1298
1299 assert(pbs);
1300 assert(*pbs == NULL);
1301
1302 c = bdrv_open_child(filename, options, bdref_key, parent, child_role,
1303 allow_none, &local_err);
1304 if (local_err) {
1305 error_propagate(errp, local_err);
1306 return -EINVAL;
1307 }
1308
1309 if (c != NULL) {
1310 *pbs = c->bs;
1311 }
1312
1313 return 0;
Max Reitzda557aa2013-12-20 19:28:11 +01001314}
1315
Chen Gang6b8aeca2014-06-23 23:28:23 +08001316int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags, Error **errp)
Kevin Wolfb9988752014-04-03 12:09:34 +02001317{
1318 /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001319 char *tmp_filename = g_malloc0(PATH_MAX + 1);
Kevin Wolfb9988752014-04-03 12:09:34 +02001320 int64_t total_size;
Chunyan Liu83d05212014-06-05 17:20:51 +08001321 QemuOpts *opts = NULL;
Kevin Wolfb9988752014-04-03 12:09:34 +02001322 QDict *snapshot_options;
1323 BlockDriverState *bs_snapshot;
Fam Zhengc2e0dbb2015-07-06 12:24:44 +08001324 Error *local_err = NULL;
Kevin Wolfb9988752014-04-03 12:09:34 +02001325 int ret;
1326
1327 /* if snapshot, we create a temporary backing file and open it
1328 instead of opening 'filename' directly */
1329
1330 /* Get the required size from the image */
Kevin Wolff1877432014-04-04 17:07:19 +02001331 total_size = bdrv_getlength(bs);
1332 if (total_size < 0) {
Chen Gang6b8aeca2014-06-23 23:28:23 +08001333 ret = total_size;
Kevin Wolff1877432014-04-04 17:07:19 +02001334 error_setg_errno(errp, -total_size, "Could not get image size");
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001335 goto out;
Kevin Wolff1877432014-04-04 17:07:19 +02001336 }
Kevin Wolfb9988752014-04-03 12:09:34 +02001337
1338 /* Create the temporary image */
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001339 ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
Kevin Wolfb9988752014-04-03 12:09:34 +02001340 if (ret < 0) {
1341 error_setg_errno(errp, -ret, "Could not get temporary filename");
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001342 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001343 }
1344
Max Reitzef810432014-12-02 18:32:42 +01001345 opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
Chunyan Liuc282e1f2014-06-05 17:21:11 +08001346 &error_abort);
Markus Armbruster39101f22015-02-12 16:46:36 +01001347 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
Max Reitzef810432014-12-02 18:32:42 +01001348 ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, &local_err);
Chunyan Liu83d05212014-06-05 17:20:51 +08001349 qemu_opts_del(opts);
Kevin Wolfb9988752014-04-03 12:09:34 +02001350 if (ret < 0) {
1351 error_setg_errno(errp, -ret, "Could not create temporary overlay "
1352 "'%s': %s", tmp_filename,
1353 error_get_pretty(local_err));
1354 error_free(local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001355 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001356 }
1357
1358 /* Prepare a new options QDict for the temporary file */
1359 snapshot_options = qdict_new();
1360 qdict_put(snapshot_options, "file.driver",
1361 qstring_from_str("file"));
1362 qdict_put(snapshot_options, "file.filename",
1363 qstring_from_str(tmp_filename));
Max Reitze6641712015-08-26 19:47:48 +02001364 qdict_put(snapshot_options, "driver",
1365 qstring_from_str("qcow2"));
Kevin Wolfb9988752014-04-03 12:09:34 +02001366
Markus Armbrustere4e99862014-10-07 13:59:03 +02001367 bs_snapshot = bdrv_new();
Kevin Wolfb9988752014-04-03 12:09:34 +02001368
1369 ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02001370 flags, &local_err);
Kevin Wolfb9988752014-04-03 12:09:34 +02001371 if (ret < 0) {
1372 error_propagate(errp, local_err);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001373 goto out;
Kevin Wolfb9988752014-04-03 12:09:34 +02001374 }
1375
1376 bdrv_append(bs_snapshot, bs);
Benoît Canet1ba4b6a2014-04-22 17:05:27 +02001377
1378out:
1379 g_free(tmp_filename);
Chen Gang6b8aeca2014-06-23 23:28:23 +08001380 return ret;
Kevin Wolfb9988752014-04-03 12:09:34 +02001381}
1382
Max Reitzda557aa2013-12-20 19:28:11 +01001383/*
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001384 * Opens a disk image (raw, qcow2, vmdk, ...)
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001385 *
1386 * options is a QDict of options to pass to the block drivers, or NULL for an
1387 * empty set of options. The reference to the QDict belongs to the block layer
1388 * after the call (even on failure), so if the caller intends to reuse the
1389 * dictionary, it needs to use QINCREF() before calling bdrv_open.
Max Reitzf67503e2014-02-18 18:33:05 +01001390 *
1391 * If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
1392 * If it is not NULL, the referenced BDS will be reused.
Max Reitzddf56362014-02-18 18:33:06 +01001393 *
1394 * The reference parameter may be used to specify an existing block device which
1395 * should be opened. If specified, neither options nor a filename may be given,
1396 * nor can an existing BDS be reused (that is, *pbs has to be NULL).
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001397 */
Kevin Wolff3930ed2015-04-08 13:43:47 +02001398static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
1399 const char *reference, QDict *options, int flags,
1400 BlockDriverState *parent,
Max Reitzce343772015-08-26 19:47:50 +02001401 const BdrvChildRole *child_role, Error **errp)
bellardea2384d2004-08-01 21:59:26 +00001402{
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001403 int ret;
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001404 BdrvChild *file = NULL;
1405 BlockDriverState *bs;
Max Reitzce343772015-08-26 19:47:50 +02001406 BlockDriver *drv = NULL;
Kevin Wolf74fe54f2013-07-09 11:09:02 +02001407 const char *drvname;
Max Reitz34b5d2c2013-09-05 14:45:29 +02001408 Error *local_err = NULL;
Kevin Wolfb1e6fc02014-05-06 12:11:42 +02001409 int snapshot_flags = 0;
bellard712e7872005-04-28 21:09:32 +00001410
Max Reitzf67503e2014-02-18 18:33:05 +01001411 assert(pbs);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001412 assert(!child_role || !flags);
1413 assert(!child_role == !parent);
Max Reitzf67503e2014-02-18 18:33:05 +01001414
Max Reitzddf56362014-02-18 18:33:06 +01001415 if (reference) {
1416 bool options_non_empty = options ? qdict_size(options) : false;
1417 QDECREF(options);
1418
1419 if (*pbs) {
1420 error_setg(errp, "Cannot reuse an existing BDS when referencing "
1421 "another block device");
1422 return -EINVAL;
1423 }
1424
1425 if (filename || options_non_empty) {
1426 error_setg(errp, "Cannot reference an existing block device with "
1427 "additional options or a new filename");
1428 return -EINVAL;
1429 }
1430
1431 bs = bdrv_lookup_bs(reference, reference, errp);
1432 if (!bs) {
1433 return -ENODEV;
1434 }
1435 bdrv_ref(bs);
1436 *pbs = bs;
1437 return 0;
1438 }
1439
Max Reitzf67503e2014-02-18 18:33:05 +01001440 if (*pbs) {
1441 bs = *pbs;
1442 } else {
Markus Armbrustere4e99862014-10-07 13:59:03 +02001443 bs = bdrv_new();
Max Reitzf67503e2014-02-18 18:33:05 +01001444 }
1445
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001446 /* NULL means an empty set of options */
1447 if (options == NULL) {
1448 options = qdict_new();
1449 }
1450
Kevin Wolff3930ed2015-04-08 13:43:47 +02001451 if (child_role) {
Kevin Wolfbddcec32015-04-09 18:47:50 +02001452 bs->inherits_from = parent;
Kevin Wolff3930ed2015-04-08 13:43:47 +02001453 flags = child_role->inherit_flags(parent->open_flags);
1454 }
1455
Max Reitz053e1572015-08-26 19:47:51 +02001456 ret = bdrv_fill_options(&options, &filename, &flags, &local_err);
Kevin Wolf462f5bc2014-05-26 11:39:55 +02001457 if (local_err) {
1458 goto fail;
1459 }
1460
Kevin Wolf76c591b2014-06-04 14:19:44 +02001461 /* Find the right image format driver */
Kevin Wolf76c591b2014-06-04 14:19:44 +02001462 drvname = qdict_get_try_str(options, "driver");
1463 if (drvname) {
1464 drv = bdrv_find_format(drvname);
1465 qdict_del(options, "driver");
1466 if (!drv) {
1467 error_setg(errp, "Unknown driver: '%s'", drvname);
1468 ret = -EINVAL;
1469 goto fail;
1470 }
1471 }
1472
1473 assert(drvname || !(flags & BDRV_O_PROTOCOL));
Kevin Wolf76c591b2014-06-04 14:19:44 +02001474
Kevin Wolff3930ed2015-04-08 13:43:47 +02001475 bs->open_flags = flags;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001476 bs->options = options;
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001477 options = qdict_clone_shallow(options);
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001478
Kevin Wolff4788ad2014-06-03 16:44:19 +02001479 /* Open image file without format layer */
1480 if ((flags & BDRV_O_PROTOCOL) == 0) {
1481 if (flags & BDRV_O_RDWR) {
1482 flags |= BDRV_O_ALLOW_RDWR;
1483 }
1484 if (flags & BDRV_O_SNAPSHOT) {
1485 snapshot_flags = bdrv_temp_snapshot_flags(flags);
1486 flags = bdrv_backing_flags(flags);
1487 }
1488
Kevin Wolff3930ed2015-04-08 13:43:47 +02001489 bs->open_flags = flags;
Kevin Wolf1fdd6932015-06-15 14:11:51 +02001490
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001491 file = bdrv_open_child(filename, options, "file", bs,
1492 &child_file, true, &local_err);
Kevin Wolf1fdd6932015-06-15 14:11:51 +02001493 if (local_err) {
1494 ret = -EINVAL;
Max Reitz5469a2a2014-02-18 18:33:10 +01001495 goto fail;
1496 }
1497 }
1498
Kevin Wolf76c591b2014-06-04 14:19:44 +02001499 /* Image format probing */
Kevin Wolf38f3ef52014-11-20 16:27:12 +01001500 bs->probed = !drv;
Kevin Wolf76c591b2014-06-04 14:19:44 +02001501 if (!drv && file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001502 ret = find_image_format(file->bs, filename, &drv, &local_err);
Kevin Wolf17b005f2014-05-27 10:50:29 +02001503 if (ret < 0) {
Kevin Wolf8bfea152014-04-11 19:16:36 +02001504 goto fail;
Max Reitz2a05cbe2013-12-20 19:28:10 +01001505 }
Kevin Wolf76c591b2014-06-04 14:19:44 +02001506 } else if (!drv) {
Kevin Wolf17b005f2014-05-27 10:50:29 +02001507 error_setg(errp, "Must specify either driver or file");
1508 ret = -EINVAL;
Kevin Wolf8bfea152014-04-11 19:16:36 +02001509 goto fail;
Kevin Wolff500a6d2012-11-12 17:35:27 +01001510 }
1511
Max Reitz53a29512015-03-19 14:53:16 -04001512 /* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
1513 assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
1514 /* file must be NULL if a protocol BDS is about to be created
1515 * (the inverse results in an error message from bdrv_open_common()) */
1516 assert(!(flags & BDRV_O_PROTOCOL) || !file);
1517
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001518 /* Open the image */
Max Reitz34b5d2c2013-09-05 14:45:29 +02001519 ret = bdrv_open_common(bs, file, options, flags, drv, &local_err);
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001520 if (ret < 0) {
Kevin Wolf8bfea152014-04-11 19:16:36 +02001521 goto fail;
Christoph Hellwig69873072010-01-20 18:13:25 +01001522 }
1523
Max Reitz2a05cbe2013-12-20 19:28:10 +01001524 if (file && (bs->file != file)) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001525 bdrv_unref_child(bs, file);
Kevin Wolff500a6d2012-11-12 17:35:27 +01001526 file = NULL;
1527 }
1528
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001529 /* If there is a backing file, use it */
Paolo Bonzini9156df12012-10-18 16:49:17 +02001530 if ((flags & BDRV_O_NO_BACKING) == 0) {
Kevin Wolf31ca6d02013-03-28 15:29:24 +01001531 QDict *backing_options;
1532
Benoît Canet5726d872013-09-25 13:30:01 +02001533 qdict_extract_subqdict(options, &backing_options, "backing.");
Max Reitz34b5d2c2013-09-05 14:45:29 +02001534 ret = bdrv_open_backing_file(bs, backing_options, &local_err);
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001535 if (ret < 0) {
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001536 goto close_and_fail;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001537 }
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001538 }
1539
Max Reitz91af7012014-07-18 20:24:56 +02001540 bdrv_refresh_filename(bs);
1541
Kevin Wolfb9988752014-04-03 12:09:34 +02001542 /* For snapshot=on, create a temporary qcow2 overlay. bs points to the
1543 * temporary snapshot afterwards. */
Kevin Wolfb1e6fc02014-05-06 12:11:42 +02001544 if (snapshot_flags) {
Chen Gang6b8aeca2014-06-23 23:28:23 +08001545 ret = bdrv_append_temp_snapshot(bs, snapshot_flags, &local_err);
Kevin Wolfb9988752014-04-03 12:09:34 +02001546 if (local_err) {
Kevin Wolfb9988752014-04-03 12:09:34 +02001547 goto close_and_fail;
1548 }
1549 }
1550
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001551 /* Check if any unknown options were used */
Max Reitz5acd9d82014-02-18 18:33:11 +01001552 if (options && (qdict_size(options) != 0)) {
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001553 const QDictEntry *entry = qdict_first(options);
Max Reitz5acd9d82014-02-18 18:33:11 +01001554 if (flags & BDRV_O_PROTOCOL) {
1555 error_setg(errp, "Block protocol '%s' doesn't support the option "
1556 "'%s'", drv->format_name, entry->key);
1557 } else {
1558 error_setg(errp, "Block format '%s' used by device '%s' doesn't "
1559 "support the option '%s'", drv->format_name,
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02001560 bdrv_get_device_name(bs), entry->key);
Max Reitz5acd9d82014-02-18 18:33:11 +01001561 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001562
1563 ret = -EINVAL;
1564 goto close_and_fail;
1565 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001566
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001567 if (!bdrv_key_required(bs)) {
Markus Armbrustera7f53e22014-10-07 13:59:25 +02001568 if (bs->blk) {
1569 blk_dev_change_media_cb(bs->blk, true);
1570 }
Markus Armbrusterc3adb582014-03-14 09:22:48 +01001571 } else if (!runstate_check(RUN_STATE_PRELAUNCH)
1572 && !runstate_check(RUN_STATE_INMIGRATE)
1573 && !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
1574 error_setg(errp,
1575 "Guest must be stopped for opening of encrypted image");
1576 ret = -EBUSY;
1577 goto close_and_fail;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001578 }
1579
Markus Armbrusterc3adb582014-03-14 09:22:48 +01001580 QDECREF(options);
Max Reitzf67503e2014-02-18 18:33:05 +01001581 *pbs = bs;
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001582 return 0;
1583
Kevin Wolf8bfea152014-04-11 19:16:36 +02001584fail:
Kevin Wolff500a6d2012-11-12 17:35:27 +01001585 if (file != NULL) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001586 bdrv_unref_child(bs, file);
Kevin Wolff500a6d2012-11-12 17:35:27 +01001587 }
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001588 QDECREF(bs->options);
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001589 QDECREF(options);
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001590 bs->options = NULL;
Max Reitzf67503e2014-02-18 18:33:05 +01001591 if (!*pbs) {
1592 /* If *pbs is NULL, a new BDS has been created in this function and
1593 needs to be freed now. Otherwise, it does not need to be closed,
1594 since it has not really been opened yet. */
1595 bdrv_unref(bs);
1596 }
Markus Armbruster84d18f02014-01-30 15:07:28 +01001597 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +02001598 error_propagate(errp, local_err);
1599 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001600 return ret;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001601
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001602close_and_fail:
Max Reitzf67503e2014-02-18 18:33:05 +01001603 /* See fail path, but now the BDS has to be always closed */
1604 if (*pbs) {
1605 bdrv_close(bs);
1606 } else {
1607 bdrv_unref(bs);
1608 }
Kevin Wolfb6ad4912013-03-15 10:35:04 +01001609 QDECREF(options);
Markus Armbruster84d18f02014-01-30 15:07:28 +01001610 if (local_err) {
Max Reitz34b5d2c2013-09-05 14:45:29 +02001611 error_propagate(errp, local_err);
1612 }
Kevin Wolfb6ce07a2010-04-12 16:37:13 +02001613 return ret;
1614}
1615
Kevin Wolff3930ed2015-04-08 13:43:47 +02001616int bdrv_open(BlockDriverState **pbs, const char *filename,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02001617 const char *reference, QDict *options, int flags, Error **errp)
Kevin Wolff3930ed2015-04-08 13:43:47 +02001618{
1619 return bdrv_open_inherit(pbs, filename, reference, options, flags, NULL,
Max Reitzce343772015-08-26 19:47:50 +02001620 NULL, errp);
Kevin Wolff3930ed2015-04-08 13:43:47 +02001621}
1622
Jeff Codye971aa12012-09-20 15:13:19 -04001623typedef struct BlockReopenQueueEntry {
1624 bool prepared;
1625 BDRVReopenState state;
1626 QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
1627} BlockReopenQueueEntry;
1628
1629/*
1630 * Adds a BlockDriverState to a simple queue for an atomic, transactional
1631 * reopen of multiple devices.
1632 *
1633 * bs_queue can either be an existing BlockReopenQueue that has had QSIMPLE_INIT
1634 * already performed, or alternatively may be NULL a new BlockReopenQueue will
1635 * be created and initialized. This newly created BlockReopenQueue should be
1636 * passed back in for subsequent calls that are intended to be of the same
1637 * atomic 'set'.
1638 *
1639 * bs is the BlockDriverState to add to the reopen queue.
1640 *
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001641 * options contains the changed options for the associated bs
1642 * (the BlockReopenQueue takes ownership)
1643 *
Jeff Codye971aa12012-09-20 15:13:19 -04001644 * flags contains the open flags for the associated bs
1645 *
1646 * returns a pointer to bs_queue, which is either the newly allocated
1647 * bs_queue, or the existing bs_queue being used.
1648 *
1649 */
1650BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001651 BlockDriverState *bs,
1652 QDict *options, int flags)
Jeff Codye971aa12012-09-20 15:13:19 -04001653{
1654 assert(bs != NULL);
1655
1656 BlockReopenQueueEntry *bs_entry;
Kevin Wolf67251a32015-04-09 18:54:04 +02001657 BdrvChild *child;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001658 QDict *old_options;
Kevin Wolf67251a32015-04-09 18:54:04 +02001659
Jeff Codye971aa12012-09-20 15:13:19 -04001660 if (bs_queue == NULL) {
1661 bs_queue = g_new0(BlockReopenQueue, 1);
1662 QSIMPLEQ_INIT(bs_queue);
1663 }
1664
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001665 if (!options) {
1666 options = qdict_new();
1667 }
1668
1669 old_options = qdict_clone_shallow(bs->options);
1670 qdict_join(options, old_options, false);
1671 QDECREF(old_options);
1672
Kevin Wolff1f25a22014-04-25 19:04:55 +02001673 /* bdrv_open() masks this flag out */
1674 flags &= ~BDRV_O_PROTOCOL;
1675
Kevin Wolf67251a32015-04-09 18:54:04 +02001676 QLIST_FOREACH(child, &bs->children, next) {
1677 int child_flags;
1678
1679 if (child->bs->inherits_from != bs) {
1680 continue;
1681 }
1682
1683 child_flags = child->role->inherit_flags(flags);
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001684 /* TODO Pass down child flags (backing.*, extents.*, ...) */
1685 bdrv_reopen_queue(bs_queue, child->bs, NULL, child_flags);
Jeff Codye971aa12012-09-20 15:13:19 -04001686 }
1687
1688 bs_entry = g_new0(BlockReopenQueueEntry, 1);
1689 QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
1690
1691 bs_entry->state.bs = bs;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001692 bs_entry->state.options = options;
Jeff Codye971aa12012-09-20 15:13:19 -04001693 bs_entry->state.flags = flags;
1694
1695 return bs_queue;
1696}
1697
1698/*
1699 * Reopen multiple BlockDriverStates atomically & transactionally.
1700 *
1701 * The queue passed in (bs_queue) must have been built up previous
1702 * via bdrv_reopen_queue().
1703 *
1704 * Reopens all BDS specified in the queue, with the appropriate
1705 * flags. All devices are prepared for reopen, and failure of any
1706 * device will cause all device changes to be abandonded, and intermediate
1707 * data cleaned up.
1708 *
1709 * If all devices prepare successfully, then the changes are committed
1710 * to all devices.
1711 *
1712 */
1713int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
1714{
1715 int ret = -1;
1716 BlockReopenQueueEntry *bs_entry, *next;
1717 Error *local_err = NULL;
1718
1719 assert(bs_queue != NULL);
1720
1721 bdrv_drain_all();
1722
1723 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1724 if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
1725 error_propagate(errp, local_err);
1726 goto cleanup;
1727 }
1728 bs_entry->prepared = true;
1729 }
1730
1731 /* If we reach this point, we have success and just need to apply the
1732 * changes
1733 */
1734 QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
1735 bdrv_reopen_commit(&bs_entry->state);
1736 }
1737
1738 ret = 0;
1739
1740cleanup:
1741 QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
1742 if (ret && bs_entry->prepared) {
1743 bdrv_reopen_abort(&bs_entry->state);
1744 }
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001745 QDECREF(bs_entry->state.options);
Jeff Codye971aa12012-09-20 15:13:19 -04001746 g_free(bs_entry);
1747 }
1748 g_free(bs_queue);
1749 return ret;
1750}
1751
1752
1753/* Reopen a single BlockDriverState with the specified flags. */
1754int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
1755{
1756 int ret = -1;
1757 Error *local_err = NULL;
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001758 BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
Jeff Codye971aa12012-09-20 15:13:19 -04001759
1760 ret = bdrv_reopen_multiple(queue, &local_err);
1761 if (local_err != NULL) {
1762 error_propagate(errp, local_err);
1763 }
1764 return ret;
1765}
1766
1767
1768/*
1769 * Prepares a BlockDriverState for reopen. All changes are staged in the
1770 * 'opaque' field of the BDRVReopenState, which is used and allocated by
1771 * the block driver layer .bdrv_reopen_prepare()
1772 *
1773 * bs is the BlockDriverState to reopen
1774 * flags are the new open flags
1775 * queue is the reopen queue
1776 *
1777 * Returns 0 on success, non-zero on error. On error errp will be set
1778 * as well.
1779 *
1780 * On failure, bdrv_reopen_abort() will be called to clean up any data.
1781 * It is the responsibility of the caller to then call the abort() or
1782 * commit() for any other BDS that have been left in a prepare() state
1783 *
1784 */
1785int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
1786 Error **errp)
1787{
1788 int ret = -1;
1789 Error *local_err = NULL;
1790 BlockDriver *drv;
1791
1792 assert(reopen_state != NULL);
1793 assert(reopen_state->bs->drv != NULL);
1794 drv = reopen_state->bs->drv;
1795
1796 /* if we are to stay read-only, do not allow permission change
1797 * to r/w */
1798 if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
1799 reopen_state->flags & BDRV_O_RDWR) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03001800 error_setg(errp, "Node '%s' is read only",
1801 bdrv_get_device_or_node_name(reopen_state->bs));
Jeff Codye971aa12012-09-20 15:13:19 -04001802 goto error;
1803 }
1804
1805
1806 ret = bdrv_flush(reopen_state->bs);
1807 if (ret) {
1808 error_set(errp, ERROR_CLASS_GENERIC_ERROR, "Error (%s) flushing drive",
1809 strerror(-ret));
1810 goto error;
1811 }
1812
1813 if (drv->bdrv_reopen_prepare) {
1814 ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
1815 if (ret) {
1816 if (local_err != NULL) {
1817 error_propagate(errp, local_err);
1818 } else {
Luiz Capitulinod8b68952013-06-10 11:29:27 -04001819 error_setg(errp, "failed while preparing to reopen image '%s'",
1820 reopen_state->bs->filename);
Jeff Codye971aa12012-09-20 15:13:19 -04001821 }
1822 goto error;
1823 }
1824 } else {
1825 /* It is currently mandatory to have a bdrv_reopen_prepare()
1826 * handler for each supported drv. */
Alberto Garcia81e5f782015-04-08 12:29:19 +03001827 error_setg(errp, "Block format '%s' used by node '%s' "
1828 "does not support reopening files", drv->format_name,
1829 bdrv_get_device_or_node_name(reopen_state->bs));
Jeff Codye971aa12012-09-20 15:13:19 -04001830 ret = -1;
1831 goto error;
1832 }
1833
Kevin Wolf4d2cb092015-04-10 17:50:50 +02001834 /* Options that are not handled are only okay if they are unchanged
1835 * compared to the old state. It is expected that some options are only
1836 * used for the initial open, but not reopen (e.g. filename) */
1837 if (qdict_size(reopen_state->options)) {
1838 const QDictEntry *entry = qdict_first(reopen_state->options);
1839
1840 do {
1841 QString *new_obj = qobject_to_qstring(entry->value);
1842 const char *new = qstring_get_str(new_obj);
1843 const char *old = qdict_get_try_str(reopen_state->bs->options,
1844 entry->key);
1845
1846 if (!old || strcmp(new, old)) {
1847 error_setg(errp, "Cannot change the option '%s'", entry->key);
1848 ret = -EINVAL;
1849 goto error;
1850 }
1851 } while ((entry = qdict_next(reopen_state->options, entry)));
1852 }
1853
Jeff Codye971aa12012-09-20 15:13:19 -04001854 ret = 0;
1855
1856error:
1857 return ret;
1858}
1859
1860/*
1861 * Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
1862 * makes them final by swapping the staging BlockDriverState contents into
1863 * the active BlockDriverState contents.
1864 */
1865void bdrv_reopen_commit(BDRVReopenState *reopen_state)
1866{
1867 BlockDriver *drv;
1868
1869 assert(reopen_state != NULL);
1870 drv = reopen_state->bs->drv;
1871 assert(drv != NULL);
1872
1873 /* If there are any driver level actions to take */
1874 if (drv->bdrv_reopen_commit) {
1875 drv->bdrv_reopen_commit(reopen_state);
1876 }
1877
1878 /* set BDS specific flags now */
1879 reopen_state->bs->open_flags = reopen_state->flags;
1880 reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
1881 BDRV_O_CACHE_WB);
1882 reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
Kevin Wolf355ef4a2013-12-11 20:14:09 +01001883
Kevin Wolf3baca892014-07-16 17:48:16 +02001884 bdrv_refresh_limits(reopen_state->bs, NULL);
Jeff Codye971aa12012-09-20 15:13:19 -04001885}
1886
1887/*
1888 * Abort the reopen, and delete and free the staged changes in
1889 * reopen_state
1890 */
1891void bdrv_reopen_abort(BDRVReopenState *reopen_state)
1892{
1893 BlockDriver *drv;
1894
1895 assert(reopen_state != NULL);
1896 drv = reopen_state->bs->drv;
1897 assert(drv != NULL);
1898
1899 if (drv->bdrv_reopen_abort) {
1900 drv->bdrv_reopen_abort(reopen_state);
1901 }
1902}
1903
1904
bellardfc01f7e2003-06-30 10:03:06 +00001905void bdrv_close(BlockDriverState *bs)
1906{
Max Reitz33384422014-06-20 21:57:33 +02001907 BdrvAioNotifier *ban, *ban_next;
1908
Paolo Bonzini3cbc0022012-10-19 11:36:48 +02001909 if (bs->job) {
1910 block_job_cancel_sync(bs->job);
1911 }
Alberto Garcia99b7e772015-09-25 16:41:44 +03001912
1913 /* Disable I/O limits and drain all pending throttled requests */
1914 if (bs->io_limits_enabled) {
1915 bdrv_io_limits_disable(bs);
1916 }
1917
Fam Zheng53ec73e2015-05-29 18:53:14 +08001918 bdrv_drain(bs); /* complete I/O */
Stefan Hajnoczi58fda172013-07-02 15:36:25 +02001919 bdrv_flush(bs);
Fam Zheng53ec73e2015-05-29 18:53:14 +08001920 bdrv_drain(bs); /* in case flush left pending I/O */
Paolo Bonzinid7d512f2012-08-23 11:20:36 +02001921 notifier_list_notify(&bs->close_notifiers, bs);
Kevin Wolf7094f122012-04-11 11:06:37 +02001922
Paolo Bonzini3cbc0022012-10-19 11:36:48 +02001923 if (bs->drv) {
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001924 BdrvChild *child, *next;
1925
Kevin Wolf9a7dedb2015-06-16 10:58:20 +02001926 bs->drv->bdrv_close(bs);
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001927 bs->drv = NULL;
Kevin Wolf9a7dedb2015-06-16 10:58:20 +02001928
1929 if (bs->backing_hd) {
1930 BlockDriverState *backing_hd = bs->backing_hd;
1931 bdrv_set_backing_hd(bs, NULL);
1932 bdrv_unref(backing_hd);
1933 }
1934
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02001935 if (bs->file != NULL) {
1936 bdrv_unref_child(bs, bs->file);
1937 bs->file = NULL;
1938 }
1939
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001940 QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
Kevin Wolf33a60402015-06-15 13:51:04 +02001941 /* TODO Remove bdrv_unref() from drivers' close function and use
1942 * bdrv_unref_child() here */
Kevin Wolfbddcec32015-04-09 18:47:50 +02001943 if (child->bs->inherits_from == bs) {
1944 child->bs->inherits_from = NULL;
1945 }
Kevin Wolf33a60402015-06-15 13:51:04 +02001946 bdrv_detach_child(child);
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02001947 }
1948
Anthony Liguori7267c092011-08-20 22:09:37 -05001949 g_free(bs->opaque);
bellardea2384d2004-08-01 21:59:26 +00001950 bs->opaque = NULL;
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +00001951 bs->copy_on_read = 0;
Paolo Bonzinia275fa42012-05-08 16:51:43 +02001952 bs->backing_file[0] = '\0';
1953 bs->backing_format[0] = '\0';
Paolo Bonzini64058752012-05-08 16:51:49 +02001954 bs->total_sectors = 0;
1955 bs->encrypted = 0;
1956 bs->valid_key = 0;
1957 bs->sg = 0;
Asias He0d51b4d2013-08-22 15:24:14 +08001958 bs->zero_beyond_eof = false;
Kevin Wolfde9c0ce2013-03-15 10:35:02 +01001959 QDECREF(bs->options);
1960 bs->options = NULL;
Max Reitz91af7012014-07-18 20:24:56 +02001961 QDECREF(bs->full_open_options);
1962 bs->full_open_options = NULL;
bellardb3380822004-03-14 21:38:54 +00001963 }
Zhi Yong Wu98f90db2011-11-08 13:00:14 +08001964
Markus Armbrustera7f53e22014-10-07 13:59:25 +02001965 if (bs->blk) {
1966 blk_dev_change_media_cb(bs->blk, false);
1967 }
Pavel Hrdina9ca11152012-08-09 12:44:48 +02001968
Max Reitz33384422014-06-20 21:57:33 +02001969 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
1970 g_free(ban);
1971 }
1972 QLIST_INIT(&bs->aio_notifiers);
bellardb3380822004-03-14 21:38:54 +00001973}
1974
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001975void bdrv_close_all(void)
1976{
1977 BlockDriverState *bs;
1978
Benoît Canetdc364f42014-01-23 21:31:32 +01001979 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02001980 AioContext *aio_context = bdrv_get_aio_context(bs);
1981
1982 aio_context_acquire(aio_context);
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001983 bdrv_close(bs);
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02001984 aio_context_release(aio_context);
MORITA Kazutaka2bc93fe2010-05-28 11:44:57 +09001985 }
1986}
1987
Benoît Canetdc364f42014-01-23 21:31:32 +01001988/* make a BlockDriverState anonymous by removing from bdrv_state and
1989 * graph_bdrv_state list.
Ryan Harperd22b2f42011-03-29 20:51:47 -05001990 Also, NULL terminate the device_name to prevent double remove */
1991void bdrv_make_anon(BlockDriverState *bs)
1992{
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02001993 /*
1994 * Take care to remove bs from bdrv_states only when it's actually
1995 * in it. Note that bs->device_list.tqe_prev is initially null,
1996 * and gets set to non-null by QTAILQ_INSERT_TAIL(). Establish
1997 * the useful invariant "bs in bdrv_states iff bs->tqe_prev" by
1998 * resetting it to null on remove.
1999 */
2000 if (bs->device_list.tqe_prev) {
Benoît Canetdc364f42014-01-23 21:31:32 +01002001 QTAILQ_REMOVE(&bdrv_states, bs, device_list);
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002002 bs->device_list.tqe_prev = NULL;
Ryan Harperd22b2f42011-03-29 20:51:47 -05002003 }
Benoît Canetdc364f42014-01-23 21:31:32 +01002004 if (bs->node_name[0] != '\0') {
2005 QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
2006 }
2007 bs->node_name[0] = '\0';
Ryan Harperd22b2f42011-03-29 20:51:47 -05002008}
2009
Paolo Bonzinie023b2e2012-05-08 16:51:41 +02002010static void bdrv_rebind(BlockDriverState *bs)
2011{
2012 if (bs->drv && bs->drv->bdrv_rebind) {
2013 bs->drv->bdrv_rebind(bs);
2014 }
2015}
2016
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002017static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
2018 BlockDriverState *bs_src)
2019{
2020 /* move some fields that need to stay attached to the device */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002021
2022 /* dev info */
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01002023 bs_dest->guest_block_size = bs_src->guest_block_size;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002024 bs_dest->copy_on_read = bs_src->copy_on_read;
2025
2026 bs_dest->enable_write_cache = bs_src->enable_write_cache;
2027
Benoît Canetcc0681c2013-09-02 14:14:39 +02002028 /* i/o throttled req */
Alberto Garcia76f4afb2015-06-08 18:17:44 +02002029 bs_dest->throttle_state = bs_src->throttle_state,
2030 bs_dest->io_limits_enabled = bs_src->io_limits_enabled;
2031 bs_dest->pending_reqs[0] = bs_src->pending_reqs[0];
2032 bs_dest->pending_reqs[1] = bs_src->pending_reqs[1];
2033 bs_dest->throttled_reqs[0] = bs_src->throttled_reqs[0];
2034 bs_dest->throttled_reqs[1] = bs_src->throttled_reqs[1];
2035 memcpy(&bs_dest->round_robin,
2036 &bs_src->round_robin,
2037 sizeof(bs_dest->round_robin));
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002038 memcpy(&bs_dest->throttle_timers,
2039 &bs_src->throttle_timers,
2040 sizeof(ThrottleTimers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002041
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002042 /* r/w error */
2043 bs_dest->on_read_error = bs_src->on_read_error;
2044 bs_dest->on_write_error = bs_src->on_write_error;
2045
2046 /* i/o status */
2047 bs_dest->iostatus_enabled = bs_src->iostatus_enabled;
2048 bs_dest->iostatus = bs_src->iostatus;
2049
2050 /* dirty bitmap */
Fam Zhenge4654d22013-11-13 18:29:43 +08002051 bs_dest->dirty_bitmaps = bs_src->dirty_bitmaps;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002052
Fam Zheng9fcb0252013-08-23 09:14:46 +08002053 /* reference count */
2054 bs_dest->refcnt = bs_src->refcnt;
2055
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002056 /* job */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002057 bs_dest->job = bs_src->job;
2058
2059 /* keep the same entry in bdrv_states */
Benoît Canetdc364f42014-01-23 21:31:32 +01002060 bs_dest->device_list = bs_src->device_list;
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002061 bs_dest->blk = bs_src->blk;
2062
Fam Zhengfbe40ff2014-05-23 21:29:42 +08002063 memcpy(bs_dest->op_blockers, bs_src->op_blockers,
2064 sizeof(bs_dest->op_blockers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002065}
2066
2067/*
2068 * Swap bs contents for two image chains while they are live,
2069 * while keeping required fields on the BlockDriverState that is
2070 * actually attached to a device.
2071 *
2072 * This will modify the BlockDriverState fields, and swap contents
2073 * between bs_new and bs_old. Both bs_new and bs_old are modified.
2074 *
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002075 * bs_new must not be attached to a BlockBackend.
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002076 *
2077 * This function does not create any image files.
2078 */
2079void bdrv_swap(BlockDriverState *bs_new, BlockDriverState *bs_old)
2080{
2081 BlockDriverState tmp;
Kevin Wolfbddcec32015-04-09 18:47:50 +02002082 BdrvChild *child;
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002083
Kevin Wolf6ee4ce12015-06-10 13:33:17 +02002084 bdrv_drain(bs_new);
2085 bdrv_drain(bs_old);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002086
Benoît Canet90ce8a02014-03-05 23:48:29 +01002087 /* The code needs to swap the node_name but simply swapping node_list won't
2088 * work so first remove the nodes from the graph list, do the swap then
2089 * insert them back if needed.
2090 */
2091 if (bs_new->node_name[0] != '\0') {
2092 QTAILQ_REMOVE(&graph_bdrv_states, bs_new, node_list);
2093 }
2094 if (bs_old->node_name[0] != '\0') {
2095 QTAILQ_REMOVE(&graph_bdrv_states, bs_old, node_list);
2096 }
2097
Alberto Garciadb628332015-06-08 18:17:45 +02002098 /* If the BlockDriverState is part of a throttling group acquire
2099 * its lock since we're going to mess with the protected fields.
2100 * Otherwise there's no need to worry since no one else can touch
2101 * them. */
2102 if (bs_old->throttle_state) {
2103 throttle_group_lock(bs_old);
2104 }
2105
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002106 /* bs_new must be unattached and shouldn't have anything fancy enabled */
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002107 assert(!bs_new->blk);
Fam Zhenge4654d22013-11-13 18:29:43 +08002108 assert(QLIST_EMPTY(&bs_new->dirty_bitmaps));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002109 assert(bs_new->job == NULL);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002110 assert(bs_new->io_limits_enabled == false);
Alberto Garciadb628332015-06-08 18:17:45 +02002111 assert(bs_new->throttle_state == NULL);
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002112 assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002113
2114 tmp = *bs_new;
2115 *bs_new = *bs_old;
2116 *bs_old = tmp;
2117
2118 /* there are some fields that should not be swapped, move them back */
2119 bdrv_move_feature_fields(&tmp, bs_old);
2120 bdrv_move_feature_fields(bs_old, bs_new);
2121 bdrv_move_feature_fields(bs_new, &tmp);
2122
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002123 /* bs_new must remain unattached */
Markus Armbruster7e7d56d2014-10-07 13:59:05 +02002124 assert(!bs_new->blk);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002125
2126 /* Check a few fields that should remain attached to the device */
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002127 assert(bs_new->job == NULL);
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002128 assert(bs_new->io_limits_enabled == false);
Alberto Garciadb628332015-06-08 18:17:45 +02002129 assert(bs_new->throttle_state == NULL);
Benoît Canet0e5b0a22015-06-08 18:17:41 +02002130 assert(!throttle_timers_are_initialized(&bs_new->throttle_timers));
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002131
Alberto Garciadb628332015-06-08 18:17:45 +02002132 /* Release the ThrottleGroup lock */
2133 if (bs_old->throttle_state) {
2134 throttle_group_unlock(bs_old);
2135 }
2136
Benoît Canet90ce8a02014-03-05 23:48:29 +01002137 /* insert the nodes back into the graph node list if needed */
2138 if (bs_new->node_name[0] != '\0') {
2139 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_new, node_list);
2140 }
2141 if (bs_old->node_name[0] != '\0') {
2142 QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs_old, node_list);
2143 }
2144
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02002145 /*
2146 * Update lh_first.le_prev for non-empty lists.
2147 *
2148 * The head of the op blocker list doesn't change because it is moved back
2149 * in bdrv_move_feature_fields().
2150 */
Kevin Wolf6ee4ce12015-06-10 13:33:17 +02002151 assert(QLIST_EMPTY(&bs_old->tracked_requests));
2152 assert(QLIST_EMPTY(&bs_new->tracked_requests));
2153
Kevin Wolf6e93e7c2015-04-08 13:49:41 +02002154 QLIST_FIX_HEAD_PTR(&bs_new->children, next);
2155 QLIST_FIX_HEAD_PTR(&bs_old->children, next);
2156
Kevin Wolfbddcec32015-04-09 18:47:50 +02002157 /* Update references in bs->opaque and children */
2158 QLIST_FOREACH(child, &bs_old->children, next) {
2159 if (child->bs->inherits_from == bs_new) {
2160 child->bs->inherits_from = bs_old;
2161 }
2162 }
2163 QLIST_FOREACH(child, &bs_new->children, next) {
2164 if (child->bs->inherits_from == bs_old) {
2165 child->bs->inherits_from = bs_new;
2166 }
2167 }
2168
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002169 bdrv_rebind(bs_new);
2170 bdrv_rebind(bs_old);
2171}
2172
Jeff Cody8802d1f2012-02-28 15:54:06 -05002173/*
2174 * Add new bs contents at the top of an image chain while the chain is
2175 * live, while keeping required fields on the top layer.
2176 *
2177 * This will modify the BlockDriverState fields, and swap contents
2178 * between bs_new and bs_top. Both bs_new and bs_top are modified.
2179 *
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002180 * bs_new must not be attached to a BlockBackend.
Jeff Codyf6801b82012-03-27 16:30:19 -04002181 *
Jeff Cody8802d1f2012-02-28 15:54:06 -05002182 * This function does not create any image files.
2183 */
2184void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
2185{
Paolo Bonzini4ddc07c2012-06-14 16:55:02 +02002186 bdrv_swap(bs_new, bs_top);
Jeff Cody8802d1f2012-02-28 15:54:06 -05002187
2188 /* The contents of 'tmp' will become bs_top, as we are
2189 * swapping bs_new and bs_top contents. */
Fam Zheng8d24cce2014-05-23 21:29:45 +08002190 bdrv_set_backing_hd(bs_top, bs_new);
Jeff Cody8802d1f2012-02-28 15:54:06 -05002191}
2192
Fam Zheng4f6fd342013-08-23 09:14:47 +08002193static void bdrv_delete(BlockDriverState *bs)
bellardb3380822004-03-14 21:38:54 +00002194{
Paolo Bonzini3e914652012-03-30 13:17:11 +02002195 assert(!bs->job);
Fam Zheng3718d8a2014-05-23 21:29:43 +08002196 assert(bdrv_op_blocker_is_empty(bs));
Fam Zheng4f6fd342013-08-23 09:14:47 +08002197 assert(!bs->refcnt);
Fam Zhenge4654d22013-11-13 18:29:43 +08002198 assert(QLIST_EMPTY(&bs->dirty_bitmaps));
Markus Armbruster18846de2010-06-29 16:58:30 +02002199
Stefan Hajnoczie1b5c522013-06-27 15:32:26 +02002200 bdrv_close(bs);
2201
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +01002202 /* remove from list, if necessary */
Ryan Harperd22b2f42011-03-29 20:51:47 -05002203 bdrv_make_anon(bs);
aurel3234c6f052008-04-08 19:51:21 +00002204
Anthony Liguori7267c092011-08-20 22:09:37 -05002205 g_free(bs);
bellardfc01f7e2003-06-30 10:03:06 +00002206}
2207
aliguorie97fc192009-04-21 23:11:50 +00002208/*
2209 * Run consistency checks on an image
2210 *
Kevin Wolfe076f332010-06-29 11:43:13 +02002211 * Returns 0 if the check could be completed (it doesn't mean that the image is
Stefan Weila1c72732011-04-28 17:20:38 +02002212 * free of errors) or -errno when an internal error occurred. The results of the
Kevin Wolfe076f332010-06-29 11:43:13 +02002213 * check are stored in res.
aliguorie97fc192009-04-21 23:11:50 +00002214 */
Kevin Wolf4534ff52012-05-11 16:07:02 +02002215int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
aliguorie97fc192009-04-21 23:11:50 +00002216{
Max Reitz908bcd52014-08-07 22:47:55 +02002217 if (bs->drv == NULL) {
2218 return -ENOMEDIUM;
2219 }
aliguorie97fc192009-04-21 23:11:50 +00002220 if (bs->drv->bdrv_check == NULL) {
2221 return -ENOTSUP;
2222 }
2223
Kevin Wolfe076f332010-06-29 11:43:13 +02002224 memset(res, 0, sizeof(*res));
Kevin Wolf4534ff52012-05-11 16:07:02 +02002225 return bs->drv->bdrv_check(bs, res, fix);
aliguorie97fc192009-04-21 23:11:50 +00002226}
2227
Kevin Wolf8a426612010-07-16 17:17:01 +02002228#define COMMIT_BUF_SECTORS 2048
2229
bellard33e39632003-07-06 17:15:21 +00002230/* commit COW file into the raw image */
2231int bdrv_commit(BlockDriverState *bs)
2232{
bellard19cb3732006-08-19 11:45:59 +00002233 BlockDriver *drv = bs->drv;
Jeff Cody72706ea2014-01-24 09:02:35 -05002234 int64_t sector, total_sectors, length, backing_length;
Kevin Wolf8a426612010-07-16 17:17:01 +02002235 int n, ro, open_flags;
Jeff Cody0bce5972012-09-20 15:13:34 -04002236 int ret = 0;
Jeff Cody72706ea2014-01-24 09:02:35 -05002237 uint8_t *buf = NULL;
bellard33e39632003-07-06 17:15:21 +00002238
bellard19cb3732006-08-19 11:45:59 +00002239 if (!drv)
2240 return -ENOMEDIUM;
Liu Yuan6bb45152014-09-01 13:35:21 +08002241
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002242 if (!bs->backing_hd) {
2243 return -ENOTSUP;
bellard33e39632003-07-06 17:15:21 +00002244 }
2245
Fam Zhengbb000212014-09-11 13:14:00 +08002246 if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
2247 bdrv_op_is_blocked(bs->backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
Stefan Hajnoczi2d3735d2012-01-18 14:40:41 +00002248 return -EBUSY;
2249 }
2250
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002251 ro = bs->backing_hd->read_only;
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002252 open_flags = bs->backing_hd->open_flags;
2253
2254 if (ro) {
Jeff Cody0bce5972012-09-20 15:13:34 -04002255 if (bdrv_reopen(bs->backing_hd, open_flags | BDRV_O_RDWR, NULL)) {
2256 return -EACCES;
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002257 }
bellard33e39632003-07-06 17:15:21 +00002258 }
bellardea2384d2004-08-01 21:59:26 +00002259
Jeff Cody72706ea2014-01-24 09:02:35 -05002260 length = bdrv_getlength(bs);
2261 if (length < 0) {
2262 ret = length;
2263 goto ro_cleanup;
2264 }
2265
2266 backing_length = bdrv_getlength(bs->backing_hd);
2267 if (backing_length < 0) {
2268 ret = backing_length;
2269 goto ro_cleanup;
2270 }
2271
2272 /* If our top snapshot is larger than the backing file image,
2273 * grow the backing file image if possible. If not possible,
2274 * we must return an error */
2275 if (length > backing_length) {
2276 ret = bdrv_truncate(bs->backing_hd, length);
2277 if (ret < 0) {
2278 goto ro_cleanup;
2279 }
2280 }
2281
2282 total_sectors = length >> BDRV_SECTOR_BITS;
Kevin Wolf857d4f42014-05-20 13:16:51 +02002283
2284 /* qemu_try_blockalign() for bs will choose an alignment that works for
2285 * bs->backing_hd as well, so no need to compare the alignment manually. */
2286 buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
2287 if (buf == NULL) {
2288 ret = -ENOMEM;
2289 goto ro_cleanup;
2290 }
bellardea2384d2004-08-01 21:59:26 +00002291
Kevin Wolf8a426612010-07-16 17:17:01 +02002292 for (sector = 0; sector < total_sectors; sector += n) {
Paolo Bonzinid6636402013-09-04 19:00:25 +02002293 ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
2294 if (ret < 0) {
2295 goto ro_cleanup;
2296 }
2297 if (ret) {
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002298 ret = bdrv_read(bs, sector, buf, n);
2299 if (ret < 0) {
Kevin Wolf8a426612010-07-16 17:17:01 +02002300 goto ro_cleanup;
2301 }
2302
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002303 ret = bdrv_write(bs->backing_hd, sector, buf, n);
2304 if (ret < 0) {
Kevin Wolf8a426612010-07-16 17:17:01 +02002305 goto ro_cleanup;
2306 }
bellardea2384d2004-08-01 21:59:26 +00002307 }
2308 }
bellard95389c82005-12-18 18:28:15 +00002309
Christoph Hellwig1d449522010-01-17 12:32:30 +01002310 if (drv->bdrv_make_empty) {
2311 ret = drv->bdrv_make_empty(bs);
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002312 if (ret < 0) {
2313 goto ro_cleanup;
2314 }
Christoph Hellwig1d449522010-01-17 12:32:30 +01002315 bdrv_flush(bs);
2316 }
bellard95389c82005-12-18 18:28:15 +00002317
Christoph Hellwig3f5075a2010-01-12 13:49:23 +01002318 /*
2319 * Make sure all data we wrote to the backing device is actually
2320 * stable on disk.
2321 */
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002322 if (bs->backing_hd) {
Christoph Hellwig3f5075a2010-01-12 13:49:23 +01002323 bdrv_flush(bs->backing_hd);
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002324 }
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002325
Kevin Wolfdabfa6c2014-01-24 14:00:43 +01002326 ret = 0;
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002327ro_cleanup:
Kevin Wolf857d4f42014-05-20 13:16:51 +02002328 qemu_vfree(buf);
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002329
2330 if (ro) {
Jeff Cody0bce5972012-09-20 15:13:34 -04002331 /* ignoring error return here */
2332 bdrv_reopen(bs->backing_hd, open_flags & ~BDRV_O_RDWR, NULL);
Naphtali Sprei4dca4b62010-02-14 13:39:18 +02002333 }
2334
Christoph Hellwig1d449522010-01-17 12:32:30 +01002335 return ret;
bellard33e39632003-07-06 17:15:21 +00002336}
2337
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002338int bdrv_commit_all(void)
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002339{
2340 BlockDriverState *bs;
2341
Benoît Canetdc364f42014-01-23 21:31:32 +01002342 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002343 AioContext *aio_context = bdrv_get_aio_context(bs);
2344
2345 aio_context_acquire(aio_context);
Jeff Cody272d2d82013-02-26 09:55:48 -05002346 if (bs->drv && bs->backing_hd) {
2347 int ret = bdrv_commit(bs);
2348 if (ret < 0) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002349 aio_context_release(aio_context);
Jeff Cody272d2d82013-02-26 09:55:48 -05002350 return ret;
2351 }
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002352 }
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02002353 aio_context_release(aio_context);
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002354 }
Stefan Hajnoczie8877492012-03-05 18:10:11 +00002355 return 0;
Markus Armbruster6ab4b5a2010-06-02 18:55:18 +02002356}
2357
Kevin Wolf756e6732010-01-12 12:55:17 +01002358/*
2359 * Return values:
2360 * 0 - success
2361 * -EINVAL - backing format specified, but no file
2362 * -ENOSPC - can't update the backing file because no space is left in the
2363 * image file header
2364 * -ENOTSUP - format driver doesn't support changing the backing file
2365 */
2366int bdrv_change_backing_file(BlockDriverState *bs,
2367 const char *backing_file, const char *backing_fmt)
2368{
2369 BlockDriver *drv = bs->drv;
Paolo Bonzini469ef352012-04-12 14:01:02 +02002370 int ret;
Kevin Wolf756e6732010-01-12 12:55:17 +01002371
Paolo Bonzini5f377792012-04-12 14:01:01 +02002372 /* Backing file format doesn't make sense without a backing file */
2373 if (backing_fmt && !backing_file) {
2374 return -EINVAL;
2375 }
2376
Kevin Wolf756e6732010-01-12 12:55:17 +01002377 if (drv->bdrv_change_backing_file != NULL) {
Paolo Bonzini469ef352012-04-12 14:01:02 +02002378 ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
Kevin Wolf756e6732010-01-12 12:55:17 +01002379 } else {
Paolo Bonzini469ef352012-04-12 14:01:02 +02002380 ret = -ENOTSUP;
Kevin Wolf756e6732010-01-12 12:55:17 +01002381 }
Paolo Bonzini469ef352012-04-12 14:01:02 +02002382
2383 if (ret == 0) {
2384 pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
2385 pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
2386 }
2387 return ret;
Kevin Wolf756e6732010-01-12 12:55:17 +01002388}
2389
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002390/*
2391 * Finds the image layer in the chain that has 'bs' as its backing file.
2392 *
2393 * active is the current topmost image.
2394 *
2395 * Returns NULL if bs is not found in active's image chain,
2396 * or if active == bs.
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002397 *
2398 * Returns the bottommost base image if bs == NULL.
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002399 */
2400BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
2401 BlockDriverState *bs)
2402{
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002403 while (active && bs != active->backing_hd) {
2404 active = active->backing_hd;
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002405 }
2406
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002407 return active;
2408}
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002409
Jeff Cody4caf0fc2014-06-25 15:35:26 -04002410/* Given a BDS, searches for the base layer. */
2411BlockDriverState *bdrv_find_base(BlockDriverState *bs)
2412{
2413 return bdrv_find_overlay(bs, NULL);
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002414}
2415
2416typedef struct BlkIntermediateStates {
2417 BlockDriverState *bs;
2418 QSIMPLEQ_ENTRY(BlkIntermediateStates) entry;
2419} BlkIntermediateStates;
2420
2421
2422/*
2423 * Drops images above 'base' up to and including 'top', and sets the image
2424 * above 'top' to have base as its backing file.
2425 *
2426 * Requires that the overlay to 'top' is opened r/w, so that the backing file
2427 * information in 'bs' can be properly updated.
2428 *
2429 * E.g., this will convert the following chain:
2430 * bottom <- base <- intermediate <- top <- active
2431 *
2432 * to
2433 *
2434 * bottom <- base <- active
2435 *
2436 * It is allowed for bottom==base, in which case it converts:
2437 *
2438 * base <- intermediate <- top <- active
2439 *
2440 * to
2441 *
2442 * base <- active
2443 *
Jeff Cody54e26902014-06-25 15:40:10 -04002444 * If backing_file_str is non-NULL, it will be used when modifying top's
2445 * overlay image metadata.
2446 *
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002447 * Error conditions:
2448 * if active == top, that is considered an error
2449 *
2450 */
2451int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
Jeff Cody54e26902014-06-25 15:40:10 -04002452 BlockDriverState *base, const char *backing_file_str)
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002453{
2454 BlockDriverState *intermediate;
2455 BlockDriverState *base_bs = NULL;
2456 BlockDriverState *new_top_bs = NULL;
2457 BlkIntermediateStates *intermediate_state, *next;
2458 int ret = -EIO;
2459
2460 QSIMPLEQ_HEAD(states_to_delete, BlkIntermediateStates) states_to_delete;
2461 QSIMPLEQ_INIT(&states_to_delete);
2462
2463 if (!top->drv || !base->drv) {
2464 goto exit;
2465 }
2466
2467 new_top_bs = bdrv_find_overlay(active, top);
2468
2469 if (new_top_bs == NULL) {
2470 /* we could not find the image above 'top', this is an error */
2471 goto exit;
2472 }
2473
2474 /* special case of new_top_bs->backing_hd already pointing to base - nothing
2475 * to do, no intermediate images */
2476 if (new_top_bs->backing_hd == base) {
2477 ret = 0;
2478 goto exit;
2479 }
2480
2481 intermediate = top;
2482
2483 /* now we will go down through the list, and add each BDS we find
2484 * into our deletion queue, until we hit the 'base'
2485 */
2486 while (intermediate) {
Markus Armbruster5839e532014-08-19 10:31:08 +02002487 intermediate_state = g_new0(BlkIntermediateStates, 1);
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002488 intermediate_state->bs = intermediate;
2489 QSIMPLEQ_INSERT_TAIL(&states_to_delete, intermediate_state, entry);
2490
2491 if (intermediate->backing_hd == base) {
2492 base_bs = intermediate->backing_hd;
2493 break;
2494 }
2495 intermediate = intermediate->backing_hd;
2496 }
2497 if (base_bs == NULL) {
2498 /* something went wrong, we did not end at the base. safely
2499 * unravel everything, and exit with error */
2500 goto exit;
2501 }
2502
2503 /* success - we can delete the intermediate states, and link top->base */
Jeff Cody54e26902014-06-25 15:40:10 -04002504 backing_file_str = backing_file_str ? backing_file_str : base_bs->filename;
2505 ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002506 base_bs->drv ? base_bs->drv->format_name : "");
2507 if (ret) {
2508 goto exit;
2509 }
Fam Zheng920beae2014-05-23 21:29:46 +08002510 bdrv_set_backing_hd(new_top_bs, base_bs);
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002511
2512 QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
2513 /* so that bdrv_close() does not recursively close the chain */
Fam Zheng920beae2014-05-23 21:29:46 +08002514 bdrv_set_backing_hd(intermediate_state->bs, NULL);
Fam Zheng4f6fd342013-08-23 09:14:47 +08002515 bdrv_unref(intermediate_state->bs);
Jeff Cody6ebdcee2012-09-27 13:29:12 -04002516 }
2517 ret = 0;
2518
2519exit:
2520 QSIMPLEQ_FOREACH_SAFE(intermediate_state, &states_to_delete, entry, next) {
2521 g_free(intermediate_state);
2522 }
2523 return ret;
2524}
2525
bellard83f64092006-08-01 16:21:11 +00002526/**
bellard83f64092006-08-01 16:21:11 +00002527 * Truncate file to 'offset' bytes (needed only for file protocols)
2528 */
2529int bdrv_truncate(BlockDriverState *bs, int64_t offset)
2530{
2531 BlockDriver *drv = bs->drv;
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002532 int ret;
bellard83f64092006-08-01 16:21:11 +00002533 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00002534 return -ENOMEDIUM;
bellard83f64092006-08-01 16:21:11 +00002535 if (!drv->bdrv_truncate)
2536 return -ENOTSUP;
Naphtali Sprei59f26892009-10-26 16:25:16 +02002537 if (bs->read_only)
2538 return -EACCES;
Jeff Cody9c75e162014-06-25 16:55:30 -04002539
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002540 ret = drv->bdrv_truncate(bs, offset);
2541 if (ret == 0) {
2542 ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
John Snowce1ffea2015-04-17 19:50:03 -04002543 bdrv_dirty_bitmap_truncate(bs);
Markus Armbrustera7f53e22014-10-07 13:59:25 +02002544 if (bs->blk) {
2545 blk_dev_resize_cb(bs->blk);
2546 }
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002547 }
2548 return ret;
bellard83f64092006-08-01 16:21:11 +00002549}
2550
2551/**
Fam Zheng4a1d5e12011-07-12 19:56:39 +08002552 * Length of a allocated file in bytes. Sparse files are counted by actual
2553 * allocated space. Return < 0 if error or unknown.
2554 */
2555int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
2556{
2557 BlockDriver *drv = bs->drv;
2558 if (!drv) {
2559 return -ENOMEDIUM;
2560 }
2561 if (drv->bdrv_get_allocated_file_size) {
2562 return drv->bdrv_get_allocated_file_size(bs);
2563 }
2564 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02002565 return bdrv_get_allocated_file_size(bs->file->bs);
Fam Zheng4a1d5e12011-07-12 19:56:39 +08002566 }
2567 return -ENOTSUP;
2568}
2569
2570/**
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002571 * Return number of sectors on success, -errno on error.
bellard83f64092006-08-01 16:21:11 +00002572 */
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002573int64_t bdrv_nb_sectors(BlockDriverState *bs)
bellard83f64092006-08-01 16:21:11 +00002574{
2575 BlockDriver *drv = bs->drv;
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002576
bellard83f64092006-08-01 16:21:11 +00002577 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00002578 return -ENOMEDIUM;
Stefan Hajnoczi51762282010-04-19 16:56:41 +01002579
Kevin Wolfb94a2612013-10-29 12:18:58 +01002580 if (drv->has_variable_length) {
2581 int ret = refresh_total_sectors(bs, bs->total_sectors);
2582 if (ret < 0) {
2583 return ret;
Stefan Hajnoczi46a4e4e2011-03-29 20:04:41 +01002584 }
bellard83f64092006-08-01 16:21:11 +00002585 }
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002586 return bs->total_sectors;
2587}
2588
2589/**
2590 * Return length in bytes on success, -errno on error.
2591 * The length is always a multiple of BDRV_SECTOR_SIZE.
2592 */
2593int64_t bdrv_getlength(BlockDriverState *bs)
2594{
2595 int64_t ret = bdrv_nb_sectors(bs);
2596
Fam Zheng4a9c9ea2015-05-15 16:36:05 +08002597 ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002598 return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
bellardfc01f7e2003-06-30 10:03:06 +00002599}
2600
bellard19cb3732006-08-19 11:45:59 +00002601/* return 0 as number of sectors if no device present or error */
ths96b8f132007-12-17 01:35:20 +00002602void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
bellardfc01f7e2003-06-30 10:03:06 +00002603{
Markus Armbruster65a9bb22014-06-26 13:23:17 +02002604 int64_t nb_sectors = bdrv_nb_sectors(bs);
2605
2606 *nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
bellardfc01f7e2003-06-30 10:03:06 +00002607}
bellardcf989512004-02-16 21:56:36 +00002608
Paolo Bonziniff06f5f2012-09-28 17:22:54 +02002609void bdrv_set_on_error(BlockDriverState *bs, BlockdevOnError on_read_error,
2610 BlockdevOnError on_write_error)
Markus Armbrusterabd7f682010-06-02 18:55:17 +02002611{
2612 bs->on_read_error = on_read_error;
2613 bs->on_write_error = on_write_error;
2614}
2615
Paolo Bonzini1ceee0d2012-09-28 17:22:56 +02002616BlockdevOnError bdrv_get_on_error(BlockDriverState *bs, bool is_read)
Markus Armbrusterabd7f682010-06-02 18:55:17 +02002617{
2618 return is_read ? bs->on_read_error : bs->on_write_error;
2619}
2620
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002621BlockErrorAction bdrv_get_error_action(BlockDriverState *bs, bool is_read, int error)
2622{
2623 BlockdevOnError on_err = is_read ? bs->on_read_error : bs->on_write_error;
2624
2625 switch (on_err) {
2626 case BLOCKDEV_ON_ERROR_ENOSPC:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002627 return (error == ENOSPC) ?
2628 BLOCK_ERROR_ACTION_STOP : BLOCK_ERROR_ACTION_REPORT;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002629 case BLOCKDEV_ON_ERROR_STOP:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002630 return BLOCK_ERROR_ACTION_STOP;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002631 case BLOCKDEV_ON_ERROR_REPORT:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002632 return BLOCK_ERROR_ACTION_REPORT;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002633 case BLOCKDEV_ON_ERROR_IGNORE:
Wenchao Xiaa5895692014-06-18 08:43:30 +02002634 return BLOCK_ERROR_ACTION_IGNORE;
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002635 default:
2636 abort();
2637 }
2638}
2639
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002640static void send_qmp_error_event(BlockDriverState *bs,
2641 BlockErrorAction action,
2642 bool is_read, int error)
2643{
Peter Maydell573742a2014-10-10 20:33:03 +01002644 IoOperationType optype;
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002645
Peter Maydell573742a2014-10-10 20:33:03 +01002646 optype = is_read ? IO_OPERATION_TYPE_READ : IO_OPERATION_TYPE_WRITE;
2647 qapi_event_send_block_io_error(bdrv_get_device_name(bs), optype, action,
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002648 bdrv_iostatus_is_enabled(bs),
Luiz Capitulino624ff572014-09-11 10:25:48 -04002649 error == ENOSPC, strerror(error),
2650 &error_abort);
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002651}
2652
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002653/* This is done by device models because, while the block layer knows
2654 * about the error, it does not know whether an operation comes from
2655 * the device or the block layer (from a job, for example).
2656 */
2657void bdrv_error_action(BlockDriverState *bs, BlockErrorAction action,
2658 bool is_read, int error)
2659{
2660 assert(error >= 0);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002661
Wenchao Xiaa5895692014-06-18 08:43:30 +02002662 if (action == BLOCK_ERROR_ACTION_STOP) {
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002663 /* First set the iostatus, so that "info block" returns an iostatus
2664 * that matches the events raised so far (an additional error iostatus
2665 * is fine, but not a lost one).
2666 */
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002667 bdrv_iostatus_set_err(bs, error);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002668
2669 /* Then raise the request to stop the VM and the event.
2670 * qemu_system_vmstop_request_prepare has two effects. First,
2671 * it ensures that the STOP event always comes after the
2672 * BLOCK_IO_ERROR event. Second, it ensures that even if management
2673 * can observe the STOP event and do a "cont" before the STOP
2674 * event is issued, the VM will not stop. In this case, vm_start()
2675 * also ensures that the STOP/RESUME pair of events is emitted.
2676 */
2677 qemu_system_vmstop_request_prepare();
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002678 send_qmp_error_event(bs, action, is_read, error);
Paolo Bonzini2bd3bce2014-06-05 14:53:59 +02002679 qemu_system_vmstop_request(RUN_STATE_IO_ERROR);
2680 } else {
Luiz Capitulinoc7c2ff02014-08-29 16:07:27 -04002681 send_qmp_error_event(bs, action, is_read, error);
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02002682 }
2683}
2684
bellardb3380822004-03-14 21:38:54 +00002685int bdrv_is_read_only(BlockDriverState *bs)
2686{
2687 return bs->read_only;
2688}
2689
ths985a03b2007-12-24 16:10:43 +00002690int bdrv_is_sg(BlockDriverState *bs)
2691{
2692 return bs->sg;
2693}
2694
Christoph Hellwige900a7b2009-09-04 19:01:15 +02002695int bdrv_enable_write_cache(BlockDriverState *bs)
2696{
2697 return bs->enable_write_cache;
2698}
2699
Paolo Bonzini425b0142012-06-06 00:04:52 +02002700void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
2701{
2702 bs->enable_write_cache = wce;
Jeff Cody55b110f2012-09-20 15:13:18 -04002703
2704 /* so a reopen() will preserve wce */
2705 if (wce) {
2706 bs->open_flags |= BDRV_O_CACHE_WB;
2707 } else {
2708 bs->open_flags &= ~BDRV_O_CACHE_WB;
2709 }
Paolo Bonzini425b0142012-06-06 00:04:52 +02002710}
2711
bellardea2384d2004-08-01 21:59:26 +00002712int bdrv_is_encrypted(BlockDriverState *bs)
2713{
2714 if (bs->backing_hd && bs->backing_hd->encrypted)
2715 return 1;
2716 return bs->encrypted;
2717}
2718
aliguoric0f4ce72009-03-05 23:01:01 +00002719int bdrv_key_required(BlockDriverState *bs)
2720{
2721 BlockDriverState *backing_hd = bs->backing_hd;
2722
2723 if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key)
2724 return 1;
2725 return (bs->encrypted && !bs->valid_key);
2726}
2727
bellardea2384d2004-08-01 21:59:26 +00002728int bdrv_set_key(BlockDriverState *bs, const char *key)
2729{
2730 int ret;
2731 if (bs->backing_hd && bs->backing_hd->encrypted) {
2732 ret = bdrv_set_key(bs->backing_hd, key);
2733 if (ret < 0)
2734 return ret;
2735 if (!bs->encrypted)
2736 return 0;
2737 }
Shahar Havivifd04a2a2010-03-06 00:26:13 +02002738 if (!bs->encrypted) {
2739 return -EINVAL;
2740 } else if (!bs->drv || !bs->drv->bdrv_set_key) {
2741 return -ENOMEDIUM;
2742 }
aliguoric0f4ce72009-03-05 23:01:01 +00002743 ret = bs->drv->bdrv_set_key(bs, key);
aliguoribb5fc202009-03-05 23:01:15 +00002744 if (ret < 0) {
2745 bs->valid_key = 0;
2746 } else if (!bs->valid_key) {
2747 bs->valid_key = 1;
Markus Armbrustera7f53e22014-10-07 13:59:25 +02002748 if (bs->blk) {
2749 /* call the change callback now, we skipped it on open */
2750 blk_dev_change_media_cb(bs->blk, true);
2751 }
aliguoribb5fc202009-03-05 23:01:15 +00002752 }
aliguoric0f4ce72009-03-05 23:01:01 +00002753 return ret;
bellardea2384d2004-08-01 21:59:26 +00002754}
2755
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002756/*
2757 * Provide an encryption key for @bs.
2758 * If @key is non-null:
2759 * If @bs is not encrypted, fail.
2760 * Else if the key is invalid, fail.
2761 * Else set @bs's key to @key, replacing the existing key, if any.
2762 * If @key is null:
2763 * If @bs is encrypted and still lacks a key, fail.
2764 * Else do nothing.
2765 * On failure, store an error object through @errp if non-null.
2766 */
2767void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
2768{
2769 if (key) {
2770 if (!bdrv_is_encrypted(bs)) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03002771 error_setg(errp, "Node '%s' is not encrypted",
2772 bdrv_get_device_or_node_name(bs));
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002773 } else if (bdrv_set_key(bs, key) < 0) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002774 error_setg(errp, QERR_INVALID_PASSWORD);
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002775 }
2776 } else {
2777 if (bdrv_key_required(bs)) {
Markus Armbrusterb1ca6392015-01-29 10:37:01 +01002778 error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
2779 "'%s' (%s) is encrypted",
Alberto Garcia81e5f782015-04-08 12:29:19 +03002780 bdrv_get_device_or_node_name(bs),
Markus Armbruster4d2855a2015-01-29 10:37:00 +01002781 bdrv_get_encrypted_filename(bs));
2782 }
2783 }
2784}
2785
Markus Armbrusterf8d6bba2012-06-13 10:11:48 +02002786const char *bdrv_get_format_name(BlockDriverState *bs)
bellardea2384d2004-08-01 21:59:26 +00002787{
Markus Armbrusterf8d6bba2012-06-13 10:11:48 +02002788 return bs->drv ? bs->drv->format_name : NULL;
bellardea2384d2004-08-01 21:59:26 +00002789}
2790
/*
 * qsort() comparator for an array of C strings (array of char pointers).
 *
 * qsort() passes pointers to the array elements, so @a and @b point to the
 * string pointers, not to the characters themselves; they must be
 * dereferenced once before being handed to strcmp().
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
2795
ths5fafdf22007-09-16 21:08:06 +00002796void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
bellardea2384d2004-08-01 21:59:26 +00002797 void *opaque)
2798{
2799 BlockDriver *drv;
Jeff Codye855e4f2014-04-28 18:29:54 -04002800 int count = 0;
Stefan Hajnocziada42402014-08-27 12:08:55 +01002801 int i;
Jeff Codye855e4f2014-04-28 18:29:54 -04002802 const char **formats = NULL;
bellardea2384d2004-08-01 21:59:26 +00002803
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +01002804 QLIST_FOREACH(drv, &bdrv_drivers, list) {
Jeff Codye855e4f2014-04-28 18:29:54 -04002805 if (drv->format_name) {
2806 bool found = false;
2807 int i = count;
2808 while (formats && i && !found) {
2809 found = !strcmp(formats[--i], drv->format_name);
2810 }
2811
2812 if (!found) {
Markus Armbruster5839e532014-08-19 10:31:08 +02002813 formats = g_renew(const char *, formats, count + 1);
Jeff Codye855e4f2014-04-28 18:29:54 -04002814 formats[count++] = drv->format_name;
Jeff Codye855e4f2014-04-28 18:29:54 -04002815 }
2816 }
bellardea2384d2004-08-01 21:59:26 +00002817 }
Stefan Hajnocziada42402014-08-27 12:08:55 +01002818
2819 qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
2820
2821 for (i = 0; i < count; i++) {
2822 it(opaque, formats[i]);
2823 }
2824
Jeff Codye855e4f2014-04-28 18:29:54 -04002825 g_free(formats);
bellardea2384d2004-08-01 21:59:26 +00002826}
2827
Benoît Canetdc364f42014-01-23 21:31:32 +01002828/* This function is to find a node in the bs graph */
2829BlockDriverState *bdrv_find_node(const char *node_name)
2830{
2831 BlockDriverState *bs;
2832
2833 assert(node_name);
2834
2835 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
2836 if (!strcmp(node_name, bs->node_name)) {
2837 return bs;
2838 }
2839 }
2840 return NULL;
2841}
2842
Benoît Canetc13163f2014-01-23 21:31:34 +01002843/* Put this QMP function here so it can access the static graph_bdrv_states. */
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002844BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
Benoît Canetc13163f2014-01-23 21:31:34 +01002845{
2846 BlockDeviceInfoList *list, *entry;
2847 BlockDriverState *bs;
2848
2849 list = NULL;
2850 QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002851 BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
2852 if (!info) {
2853 qapi_free_BlockDeviceInfoList(list);
2854 return NULL;
2855 }
Benoît Canetc13163f2014-01-23 21:31:34 +01002856 entry = g_malloc0(sizeof(*entry));
Alberto Garciad5a8ee62015-04-17 14:52:43 +03002857 entry->value = info;
Benoît Canetc13163f2014-01-23 21:31:34 +01002858 entry->next = list;
2859 list = entry;
2860 }
2861
2862 return list;
2863}
2864
Benoît Canet12d3ba82014-01-23 21:31:35 +01002865BlockDriverState *bdrv_lookup_bs(const char *device,
2866 const char *node_name,
2867 Error **errp)
2868{
Markus Armbruster7f06d472014-10-07 13:59:12 +02002869 BlockBackend *blk;
2870 BlockDriverState *bs;
Benoît Canet12d3ba82014-01-23 21:31:35 +01002871
Benoît Canet12d3ba82014-01-23 21:31:35 +01002872 if (device) {
Markus Armbruster7f06d472014-10-07 13:59:12 +02002873 blk = blk_by_name(device);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002874
Markus Armbruster7f06d472014-10-07 13:59:12 +02002875 if (blk) {
2876 return blk_bs(blk);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002877 }
Benoît Canet12d3ba82014-01-23 21:31:35 +01002878 }
2879
Benoît Canetdd67fa52014-02-12 17:15:06 +01002880 if (node_name) {
2881 bs = bdrv_find_node(node_name);
Benoît Canet12d3ba82014-01-23 21:31:35 +01002882
Benoît Canetdd67fa52014-02-12 17:15:06 +01002883 if (bs) {
2884 return bs;
2885 }
Benoît Canet12d3ba82014-01-23 21:31:35 +01002886 }
2887
Benoît Canetdd67fa52014-02-12 17:15:06 +01002888 error_setg(errp, "Cannot find device=%s nor node_name=%s",
2889 device ? device : "",
2890 node_name ? node_name : "");
2891 return NULL;
Benoît Canet12d3ba82014-01-23 21:31:35 +01002892}
2893
Jeff Cody5a6684d2014-06-25 15:40:09 -04002894/* If 'base' is in the same chain as 'top', return true. Otherwise,
2895 * return false. If either argument is NULL, return false. */
2896bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
2897{
2898 while (top && top != base) {
2899 top = top->backing_hd;
2900 }
2901
2902 return top != NULL;
2903}
2904
Fam Zheng04df7652014-10-31 11:32:54 +08002905BlockDriverState *bdrv_next_node(BlockDriverState *bs)
2906{
2907 if (!bs) {
2908 return QTAILQ_FIRST(&graph_bdrv_states);
2909 }
2910 return QTAILQ_NEXT(bs, node_list);
2911}
2912
Markus Armbruster2f399b02010-06-02 18:55:20 +02002913BlockDriverState *bdrv_next(BlockDriverState *bs)
2914{
2915 if (!bs) {
2916 return QTAILQ_FIRST(&bdrv_states);
2917 }
Benoît Canetdc364f42014-01-23 21:31:32 +01002918 return QTAILQ_NEXT(bs, device_list);
Markus Armbruster2f399b02010-06-02 18:55:20 +02002919}
2920
Fam Zheng20a9e772014-10-31 11:32:55 +08002921const char *bdrv_get_node_name(const BlockDriverState *bs)
2922{
2923 return bs->node_name;
2924}
2925
Markus Armbruster7f06d472014-10-07 13:59:12 +02002926/* TODO check what callers really want: bs->node_name or blk_name() */
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002927const char *bdrv_get_device_name(const BlockDriverState *bs)
bellardea2384d2004-08-01 21:59:26 +00002928{
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02002929 return bs->blk ? blk_name(bs->blk) : "";
bellardea2384d2004-08-01 21:59:26 +00002930}
2931
Alberto Garcia9b2aa842015-04-08 12:29:18 +03002932/* This can be used to identify nodes that might not have a device
2933 * name associated. Since node and device names live in the same
2934 * namespace, the result is unambiguous. The exception is if both are
2935 * absent, then this returns an empty (non-null) string. */
2936const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
2937{
2938 return bs->blk ? blk_name(bs->blk) : bs->node_name;
2939}
2940
Markus Armbrusterc8433282012-06-05 16:49:24 +02002941int bdrv_get_flags(BlockDriverState *bs)
2942{
2943 return bs->open_flags;
2944}
2945
Peter Lieven3ac21622013-06-28 12:47:42 +02002946int bdrv_has_zero_init_1(BlockDriverState *bs)
2947{
2948 return 1;
2949}
2950
Kevin Wolff2feebb2010-04-14 17:30:35 +02002951int bdrv_has_zero_init(BlockDriverState *bs)
2952{
2953 assert(bs->drv);
2954
Paolo Bonzini11212d82013-09-04 19:00:27 +02002955 /* If BS is a copy on write image, it is initialized to
2956 the contents of the base image, which may not be zeroes. */
2957 if (bs->backing_hd) {
2958 return 0;
2959 }
Kevin Wolf336c1c12010-07-28 11:26:29 +02002960 if (bs->drv->bdrv_has_zero_init) {
2961 return bs->drv->bdrv_has_zero_init(bs);
Kevin Wolff2feebb2010-04-14 17:30:35 +02002962 }
2963
Peter Lieven3ac21622013-06-28 12:47:42 +02002964 /* safe default */
2965 return 0;
Kevin Wolff2feebb2010-04-14 17:30:35 +02002966}
2967
Peter Lieven4ce78692013-10-24 12:06:54 +02002968bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
2969{
2970 BlockDriverInfo bdi;
2971
2972 if (bs->backing_hd) {
2973 return false;
2974 }
2975
2976 if (bdrv_get_info(bs, &bdi) == 0) {
2977 return bdi.unallocated_blocks_are_zero;
2978 }
2979
2980 return false;
2981}
2982
2983bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
2984{
2985 BlockDriverInfo bdi;
2986
2987 if (bs->backing_hd || !(bs->open_flags & BDRV_O_UNMAP)) {
2988 return false;
2989 }
2990
2991 if (bdrv_get_info(bs, &bdi) == 0) {
2992 return bdi.can_write_zeroes_with_unmap;
2993 }
2994
2995 return false;
2996}
2997
aliguori045df332009-03-05 23:00:48 +00002998const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
2999{
3000 if (bs->backing_hd && bs->backing_hd->encrypted)
3001 return bs->backing_file;
3002 else if (bs->encrypted)
3003 return bs->filename;
3004 else
3005 return NULL;
3006}
3007
ths5fafdf22007-09-16 21:08:06 +00003008void bdrv_get_backing_filename(BlockDriverState *bs,
bellard83f64092006-08-01 16:21:11 +00003009 char *filename, int filename_size)
bellardea2384d2004-08-01 21:59:26 +00003010{
Kevin Wolf3574c602011-10-26 11:02:11 +02003011 pstrcpy(filename, filename_size, bs->backing_file);
bellardea2384d2004-08-01 21:59:26 +00003012}
3013
bellardfaea38e2006-08-05 21:31:00 +00003014int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
3015{
3016 BlockDriver *drv = bs->drv;
3017 if (!drv)
bellard19cb3732006-08-19 11:45:59 +00003018 return -ENOMEDIUM;
bellardfaea38e2006-08-05 21:31:00 +00003019 if (!drv->bdrv_get_info)
3020 return -ENOTSUP;
3021 memset(bdi, 0, sizeof(*bdi));
3022 return drv->bdrv_get_info(bs, bdi);
3023}
3024
Max Reitzeae041f2013-10-09 10:46:16 +02003025ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
3026{
3027 BlockDriver *drv = bs->drv;
3028 if (drv && drv->bdrv_get_specific_info) {
3029 return drv->bdrv_get_specific_info(bs);
3030 }
3031 return NULL;
3032}
3033
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003034void bdrv_debug_event(BlockDriverState *bs, BlkDebugEvent event)
3035{
Kevin Wolfbf736fe2013-06-05 15:17:55 +02003036 if (!bs || !bs->drv || !bs->drv->bdrv_debug_event) {
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003037 return;
3038 }
3039
Kevin Wolfbf736fe2013-06-05 15:17:55 +02003040 bs->drv->bdrv_debug_event(bs, event);
Kevin Wolf41c695c2012-12-06 14:32:58 +01003041}
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003042
Kevin Wolf41c695c2012-12-06 14:32:58 +01003043int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
3044 const char *tag)
3045{
3046 while (bs && bs->drv && !bs->drv->bdrv_debug_breakpoint) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003047 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003048 }
3049
3050 if (bs && bs->drv && bs->drv->bdrv_debug_breakpoint) {
3051 return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
3052 }
3053
3054 return -ENOTSUP;
3055}
3056
Fam Zheng4cc70e92013-11-20 10:01:54 +08003057int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
3058{
3059 while (bs && bs->drv && !bs->drv->bdrv_debug_remove_breakpoint) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003060 bs = bs->file ? bs->file->bs : NULL;
Fam Zheng4cc70e92013-11-20 10:01:54 +08003061 }
3062
3063 if (bs && bs->drv && bs->drv->bdrv_debug_remove_breakpoint) {
3064 return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
3065 }
3066
3067 return -ENOTSUP;
3068}
3069
Kevin Wolf41c695c2012-12-06 14:32:58 +01003070int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
3071{
Max Reitz938789e2014-03-10 23:44:08 +01003072 while (bs && (!bs->drv || !bs->drv->bdrv_debug_resume)) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003073 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003074 }
3075
3076 if (bs && bs->drv && bs->drv->bdrv_debug_resume) {
3077 return bs->drv->bdrv_debug_resume(bs, tag);
3078 }
3079
3080 return -ENOTSUP;
3081}
3082
3083bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
3084{
3085 while (bs && bs->drv && !bs->drv->bdrv_debug_is_suspended) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003086 bs = bs->file ? bs->file->bs : NULL;
Kevin Wolf41c695c2012-12-06 14:32:58 +01003087 }
3088
3089 if (bs && bs->drv && bs->drv->bdrv_debug_is_suspended) {
3090 return bs->drv->bdrv_debug_is_suspended(bs, tag);
3091 }
3092
3093 return false;
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +01003094}
3095
Blue Swirl199630b2010-07-25 20:49:34 +00003096int bdrv_is_snapshot(BlockDriverState *bs)
3097{
3098 return !!(bs->open_flags & BDRV_O_SNAPSHOT);
3099}
3100
Jeff Codyb1b1d782012-10-16 15:49:09 -04003101/* backing_file can either be relative, or absolute, or a protocol. If it is
3102 * relative, it must be relative to the chain. So, passing in bs->filename
3103 * from a BDS as backing_file should not be done, as that may be relative to
3104 * the CWD rather than the chain. */
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003105BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
3106 const char *backing_file)
3107{
Jeff Codyb1b1d782012-10-16 15:49:09 -04003108 char *filename_full = NULL;
3109 char *backing_file_full = NULL;
3110 char *filename_tmp = NULL;
3111 int is_protocol = 0;
3112 BlockDriverState *curr_bs = NULL;
3113 BlockDriverState *retval = NULL;
3114
3115 if (!bs || !bs->drv || !backing_file) {
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003116 return NULL;
3117 }
3118
Jeff Codyb1b1d782012-10-16 15:49:09 -04003119 filename_full = g_malloc(PATH_MAX);
3120 backing_file_full = g_malloc(PATH_MAX);
3121 filename_tmp = g_malloc(PATH_MAX);
3122
3123 is_protocol = path_has_protocol(backing_file);
3124
3125 for (curr_bs = bs; curr_bs->backing_hd; curr_bs = curr_bs->backing_hd) {
3126
3127 /* If either of the filename paths is actually a protocol, then
3128 * compare unmodified paths; otherwise make paths relative */
3129 if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
3130 if (strcmp(backing_file, curr_bs->backing_file) == 0) {
3131 retval = curr_bs->backing_hd;
3132 break;
3133 }
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003134 } else {
Jeff Codyb1b1d782012-10-16 15:49:09 -04003135 /* If not an absolute filename path, make it relative to the current
3136 * image's filename path */
3137 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3138 backing_file);
3139
3140 /* We are going to compare absolute pathnames */
3141 if (!realpath(filename_tmp, filename_full)) {
3142 continue;
3143 }
3144
3145 /* We need to make sure the backing filename we are comparing against
3146 * is relative to the current image filename (or absolute) */
3147 path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
3148 curr_bs->backing_file);
3149
3150 if (!realpath(filename_tmp, backing_file_full)) {
3151 continue;
3152 }
3153
3154 if (strcmp(backing_file_full, filename_full) == 0) {
3155 retval = curr_bs->backing_hd;
3156 break;
3157 }
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003158 }
3159 }
3160
Jeff Codyb1b1d782012-10-16 15:49:09 -04003161 g_free(filename_full);
3162 g_free(backing_file_full);
3163 g_free(filename_tmp);
3164 return retval;
Marcelo Tosattie8a6bb92012-01-18 14:40:51 +00003165}
3166
Benoît Canetf198fd12012-08-02 10:22:47 +02003167int bdrv_get_backing_file_depth(BlockDriverState *bs)
3168{
3169 if (!bs->drv) {
3170 return 0;
3171 }
3172
3173 if (!bs->backing_hd) {
3174 return 0;
3175 }
3176
3177 return 1 + bdrv_get_backing_file_depth(bs->backing_hd);
3178}
3179
bellardea2384d2004-08-01 21:59:26 +00003180void bdrv_init(void)
3181{
Anthony Liguori5efa9d52009-05-09 17:03:42 -05003182 module_call_init(MODULE_INIT_BLOCK);
bellardea2384d2004-08-01 21:59:26 +00003183}
pbrookce1a14d2006-08-07 02:38:06 +00003184
Markus Armbrustereb852012009-10-27 18:41:44 +01003185void bdrv_init_with_whitelist(void)
3186{
3187 use_bdrv_whitelist = 1;
3188 bdrv_init();
3189}
3190
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003191void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
Anthony Liguori0f154232011-11-14 15:09:45 -06003192{
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003193 Error *local_err = NULL;
3194 int ret;
3195
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003196 if (!bs->drv) {
3197 return;
Anthony Liguori0f154232011-11-14 15:09:45 -06003198 }
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003199
Alexey Kardashevskiy7ea2d262014-10-09 13:50:46 +11003200 if (!(bs->open_flags & BDRV_O_INCOMING)) {
3201 return;
3202 }
3203 bs->open_flags &= ~BDRV_O_INCOMING;
3204
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003205 if (bs->drv->bdrv_invalidate_cache) {
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003206 bs->drv->bdrv_invalidate_cache(bs, &local_err);
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003207 } else if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003208 bdrv_invalidate_cache(bs->file->bs, &local_err);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003209 }
3210 if (local_err) {
3211 error_propagate(errp, local_err);
3212 return;
Kevin Wolf3456a8d2014-03-11 10:58:39 +01003213 }
3214
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003215 ret = refresh_total_sectors(bs, bs->total_sectors);
3216 if (ret < 0) {
3217 error_setg_errno(errp, -ret, "Could not refresh total sector count");
3218 return;
3219 }
Anthony Liguori0f154232011-11-14 15:09:45 -06003220}
3221
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003222void bdrv_invalidate_cache_all(Error **errp)
Anthony Liguori0f154232011-11-14 15:09:45 -06003223{
3224 BlockDriverState *bs;
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003225 Error *local_err = NULL;
Anthony Liguori0f154232011-11-14 15:09:45 -06003226
Benoît Canetdc364f42014-01-23 21:31:32 +01003227 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02003228 AioContext *aio_context = bdrv_get_aio_context(bs);
3229
3230 aio_context_acquire(aio_context);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003231 bdrv_invalidate_cache(bs, &local_err);
Stefan Hajnoczied78cda2014-05-08 16:34:35 +02003232 aio_context_release(aio_context);
Kevin Wolf5a8a30d2014-03-12 15:59:16 +01003233 if (local_err) {
3234 error_propagate(errp, local_err);
3235 return;
3236 }
Anthony Liguori0f154232011-11-14 15:09:45 -06003237 }
3238}
3239
Kevin Wolff9f05dc2011-07-15 13:50:26 +02003240/**************************************************************/
bellard19cb3732006-08-19 11:45:59 +00003241/* removable device support */
3242
3243/**
3244 * Return TRUE if the media is present
3245 */
3246int bdrv_is_inserted(BlockDriverState *bs)
3247{
3248 BlockDriver *drv = bs->drv;
Markus Armbrustera1aff5b2011-09-06 18:58:41 +02003249
bellard19cb3732006-08-19 11:45:59 +00003250 if (!drv)
3251 return 0;
3252 if (!drv->bdrv_is_inserted)
Markus Armbrustera1aff5b2011-09-06 18:58:41 +02003253 return 1;
3254 return drv->bdrv_is_inserted(bs);
bellard19cb3732006-08-19 11:45:59 +00003255}
3256
3257/**
Markus Armbruster8e49ca42011-08-03 15:08:08 +02003258 * Return whether the media changed since the last call to this
3259 * function, or -ENOTSUP if we don't know. Most drivers don't know.
bellard19cb3732006-08-19 11:45:59 +00003260 */
3261int bdrv_media_changed(BlockDriverState *bs)
3262{
3263 BlockDriver *drv = bs->drv;
bellard19cb3732006-08-19 11:45:59 +00003264
Markus Armbruster8e49ca42011-08-03 15:08:08 +02003265 if (drv && drv->bdrv_media_changed) {
3266 return drv->bdrv_media_changed(bs);
3267 }
3268 return -ENOTSUP;
bellard19cb3732006-08-19 11:45:59 +00003269}
3270
3271/**
3272 * If eject_flag is TRUE, eject the media. Otherwise, close the tray
3273 */
Luiz Capitulinof36f3942012-02-03 16:24:53 -02003274void bdrv_eject(BlockDriverState *bs, bool eject_flag)
bellard19cb3732006-08-19 11:45:59 +00003275{
3276 BlockDriver *drv = bs->drv;
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003277 const char *device_name;
bellard19cb3732006-08-19 11:45:59 +00003278
Markus Armbruster822e1cd2011-07-20 18:23:42 +02003279 if (drv && drv->bdrv_eject) {
3280 drv->bdrv_eject(bs, eject_flag);
bellard19cb3732006-08-19 11:45:59 +00003281 }
Luiz Capitulino6f382ed2012-02-14 13:41:13 -02003282
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003283 device_name = bdrv_get_device_name(bs);
3284 if (device_name[0] != '\0') {
3285 qapi_event_send_device_tray_moved(device_name,
Wenchao Xiaa5ee7bd2014-06-18 08:43:44 +02003286 eject_flag, &error_abort);
Luiz Capitulino6f382ed2012-02-14 13:41:13 -02003287 }
bellard19cb3732006-08-19 11:45:59 +00003288}
3289
bellard19cb3732006-08-19 11:45:59 +00003290/**
3291 * Lock or unlock the media (if it is locked, the user won't be able
3292 * to eject it manually).
3293 */
Markus Armbruster025e8492011-09-06 18:58:47 +02003294void bdrv_lock_medium(BlockDriverState *bs, bool locked)
bellard19cb3732006-08-19 11:45:59 +00003295{
3296 BlockDriver *drv = bs->drv;
3297
Markus Armbruster025e8492011-09-06 18:58:47 +02003298 trace_bdrv_lock_medium(bs, locked);
Stefan Hajnoczib8c6d092011-03-29 20:04:40 +01003299
Markus Armbruster025e8492011-09-06 18:58:47 +02003300 if (drv && drv->bdrv_lock_medium) {
3301 drv->bdrv_lock_medium(bs, locked);
bellard19cb3732006-08-19 11:45:59 +00003302 }
3303}
ths985a03b2007-12-24 16:10:43 +00003304
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01003305void bdrv_set_guest_block_size(BlockDriverState *bs, int align)
Markus Armbruster7b6f9302011-09-06 18:58:56 +02003306{
Paolo Bonzini1b7fd722011-11-29 11:35:47 +01003307 bs->guest_block_size = align;
Markus Armbruster7b6f9302011-09-06 18:58:56 +02003308}
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003309
Fam Zheng0db6e542015-04-17 19:49:50 -04003310BdrvDirtyBitmap *bdrv_find_dirty_bitmap(BlockDriverState *bs, const char *name)
3311{
3312 BdrvDirtyBitmap *bm;
3313
3314 assert(name);
3315 QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
3316 if (bm->name && !strcmp(name, bm->name)) {
3317 return bm;
3318 }
3319 }
3320 return NULL;
3321}
3322
John Snow20dca812015-04-17 19:50:02 -04003323void bdrv_dirty_bitmap_make_anon(BdrvDirtyBitmap *bitmap)
Fam Zheng0db6e542015-04-17 19:49:50 -04003324{
John Snow9bd2b082015-04-17 19:49:57 -04003325 assert(!bdrv_dirty_bitmap_frozen(bitmap));
Fam Zheng0db6e542015-04-17 19:49:50 -04003326 g_free(bitmap->name);
3327 bitmap->name = NULL;
3328}
3329
3330BdrvDirtyBitmap *bdrv_create_dirty_bitmap(BlockDriverState *bs,
John Snow5fba6c02015-04-17 19:49:51 -04003331 uint32_t granularity,
Fam Zheng0db6e542015-04-17 19:49:50 -04003332 const char *name,
Fam Zhengb8afb522014-04-16 09:34:30 +08003333 Error **errp)
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003334{
3335 int64_t bitmap_size;
Fam Zhenge4654d22013-11-13 18:29:43 +08003336 BdrvDirtyBitmap *bitmap;
John Snow5fba6c02015-04-17 19:49:51 -04003337 uint32_t sector_granularity;
Jan Kiszkaa55eb922009-11-30 18:21:19 +01003338
Paolo Bonzini50717e92013-01-21 17:09:45 +01003339 assert((granularity & (granularity - 1)) == 0);
3340
Fam Zheng0db6e542015-04-17 19:49:50 -04003341 if (name && bdrv_find_dirty_bitmap(bs, name)) {
3342 error_setg(errp, "Bitmap already exists: %s", name);
3343 return NULL;
3344 }
John Snow5fba6c02015-04-17 19:49:51 -04003345 sector_granularity = granularity >> BDRV_SECTOR_BITS;
3346 assert(sector_granularity);
Markus Armbruster57322b72014-06-26 13:23:22 +02003347 bitmap_size = bdrv_nb_sectors(bs);
Fam Zhengb8afb522014-04-16 09:34:30 +08003348 if (bitmap_size < 0) {
3349 error_setg_errno(errp, -bitmap_size, "could not get length of device");
3350 errno = -bitmap_size;
3351 return NULL;
3352 }
Markus Armbruster5839e532014-08-19 10:31:08 +02003353 bitmap = g_new0(BdrvDirtyBitmap, 1);
John Snow5fba6c02015-04-17 19:49:51 -04003354 bitmap->bitmap = hbitmap_alloc(bitmap_size, ctz32(sector_granularity));
John Snowe74e6b72015-04-17 19:49:59 -04003355 bitmap->size = bitmap_size;
Fam Zheng0db6e542015-04-17 19:49:50 -04003356 bitmap->name = g_strdup(name);
John Snowb8e6fb72015-04-17 19:49:56 -04003357 bitmap->disabled = false;
Fam Zhenge4654d22013-11-13 18:29:43 +08003358 QLIST_INSERT_HEAD(&bs->dirty_bitmaps, bitmap, list);
3359 return bitmap;
3360}
3361
John Snow9bd2b082015-04-17 19:49:57 -04003362bool bdrv_dirty_bitmap_frozen(BdrvDirtyBitmap *bitmap)
3363{
3364 return bitmap->successor;
3365}
3366
John Snowb8e6fb72015-04-17 19:49:56 -04003367bool bdrv_dirty_bitmap_enabled(BdrvDirtyBitmap *bitmap)
3368{
John Snow9bd2b082015-04-17 19:49:57 -04003369 return !(bitmap->disabled || bitmap->successor);
3370}
3371
John Snow9abe3bd2015-05-12 15:53:01 -04003372DirtyBitmapStatus bdrv_dirty_bitmap_status(BdrvDirtyBitmap *bitmap)
3373{
3374 if (bdrv_dirty_bitmap_frozen(bitmap)) {
3375 return DIRTY_BITMAP_STATUS_FROZEN;
3376 } else if (!bdrv_dirty_bitmap_enabled(bitmap)) {
3377 return DIRTY_BITMAP_STATUS_DISABLED;
3378 } else {
3379 return DIRTY_BITMAP_STATUS_ACTIVE;
3380 }
3381}
3382
John Snow9bd2b082015-04-17 19:49:57 -04003383/**
3384 * Create a successor bitmap destined to replace this bitmap after an operation.
3385 * Requires that the bitmap is not frozen and has no successor.
3386 */
3387int bdrv_dirty_bitmap_create_successor(BlockDriverState *bs,
3388 BdrvDirtyBitmap *bitmap, Error **errp)
3389{
3390 uint64_t granularity;
3391 BdrvDirtyBitmap *child;
3392
3393 if (bdrv_dirty_bitmap_frozen(bitmap)) {
3394 error_setg(errp, "Cannot create a successor for a bitmap that is "
3395 "currently frozen");
3396 return -1;
3397 }
3398 assert(!bitmap->successor);
3399
3400 /* Create an anonymous successor */
3401 granularity = bdrv_dirty_bitmap_granularity(bitmap);
3402 child = bdrv_create_dirty_bitmap(bs, granularity, NULL, errp);
3403 if (!child) {
3404 return -1;
3405 }
3406
3407 /* Successor will be on or off based on our current state. */
3408 child->disabled = bitmap->disabled;
3409
3410 /* Install the successor and freeze the parent */
3411 bitmap->successor = child;
3412 return 0;
3413}
3414
3415/**
3416 * For a bitmap with a successor, yield our name to the successor,
3417 * delete the old bitmap, and return a handle to the new bitmap.
3418 */
3419BdrvDirtyBitmap *bdrv_dirty_bitmap_abdicate(BlockDriverState *bs,
3420 BdrvDirtyBitmap *bitmap,
3421 Error **errp)
3422{
3423 char *name;
3424 BdrvDirtyBitmap *successor = bitmap->successor;
3425
3426 if (successor == NULL) {
3427 error_setg(errp, "Cannot relinquish control if "
3428 "there's no successor present");
3429 return NULL;
3430 }
3431
3432 name = bitmap->name;
3433 bitmap->name = NULL;
3434 successor->name = name;
3435 bitmap->successor = NULL;
3436 bdrv_release_dirty_bitmap(bs, bitmap);
3437
3438 return successor;
3439}
3440
3441/**
3442 * In cases of failure where we can no longer safely delete the parent,
3443 * we may wish to re-join the parent and child/successor.
3444 * The merged parent will be un-frozen, but not explicitly re-enabled.
3445 */
3446BdrvDirtyBitmap *bdrv_reclaim_dirty_bitmap(BlockDriverState *bs,
3447 BdrvDirtyBitmap *parent,
3448 Error **errp)
3449{
3450 BdrvDirtyBitmap *successor = parent->successor;
3451
3452 if (!successor) {
3453 error_setg(errp, "Cannot reclaim a successor when none is present");
3454 return NULL;
3455 }
3456
3457 if (!hbitmap_merge(parent->bitmap, successor->bitmap)) {
3458 error_setg(errp, "Merging of parent and successor bitmap failed");
3459 return NULL;
3460 }
3461 bdrv_release_dirty_bitmap(bs, successor);
3462 parent->successor = NULL;
3463
3464 return parent;
John Snowb8e6fb72015-04-17 19:49:56 -04003465}
3466
John Snowce1ffea2015-04-17 19:50:03 -04003467/**
3468 * Truncates _all_ bitmaps attached to a BDS.
3469 */
3470static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs)
3471{
3472 BdrvDirtyBitmap *bitmap;
3473 uint64_t size = bdrv_nb_sectors(bs);
3474
3475 QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
John Snow06207b02015-06-10 13:24:54 -04003476 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowce1ffea2015-04-17 19:50:03 -04003477 hbitmap_truncate(bitmap->bitmap, size);
John Snow5270b6a2015-06-08 16:49:15 -04003478 bitmap->size = size;
John Snowce1ffea2015-04-17 19:50:03 -04003479 }
3480}
3481
Fam Zhenge4654d22013-11-13 18:29:43 +08003482void bdrv_release_dirty_bitmap(BlockDriverState *bs, BdrvDirtyBitmap *bitmap)
3483{
3484 BdrvDirtyBitmap *bm, *next;
3485 QLIST_FOREACH_SAFE(bm, &bs->dirty_bitmaps, list, next) {
3486 if (bm == bitmap) {
John Snow9bd2b082015-04-17 19:49:57 -04003487 assert(!bdrv_dirty_bitmap_frozen(bm));
Fam Zhenge4654d22013-11-13 18:29:43 +08003488 QLIST_REMOVE(bitmap, list);
3489 hbitmap_free(bitmap->bitmap);
Fam Zheng0db6e542015-04-17 19:49:50 -04003490 g_free(bitmap->name);
Fam Zhenge4654d22013-11-13 18:29:43 +08003491 g_free(bitmap);
3492 return;
Jan Kiszkaa55eb922009-11-30 18:21:19 +01003493 }
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003494 }
3495}
3496
John Snowb8e6fb72015-04-17 19:49:56 -04003497void bdrv_disable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3498{
John Snow9bd2b082015-04-17 19:49:57 -04003499 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowb8e6fb72015-04-17 19:49:56 -04003500 bitmap->disabled = true;
3501}
3502
3503void bdrv_enable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3504{
John Snow9bd2b082015-04-17 19:49:57 -04003505 assert(!bdrv_dirty_bitmap_frozen(bitmap));
John Snowb8e6fb72015-04-17 19:49:56 -04003506 bitmap->disabled = false;
3507}
3508
Fam Zheng21b56832013-11-13 18:29:44 +08003509BlockDirtyInfoList *bdrv_query_dirty_bitmaps(BlockDriverState *bs)
3510{
3511 BdrvDirtyBitmap *bm;
3512 BlockDirtyInfoList *list = NULL;
3513 BlockDirtyInfoList **plist = &list;
3514
3515 QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
Markus Armbruster5839e532014-08-19 10:31:08 +02003516 BlockDirtyInfo *info = g_new0(BlockDirtyInfo, 1);
3517 BlockDirtyInfoList *entry = g_new0(BlockDirtyInfoList, 1);
John Snow20dca812015-04-17 19:50:02 -04003518 info->count = bdrv_get_dirty_count(bm);
John Snow592fdd02015-04-17 19:49:53 -04003519 info->granularity = bdrv_dirty_bitmap_granularity(bm);
Fam Zheng0db6e542015-04-17 19:49:50 -04003520 info->has_name = !!bm->name;
3521 info->name = g_strdup(bm->name);
John Snow9abe3bd2015-05-12 15:53:01 -04003522 info->status = bdrv_dirty_bitmap_status(bm);
Fam Zheng21b56832013-11-13 18:29:44 +08003523 entry->value = info;
3524 *plist = entry;
3525 plist = &entry->next;
3526 }
3527
3528 return list;
3529}
3530
Fam Zhenge4654d22013-11-13 18:29:43 +08003531int bdrv_get_dirty(BlockDriverState *bs, BdrvDirtyBitmap *bitmap, int64_t sector)
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003532{
Fam Zhenge4654d22013-11-13 18:29:43 +08003533 if (bitmap) {
3534 return hbitmap_get(bitmap->bitmap, sector);
lirans@il.ibm.com7cd1e322009-11-02 15:40:41 +02003535 } else {
3536 return 0;
3537 }
3538}
3539
John Snow341ebc22015-04-17 19:49:52 -04003540/**
3541 * Chooses a default granularity based on the existing cluster size,
3542 * but clamped between [4K, 64K]. Defaults to 64K in the case that there
3543 * is no cluster size information available.
3544 */
3545uint32_t bdrv_get_default_bitmap_granularity(BlockDriverState *bs)
3546{
3547 BlockDriverInfo bdi;
3548 uint32_t granularity;
3549
3550 if (bdrv_get_info(bs, &bdi) >= 0 && bdi.cluster_size > 0) {
3551 granularity = MAX(4096, bdi.cluster_size);
3552 granularity = MIN(65536, granularity);
3553 } else {
3554 granularity = 65536;
3555 }
3556
3557 return granularity;
3558}
3559
John Snow592fdd02015-04-17 19:49:53 -04003560uint32_t bdrv_dirty_bitmap_granularity(BdrvDirtyBitmap *bitmap)
3561{
3562 return BDRV_SECTOR_SIZE << hbitmap_granularity(bitmap->bitmap);
3563}
3564
John Snow20dca812015-04-17 19:50:02 -04003565void bdrv_dirty_iter_init(BdrvDirtyBitmap *bitmap, HBitmapIter *hbi)
Paolo Bonzini1755da12012-10-18 16:49:18 +02003566{
Fam Zhenge4654d22013-11-13 18:29:43 +08003567 hbitmap_iter_init(hbi, bitmap->bitmap, 0);
Paolo Bonzini1755da12012-10-18 16:49:18 +02003568}
3569
John Snow20dca812015-04-17 19:50:02 -04003570void bdrv_set_dirty_bitmap(BdrvDirtyBitmap *bitmap,
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003571 int64_t cur_sector, int nr_sectors)
3572{
John Snowb8e6fb72015-04-17 19:49:56 -04003573 assert(bdrv_dirty_bitmap_enabled(bitmap));
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003574 hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
3575}
3576
John Snow20dca812015-04-17 19:50:02 -04003577void bdrv_reset_dirty_bitmap(BdrvDirtyBitmap *bitmap,
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003578 int64_t cur_sector, int nr_sectors)
3579{
John Snowb8e6fb72015-04-17 19:49:56 -04003580 assert(bdrv_dirty_bitmap_enabled(bitmap));
Vladimir Sementsov-Ogievskiyc4237df2014-11-27 12:40:46 +03003581 hbitmap_reset(bitmap->bitmap, cur_sector, nr_sectors);
3582}
3583
John Snowe74e6b72015-04-17 19:49:59 -04003584void bdrv_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap)
3585{
3586 assert(bdrv_dirty_bitmap_enabled(bitmap));
Wen Congyangc6a8c322015-05-22 09:29:46 +08003587 hbitmap_reset_all(bitmap->bitmap);
John Snowe74e6b72015-04-17 19:49:59 -04003588}
3589
Stefan Hajnoczie0c47b62015-04-28 14:27:50 +01003590void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector,
3591 int nr_sectors)
Paolo Bonzini1755da12012-10-18 16:49:18 +02003592{
Fam Zhenge4654d22013-11-13 18:29:43 +08003593 BdrvDirtyBitmap *bitmap;
3594 QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
John Snowb8e6fb72015-04-17 19:49:56 -04003595 if (!bdrv_dirty_bitmap_enabled(bitmap)) {
3596 continue;
3597 }
Fam Zhenge4654d22013-11-13 18:29:43 +08003598 hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
Paolo Bonzini8f0720e2013-01-21 17:09:41 +01003599 }
Liran Schouraaa0eb72010-01-26 10:31:48 +02003600}
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003601
John Snowd58d8452015-04-17 19:49:58 -04003602/**
3603 * Advance an HBitmapIter to an arbitrary offset.
3604 */
3605void bdrv_set_dirty_iter(HBitmapIter *hbi, int64_t offset)
3606{
3607 assert(hbi->hb);
3608 hbitmap_iter_init(hbi, hbi->hb, offset);
3609}
3610
John Snow20dca812015-04-17 19:50:02 -04003611int64_t bdrv_get_dirty_count(BdrvDirtyBitmap *bitmap)
Fam Zhenge4654d22013-11-13 18:29:43 +08003612{
3613 return hbitmap_count(bitmap->bitmap);
3614}
3615
Fam Zheng9fcb0252013-08-23 09:14:46 +08003616/* Get a reference to bs */
3617void bdrv_ref(BlockDriverState *bs)
3618{
3619 bs->refcnt++;
3620}
3621
3622/* Release a previously grabbed reference to bs.
3623 * If after releasing, reference count is zero, the BlockDriverState is
3624 * deleted. */
3625void bdrv_unref(BlockDriverState *bs)
3626{
Jeff Cody9a4d5ca2014-07-23 17:22:57 -04003627 if (!bs) {
3628 return;
3629 }
Fam Zheng9fcb0252013-08-23 09:14:46 +08003630 assert(bs->refcnt > 0);
3631 if (--bs->refcnt == 0) {
3632 bdrv_delete(bs);
3633 }
3634}
3635
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003636struct BdrvOpBlocker {
3637 Error *reason;
3638 QLIST_ENTRY(BdrvOpBlocker) list;
3639};
3640
3641bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
3642{
3643 BdrvOpBlocker *blocker;
3644 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3645 if (!QLIST_EMPTY(&bs->op_blockers[op])) {
3646 blocker = QLIST_FIRST(&bs->op_blockers[op]);
3647 if (errp) {
Alberto Garcia81e5f782015-04-08 12:29:19 +03003648 error_setg(errp, "Node '%s' is busy: %s",
3649 bdrv_get_device_or_node_name(bs),
Markus Armbrusterbfb197e2014-10-07 13:59:11 +02003650 error_get_pretty(blocker->reason));
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003651 }
3652 return true;
3653 }
3654 return false;
3655}
3656
3657void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
3658{
3659 BdrvOpBlocker *blocker;
3660 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3661
Markus Armbruster5839e532014-08-19 10:31:08 +02003662 blocker = g_new0(BdrvOpBlocker, 1);
Fam Zhengfbe40ff2014-05-23 21:29:42 +08003663 blocker->reason = reason;
3664 QLIST_INSERT_HEAD(&bs->op_blockers[op], blocker, list);
3665}
3666
3667void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
3668{
3669 BdrvOpBlocker *blocker, *next;
3670 assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);
3671 QLIST_FOREACH_SAFE(blocker, &bs->op_blockers[op], list, next) {
3672 if (blocker->reason == reason) {
3673 QLIST_REMOVE(blocker, list);
3674 g_free(blocker);
3675 }
3676 }
3677}
3678
3679void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
3680{
3681 int i;
3682 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3683 bdrv_op_block(bs, i, reason);
3684 }
3685}
3686
3687void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
3688{
3689 int i;
3690 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3691 bdrv_op_unblock(bs, i, reason);
3692 }
3693}
3694
3695bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
3696{
3697 int i;
3698
3699 for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
3700 if (!QLIST_EMPTY(&bs->op_blockers[i])) {
3701 return false;
3702 }
3703 }
3704 return true;
3705}
3706
Luiz Capitulino28a72822011-09-26 17:43:50 -03003707void bdrv_iostatus_enable(BlockDriverState *bs)
3708{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003709 bs->iostatus_enabled = true;
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003710 bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003711}
3712
3713/* The I/O status is only enabled if the drive explicitly
3714 * enables it _and_ the VM is configured to stop on errors */
3715bool bdrv_iostatus_is_enabled(const BlockDriverState *bs)
3716{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003717 return (bs->iostatus_enabled &&
Paolo Bonzini92aa5c62012-09-28 17:22:55 +02003718 (bs->on_write_error == BLOCKDEV_ON_ERROR_ENOSPC ||
3719 bs->on_write_error == BLOCKDEV_ON_ERROR_STOP ||
3720 bs->on_read_error == BLOCKDEV_ON_ERROR_STOP));
Luiz Capitulino28a72822011-09-26 17:43:50 -03003721}
3722
3723void bdrv_iostatus_disable(BlockDriverState *bs)
3724{
Luiz Capitulinod6bf2792011-10-14 17:11:23 -03003725 bs->iostatus_enabled = false;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003726}
3727
3728void bdrv_iostatus_reset(BlockDriverState *bs)
3729{
3730 if (bdrv_iostatus_is_enabled(bs)) {
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003731 bs->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
Paolo Bonzini3bd293c2012-10-18 16:49:27 +02003732 if (bs->job) {
3733 block_job_iostatus_reset(bs->job);
3734 }
Luiz Capitulino28a72822011-09-26 17:43:50 -03003735 }
3736}
3737
Luiz Capitulino28a72822011-09-26 17:43:50 -03003738void bdrv_iostatus_set_err(BlockDriverState *bs, int error)
3739{
Paolo Bonzini3e1caa52012-09-28 17:22:57 +02003740 assert(bdrv_iostatus_is_enabled(bs));
3741 if (bs->iostatus == BLOCK_DEVICE_IO_STATUS_OK) {
Luiz Capitulino58e21ef2011-10-14 17:22:24 -03003742 bs->iostatus = error == ENOSPC ? BLOCK_DEVICE_IO_STATUS_NOSPACE :
3743 BLOCK_DEVICE_IO_STATUS_FAILED;
Luiz Capitulino28a72822011-09-26 17:43:50 -03003744 }
3745}
3746
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003747void bdrv_img_create(const char *filename, const char *fmt,
3748 const char *base_filename, const char *base_fmt,
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003749 char *options, uint64_t img_size, int flags,
3750 Error **errp, bool quiet)
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003751{
Chunyan Liu83d05212014-06-05 17:20:51 +08003752 QemuOptsList *create_opts = NULL;
3753 QemuOpts *opts = NULL;
3754 const char *backing_fmt, *backing_file;
3755 int64_t size;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003756 BlockDriver *drv, *proto_drv;
Max Reitzcc84d902013-09-06 17:14:26 +02003757 Error *local_err = NULL;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003758 int ret = 0;
3759
3760 /* Find driver and parse its options */
3761 drv = bdrv_find_format(fmt);
3762 if (!drv) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003763 error_setg(errp, "Unknown file format '%s'", fmt);
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003764 return;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003765 }
3766
Max Reitzb65a5e12015-02-05 13:58:12 -05003767 proto_drv = bdrv_find_protocol(filename, true, errp);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003768 if (!proto_drv) {
Luiz Capitulinod92ada22012-11-30 10:52:09 -02003769 return;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003770 }
3771
Max Reitzc6149722014-12-02 18:32:45 +01003772 if (!drv->create_opts) {
3773 error_setg(errp, "Format driver '%s' does not support image creation",
3774 drv->format_name);
3775 return;
3776 }
3777
3778 if (!proto_drv->create_opts) {
3779 error_setg(errp, "Protocol driver '%s' does not support image creation",
3780 proto_drv->format_name);
3781 return;
3782 }
3783
Chunyan Liuc282e1f2014-06-05 17:21:11 +08003784 create_opts = qemu_opts_append(create_opts, drv->create_opts);
3785 create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003786
3787 /* Create parameter list with default values */
Chunyan Liu83d05212014-06-05 17:20:51 +08003788 opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
Markus Armbruster39101f22015-02-12 16:46:36 +01003789 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003790
3791 /* Parse -o options */
3792 if (options) {
Markus Armbrusterdc523cd342015-02-12 18:37:11 +01003793 qemu_opts_do_parse(opts, options, NULL, &local_err);
3794 if (local_err) {
3795 error_report_err(local_err);
3796 local_err = NULL;
Chunyan Liu83d05212014-06-05 17:20:51 +08003797 error_setg(errp, "Invalid options for file format '%s'", fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003798 goto out;
3799 }
3800 }
3801
3802 if (base_filename) {
Markus Armbrusterf43e47d2015-02-12 17:52:20 +01003803 qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
Markus Armbruster6be41942015-02-12 17:49:02 +01003804 if (local_err) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003805 error_setg(errp, "Backing file not supported for file format '%s'",
3806 fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003807 goto out;
3808 }
3809 }
3810
3811 if (base_fmt) {
Markus Armbrusterf43e47d2015-02-12 17:52:20 +01003812 qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
Markus Armbruster6be41942015-02-12 17:49:02 +01003813 if (local_err) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003814 error_setg(errp, "Backing file format not supported for file "
3815 "format '%s'", fmt);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003816 goto out;
3817 }
3818 }
3819
Chunyan Liu83d05212014-06-05 17:20:51 +08003820 backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
3821 if (backing_file) {
3822 if (!strcmp(filename, backing_file)) {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003823 error_setg(errp, "Error: Trying to create an image with the "
3824 "same filename as the backing file");
Jes Sorensen792da932010-12-16 13:52:17 +01003825 goto out;
3826 }
3827 }
3828
Chunyan Liu83d05212014-06-05 17:20:51 +08003829 backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003830
3831 // The size for the image must always be specified, with one exception:
3832 // If we are using a backing file, we can obtain the size from there
Chunyan Liu83d05212014-06-05 17:20:51 +08003833 size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
3834 if (size == -1) {
3835 if (backing_file) {
Max Reitz66f6b812013-12-03 14:57:52 +01003836 BlockDriverState *bs;
Max Reitz29168012014-11-26 17:20:27 +01003837 char *full_backing = g_new0(char, PATH_MAX);
Markus Armbruster52bf1e72014-06-26 13:23:25 +02003838 int64_t size;
Paolo Bonzini63090da2012-04-12 14:01:03 +02003839 int back_flags;
Max Reitze6641712015-08-26 19:47:48 +02003840 QDict *backing_options = NULL;
Paolo Bonzini63090da2012-04-12 14:01:03 +02003841
Max Reitz29168012014-11-26 17:20:27 +01003842 bdrv_get_full_backing_filename_from_filename(filename, backing_file,
3843 full_backing, PATH_MAX,
3844 &local_err);
3845 if (local_err) {
3846 g_free(full_backing);
3847 goto out;
3848 }
3849
Paolo Bonzini63090da2012-04-12 14:01:03 +02003850 /* backing files always opened read-only */
3851 back_flags =
3852 flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003853
Max Reitze6641712015-08-26 19:47:48 +02003854 if (backing_fmt) {
3855 backing_options = qdict_new();
3856 qdict_put(backing_options, "driver",
3857 qstring_from_str(backing_fmt));
3858 }
3859
Max Reitzf67503e2014-02-18 18:33:05 +01003860 bs = NULL;
Max Reitze6641712015-08-26 19:47:48 +02003861 ret = bdrv_open(&bs, full_backing, NULL, backing_options,
Max Reitz6ebf9aa2015-08-26 19:47:49 +02003862 back_flags, &local_err);
Max Reitz29168012014-11-26 17:20:27 +01003863 g_free(full_backing);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003864 if (ret < 0) {
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003865 goto out;
3866 }
Markus Armbruster52bf1e72014-06-26 13:23:25 +02003867 size = bdrv_getlength(bs);
3868 if (size < 0) {
3869 error_setg_errno(errp, -size, "Could not get size of '%s'",
3870 backing_file);
3871 bdrv_unref(bs);
3872 goto out;
3873 }
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003874
Markus Armbruster39101f22015-02-12 16:46:36 +01003875 qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
Max Reitz66f6b812013-12-03 14:57:52 +01003876
3877 bdrv_unref(bs);
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003878 } else {
Luiz Capitulino71c79812012-11-30 10:52:04 -02003879 error_setg(errp, "Image creation needs a size parameter");
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003880 goto out;
3881 }
3882 }
3883
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003884 if (!quiet) {
Kővágó, Zoltánfe646692015-07-07 16:42:10 +02003885 printf("Formatting '%s', fmt=%s ", filename, fmt);
Fam Zheng43c5d8f2014-12-09 15:38:04 +08003886 qemu_opts_print(opts, " ");
Miroslav Rezaninaf382d432013-02-13 09:09:40 +01003887 puts("");
3888 }
Chunyan Liu83d05212014-06-05 17:20:51 +08003889
Chunyan Liuc282e1f2014-06-05 17:21:11 +08003890 ret = bdrv_create(drv, filename, opts, &local_err);
Chunyan Liu83d05212014-06-05 17:20:51 +08003891
Max Reitzcc84d902013-09-06 17:14:26 +02003892 if (ret == -EFBIG) {
3893 /* This is generally a better message than whatever the driver would
3894 * deliver (especially because of the cluster_size_hint), since that
3895 * is most probably not much different from "image too large". */
3896 const char *cluster_size_hint = "";
Chunyan Liu83d05212014-06-05 17:20:51 +08003897 if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
Max Reitzcc84d902013-09-06 17:14:26 +02003898 cluster_size_hint = " (try using a larger cluster size)";
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003899 }
Max Reitzcc84d902013-09-06 17:14:26 +02003900 error_setg(errp, "The image size is too large for file format '%s'"
3901 "%s", fmt, cluster_size_hint);
3902 error_free(local_err);
3903 local_err = NULL;
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003904 }
3905
3906out:
Chunyan Liu83d05212014-06-05 17:20:51 +08003907 qemu_opts_del(opts);
3908 qemu_opts_free(create_opts);
Markus Armbruster84d18f02014-01-30 15:07:28 +01003909 if (local_err) {
Max Reitzcc84d902013-09-06 17:14:26 +02003910 error_propagate(errp, local_err);
3911 }
Jes Sorensenf88e1a42010-12-16 13:52:15 +01003912}
Stefan Hajnoczi85d126f2013-03-07 13:41:48 +01003913
3914AioContext *bdrv_get_aio_context(BlockDriverState *bs)
3915{
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003916 return bs->aio_context;
3917}
3918
3919void bdrv_detach_aio_context(BlockDriverState *bs)
3920{
Max Reitz33384422014-06-20 21:57:33 +02003921 BdrvAioNotifier *baf;
3922
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003923 if (!bs->drv) {
3924 return;
3925 }
3926
Max Reitz33384422014-06-20 21:57:33 +02003927 QLIST_FOREACH(baf, &bs->aio_notifiers, list) {
3928 baf->detach_aio_context(baf->opaque);
3929 }
3930
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003931 if (bs->io_limits_enabled) {
Benoît Canet0e5b0a22015-06-08 18:17:41 +02003932 throttle_timers_detach_aio_context(&bs->throttle_timers);
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003933 }
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003934 if (bs->drv->bdrv_detach_aio_context) {
3935 bs->drv->bdrv_detach_aio_context(bs);
3936 }
3937 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003938 bdrv_detach_aio_context(bs->file->bs);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003939 }
3940 if (bs->backing_hd) {
3941 bdrv_detach_aio_context(bs->backing_hd);
3942 }
3943
3944 bs->aio_context = NULL;
3945}
3946
3947void bdrv_attach_aio_context(BlockDriverState *bs,
3948 AioContext *new_context)
3949{
Max Reitz33384422014-06-20 21:57:33 +02003950 BdrvAioNotifier *ban;
3951
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003952 if (!bs->drv) {
3953 return;
3954 }
3955
3956 bs->aio_context = new_context;
3957
3958 if (bs->backing_hd) {
3959 bdrv_attach_aio_context(bs->backing_hd, new_context);
3960 }
3961 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02003962 bdrv_attach_aio_context(bs->file->bs, new_context);
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003963 }
3964 if (bs->drv->bdrv_attach_aio_context) {
3965 bs->drv->bdrv_attach_aio_context(bs, new_context);
3966 }
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003967 if (bs->io_limits_enabled) {
Benoît Canet0e5b0a22015-06-08 18:17:41 +02003968 throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
Stefan Hajnoczi13af91e2014-05-14 16:22:45 +02003969 }
Max Reitz33384422014-06-20 21:57:33 +02003970
3971 QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
3972 ban->attached_aio_context(new_context, ban->opaque);
3973 }
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003974}
3975
3976void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
3977{
Fam Zheng53ec73e2015-05-29 18:53:14 +08003978 bdrv_drain(bs); /* ensure there are no in-flight requests */
Stefan Hajnoczidcd04222014-05-08 16:34:37 +02003979
3980 bdrv_detach_aio_context(bs);
3981
3982 /* This function executes in the old AioContext so acquire the new one in
3983 * case it runs in a different thread.
3984 */
3985 aio_context_acquire(new_context);
3986 bdrv_attach_aio_context(bs, new_context);
3987 aio_context_release(new_context);
Stefan Hajnoczi85d126f2013-03-07 13:41:48 +01003988}
Stefan Hajnoczid616b222013-06-24 17:13:10 +02003989
Max Reitz33384422014-06-20 21:57:33 +02003990void bdrv_add_aio_context_notifier(BlockDriverState *bs,
3991 void (*attached_aio_context)(AioContext *new_context, void *opaque),
3992 void (*detach_aio_context)(void *opaque), void *opaque)
3993{
3994 BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
3995 *ban = (BdrvAioNotifier){
3996 .attached_aio_context = attached_aio_context,
3997 .detach_aio_context = detach_aio_context,
3998 .opaque = opaque
3999 };
4000
4001 QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
4002}
4003
4004void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
4005 void (*attached_aio_context)(AioContext *,
4006 void *),
4007 void (*detach_aio_context)(void *),
4008 void *opaque)
4009{
4010 BdrvAioNotifier *ban, *ban_next;
4011
4012 QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
4013 if (ban->attached_aio_context == attached_aio_context &&
4014 ban->detach_aio_context == detach_aio_context &&
4015 ban->opaque == opaque)
4016 {
4017 QLIST_REMOVE(ban, list);
4018 g_free(ban);
4019
4020 return;
4021 }
4022 }
4023
4024 abort();
4025}
4026
Max Reitz77485432014-10-27 11:12:50 +01004027int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
4028 BlockDriverAmendStatusCB *status_cb)
Max Reitz6f176b42013-09-03 10:09:50 +02004029{
Chunyan Liuc282e1f2014-06-05 17:21:11 +08004030 if (!bs->drv->bdrv_amend_options) {
Max Reitz6f176b42013-09-03 10:09:50 +02004031 return -ENOTSUP;
4032 }
Max Reitz77485432014-10-27 11:12:50 +01004033 return bs->drv->bdrv_amend_options(bs, opts, status_cb);
Max Reitz6f176b42013-09-03 10:09:50 +02004034}
Benoît Canetf6186f42013-10-02 14:33:48 +02004035
Benoît Canetb5042a32014-03-03 19:11:34 +01004036/* This function will be called by the bdrv_recurse_is_first_non_filter method
4037 * of block filter and by bdrv_is_first_non_filter.
4038 * It is used to test if the given bs is the candidate or recurse more in the
4039 * node graph.
Benoît Canet212a5a82014-01-23 21:31:36 +01004040 */
Benoît Canet212a5a82014-01-23 21:31:36 +01004041bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
4042 BlockDriverState *candidate)
Benoît Canetf6186f42013-10-02 14:33:48 +02004043{
Benoît Canetb5042a32014-03-03 19:11:34 +01004044 /* return false if basic checks fails */
4045 if (!bs || !bs->drv) {
4046 return false;
4047 }
4048
4049 /* the code reached a non block filter driver -> check if the bs is
4050 * the same as the candidate. It's the recursion termination condition.
4051 */
4052 if (!bs->drv->is_filter) {
4053 return bs == candidate;
4054 }
4055 /* Down this path the driver is a block filter driver */
4056
4057 /* If the block filter recursion method is defined use it to recurse down
4058 * the node graph.
4059 */
4060 if (bs->drv->bdrv_recurse_is_first_non_filter) {
Benoît Canet212a5a82014-01-23 21:31:36 +01004061 return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
4062 }
4063
Benoît Canetb5042a32014-03-03 19:11:34 +01004064 /* the driver is a block filter but don't allow to recurse -> return false
4065 */
4066 return false;
Benoît Canet212a5a82014-01-23 21:31:36 +01004067}
4068
4069/* This function checks if the candidate is the first non filter bs down it's
4070 * bs chain. Since we don't have pointers to parents it explore all bs chains
4071 * from the top. Some filters can choose not to pass down the recursion.
4072 */
4073bool bdrv_is_first_non_filter(BlockDriverState *candidate)
4074{
4075 BlockDriverState *bs;
4076
4077 /* walk down the bs forest recursively */
4078 QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
4079 bool perm;
4080
Benoît Canetb5042a32014-03-03 19:11:34 +01004081 /* try to recurse in this top level bs */
Kevin Wolfe6dc8a12014-02-04 11:45:31 +01004082 perm = bdrv_recurse_is_first_non_filter(bs, candidate);
Benoît Canet212a5a82014-01-23 21:31:36 +01004083
4084 /* candidate is the first non filter */
4085 if (perm) {
4086 return true;
4087 }
4088 }
4089
4090 return false;
Benoît Canetf6186f42013-10-02 14:33:48 +02004091}
Benoît Canet09158f02014-06-27 18:25:25 +02004092
Wen Congyange12f3782015-07-17 10:12:22 +08004093BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
4094 const char *node_name, Error **errp)
Benoît Canet09158f02014-06-27 18:25:25 +02004095{
4096 BlockDriverState *to_replace_bs = bdrv_find_node(node_name);
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004097 AioContext *aio_context;
4098
Benoît Canet09158f02014-06-27 18:25:25 +02004099 if (!to_replace_bs) {
4100 error_setg(errp, "Node name '%s' not found", node_name);
4101 return NULL;
4102 }
4103
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004104 aio_context = bdrv_get_aio_context(to_replace_bs);
4105 aio_context_acquire(aio_context);
4106
Benoît Canet09158f02014-06-27 18:25:25 +02004107 if (bdrv_op_is_blocked(to_replace_bs, BLOCK_OP_TYPE_REPLACE, errp)) {
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004108 to_replace_bs = NULL;
4109 goto out;
Benoît Canet09158f02014-06-27 18:25:25 +02004110 }
4111
4112 /* We don't want arbitrary node of the BDS chain to be replaced only the top
4113 * most non filter in order to prevent data corruption.
4114 * Another benefit is that this tests exclude backing files which are
4115 * blocked by the backing blockers.
4116 */
Wen Congyange12f3782015-07-17 10:12:22 +08004117 if (!bdrv_recurse_is_first_non_filter(parent_bs, to_replace_bs)) {
Benoît Canet09158f02014-06-27 18:25:25 +02004118 error_setg(errp, "Only top most non filter can be replaced");
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004119 to_replace_bs = NULL;
4120 goto out;
Benoît Canet09158f02014-06-27 18:25:25 +02004121 }
4122
Stefan Hajnoczi5a7e7a02014-10-21 12:03:58 +01004123out:
4124 aio_context_release(aio_context);
Benoît Canet09158f02014-06-27 18:25:25 +02004125 return to_replace_bs;
4126}
Ming Lei448ad912014-07-04 18:04:33 +08004127
Max Reitz91af7012014-07-18 20:24:56 +02004128static bool append_open_options(QDict *d, BlockDriverState *bs)
4129{
4130 const QDictEntry *entry;
4131 bool found_any = false;
4132
4133 for (entry = qdict_first(bs->options); entry;
4134 entry = qdict_next(bs->options, entry))
4135 {
4136 /* Only take options for this level and exclude all non-driver-specific
4137 * options */
4138 if (!strchr(qdict_entry_key(entry), '.') &&
4139 strcmp(qdict_entry_key(entry), "node-name"))
4140 {
4141 qobject_incref(qdict_entry_value(entry));
4142 qdict_put_obj(d, qdict_entry_key(entry), qdict_entry_value(entry));
4143 found_any = true;
4144 }
4145 }
4146
4147 return found_any;
4148}
4149
4150/* Updates the following BDS fields:
4151 * - exact_filename: A filename which may be used for opening a block device
4152 * which (mostly) equals the given BDS (even without any
4153 * other options; so reading and writing must return the same
4154 * results, but caching etc. may be different)
4155 * - full_open_options: Options which, when given when opening a block device
4156 * (without a filename), result in a BDS (mostly)
4157 * equalling the given one
4158 * - filename: If exact_filename is set, it is copied here. Otherwise,
4159 * full_open_options is converted to a JSON object, prefixed with
4160 * "json:" (for use through the JSON pseudo protocol) and put here.
4161 */
4162void bdrv_refresh_filename(BlockDriverState *bs)
4163{
4164 BlockDriver *drv = bs->drv;
4165 QDict *opts;
4166
4167 if (!drv) {
4168 return;
4169 }
4170
4171 /* This BDS's file name will most probably depend on its file's name, so
4172 * refresh that first */
4173 if (bs->file) {
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004174 bdrv_refresh_filename(bs->file->bs);
Max Reitz91af7012014-07-18 20:24:56 +02004175 }
4176
4177 if (drv->bdrv_refresh_filename) {
4178 /* Obsolete information is of no use here, so drop the old file name
4179 * information before refreshing it */
4180 bs->exact_filename[0] = '\0';
4181 if (bs->full_open_options) {
4182 QDECREF(bs->full_open_options);
4183 bs->full_open_options = NULL;
4184 }
4185
4186 drv->bdrv_refresh_filename(bs);
4187 } else if (bs->file) {
4188 /* Try to reconstruct valid information from the underlying file */
4189 bool has_open_options;
4190
4191 bs->exact_filename[0] = '\0';
4192 if (bs->full_open_options) {
4193 QDECREF(bs->full_open_options);
4194 bs->full_open_options = NULL;
4195 }
4196
4197 opts = qdict_new();
4198 has_open_options = append_open_options(opts, bs);
4199
4200 /* If no specific options have been given for this BDS, the filename of
4201 * the underlying file should suffice for this one as well */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004202 if (bs->file->bs->exact_filename[0] && !has_open_options) {
4203 strcpy(bs->exact_filename, bs->file->bs->exact_filename);
Max Reitz91af7012014-07-18 20:24:56 +02004204 }
4205 /* Reconstructing the full options QDict is simple for most format block
4206 * drivers, as long as the full options are known for the underlying
4207 * file BDS. The full options QDict of that file BDS should somehow
4208 * contain a representation of the filename, therefore the following
4209 * suffices without querying the (exact_)filename of this BDS. */
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004210 if (bs->file->bs->full_open_options) {
Max Reitz91af7012014-07-18 20:24:56 +02004211 qdict_put_obj(opts, "driver",
4212 QOBJECT(qstring_from_str(drv->format_name)));
Kevin Wolf9a4f4c32015-06-16 14:19:22 +02004213 QINCREF(bs->file->bs->full_open_options);
4214 qdict_put_obj(opts, "file",
4215 QOBJECT(bs->file->bs->full_open_options));
Max Reitz91af7012014-07-18 20:24:56 +02004216
4217 bs->full_open_options = opts;
4218 } else {
4219 QDECREF(opts);
4220 }
4221 } else if (!bs->full_open_options && qdict_size(bs->options)) {
4222 /* There is no underlying file BDS (at least referenced by BDS.file),
4223 * so the full options QDict should be equal to the options given
4224 * specifically for this block device when it was opened (plus the
4225 * driver specification).
4226 * Because those options don't change, there is no need to update
4227 * full_open_options when it's already set. */
4228
4229 opts = qdict_new();
4230 append_open_options(opts, bs);
4231 qdict_put_obj(opts, "driver",
4232 QOBJECT(qstring_from_str(drv->format_name)));
4233
4234 if (bs->exact_filename[0]) {
4235 /* This may not work for all block protocol drivers (some may
4236 * require this filename to be parsed), but we have to find some
4237 * default solution here, so just include it. If some block driver
4238 * does not support pure options without any filename at all or
4239 * needs some special format of the options QDict, it needs to
4240 * implement the driver-specific bdrv_refresh_filename() function.
4241 */
4242 qdict_put_obj(opts, "filename",
4243 QOBJECT(qstring_from_str(bs->exact_filename)));
4244 }
4245
4246 bs->full_open_options = opts;
4247 }
4248
4249 if (bs->exact_filename[0]) {
4250 pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
4251 } else if (bs->full_open_options) {
4252 QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
4253 snprintf(bs->filename, sizeof(bs->filename), "json:%s",
4254 qstring_get_str(json));
4255 QDECREF(json);
4256 }
4257}
Benoît Canet5366d0c2014-09-05 15:46:18 +02004258
4259/* This accessor function purpose is to allow the device models to access the
4260 * BlockAcctStats structure embedded inside a BlockDriverState without being
4261 * aware of the BlockDriverState structure layout.
4262 * It will go away when the BlockAcctStats structure will be moved inside
4263 * the device models.
4264 */
4265BlockAcctStats *bdrv_get_stats(BlockDriverState *bs)
4266{
4267 return &bs->stats;
4268}