2003-06-30 18:03:06 +08:00
|
|
|
/*
|
|
|
|
* QEMU System Emulator block driver
|
2007-09-17 05:08:06 +08:00
|
|
|
*
|
2003-06-30 18:03:06 +08:00
|
|
|
* Copyright (c) 2003 Fabrice Bellard
|
2007-09-17 05:08:06 +08:00
|
|
|
*
|
2003-06-30 18:03:06 +08:00
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
|
|
* in the Software without restriction, including without limitation the rights
|
|
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
|
|
* furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included in
|
|
|
|
* all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
* THE SOFTWARE.
|
|
|
|
*/
|
2016-01-30 01:50:05 +08:00
|
|
|
#include "qemu/osdep.h"
|
2007-11-11 10:51:17 +08:00
|
|
|
#include "qemu-common.h"
|
2010-05-23 01:15:08 +08:00
|
|
|
#include "trace.h"
|
2012-12-18 01:19:44 +08:00
|
|
|
#include "block/block_int.h"
|
|
|
|
#include "block/blockjob.h"
|
2015-03-18 01:29:20 +08:00
|
|
|
#include "qemu/error-report.h"
|
2012-12-18 01:20:00 +08:00
|
|
|
#include "qemu/module.h"
|
2015-03-18 00:22:46 +08:00
|
|
|
#include "qapi/qmp/qerror.h"
|
2015-05-08 23:49:53 +08:00
|
|
|
#include "qapi/qmp/qbool.h"
|
2012-12-18 01:19:43 +08:00
|
|
|
#include "qapi/qmp/qjson.h"
|
2014-10-07 19:59:11 +08:00
|
|
|
#include "sysemu/block-backend.h"
|
2012-12-18 01:20:04 +08:00
|
|
|
#include "sysemu/sysemu.h"
|
2012-12-18 01:20:00 +08:00
|
|
|
#include "qemu/notify.h"
|
2015-09-01 21:48:02 +08:00
|
|
|
#include "qemu/coroutine.h"
|
2014-01-24 04:31:34 +08:00
|
|
|
#include "block/qapi.h"
|
2011-09-22 04:16:47 +08:00
|
|
|
#include "qmp-commands.h"
|
2012-12-18 01:20:00 +08:00
|
|
|
#include "qemu/timer.h"
|
2014-06-18 14:43:44 +08:00
|
|
|
#include "qapi-event.h"
|
2015-06-09 00:17:45 +08:00
|
|
|
#include "block/throttle-groups.h"
|
2003-06-30 18:03:06 +08:00
|
|
|
|
2009-07-27 22:12:56 +08:00
|
|
|
#ifdef CONFIG_BSD
|
2005-04-27 05:59:26 +08:00
|
|
|
#include <sys/ioctl.h>
|
2009-09-12 15:36:22 +08:00
|
|
|
#include <sys/queue.h>
|
2009-03-08 04:06:23 +08:00
|
|
|
#ifndef __DragonFly__
|
2005-04-27 05:59:26 +08:00
|
|
|
#include <sys/disk.h>
|
|
|
|
#endif
|
2009-03-08 04:06:23 +08:00
|
|
|
#endif
|
2005-04-27 05:59:26 +08:00
|
|
|
|
2009-03-09 00:26:59 +08:00
|
|
|
#ifdef _WIN32
|
|
|
|
#include <windows.h>
|
|
|
|
#endif
|
|
|
|
|
block: Add bitmap successors
A bitmap successor is an anonymous BdrvDirtyBitmap that is intended to
be created just prior to a sensitive operation (e.g. Incremental Backup)
that can either succeed or fail, but during the course of which we still
want a bitmap tracking writes.
On creating a successor, we "freeze" the parent bitmap which prevents
its deletion, enabling, anonymization, or creating a bitmap with the
same name.
On success, the parent bitmap can "abdicate" responsibility to the
successor, which will inherit its name. The successor will have been
tracking writes during the course of the backup operation. The parent
will be safely deleted.
On failure, we can "reclaim" the successor from the parent, unifying
them such that the resulting bitmap describes all writes occurring since
the last successful backup, for instance. Reclamation will thaw the
parent, but not explicitly re-enable it.
BdrvDirtyBitmap operations that target a single bitmap are protected
by assertions that the bitmap is not frozen and/or disabled.
BdrvDirtyBitmap operations that target a group of bitmaps, such as
bdrv_{set,reset}_dirty will ignore frozen/disabled drives with a
conditional instead.
Internal functions that enable/disable dirty bitmaps have assertions
added to them to prevent modifying frozen bitmaps.
Signed-off-by: John Snow <jsnow@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Message-id: 1429314609-29776-10-git-send-email-jsnow@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-04-18 07:49:57 +08:00
|
|
|
/**
|
|
|
|
* A BdrvDirtyBitmap can be in three possible states:
|
|
|
|
* (1) successor is NULL and disabled is false: full r/w mode
|
|
|
|
* (2) successor is NULL and disabled is true: read only mode ("disabled")
|
|
|
|
* (3) successor is set: frozen mode.
|
|
|
|
* A frozen bitmap cannot be renamed, deleted, anonymized, cleared, set,
|
|
|
|
* or enabled. A frozen bitmap can only abdicate() or reclaim().
|
|
|
|
*/
|
2013-11-13 18:29:43 +08:00
|
|
|
struct BdrvDirtyBitmap {
|
2015-04-18 07:50:01 +08:00
|
|
|
HBitmap *bitmap; /* Dirty sector bitmap implementation */
|
|
|
|
BdrvDirtyBitmap *successor; /* Anonymous child; implies frozen status */
|
|
|
|
char *name; /* Optional non-empty unique ID */
|
|
|
|
int64_t size; /* Size of the bitmap (Number of sectors) */
|
|
|
|
bool disabled; /* Bitmap is read-only */
|
2013-11-13 18:29:43 +08:00
|
|
|
QLIST_ENTRY(BdrvDirtyBitmap) list;
|
|
|
|
};
|
|
|
|
|
2011-10-13 20:08:22 +08:00
|
|
|
#define NOT_DONE 0x7fffffff /* used while emulated sync operation in progress */
|
|
|
|
|
2015-10-27 04:39:06 +08:00
|
|
|
struct BdrvStates bdrv_states = QTAILQ_HEAD_INITIALIZER(bdrv_states);
|
2008-09-18 03:04:14 +08:00
|
|
|
|
2014-01-24 04:31:32 +08:00
|
|
|
static QTAILQ_HEAD(, BlockDriverState) graph_bdrv_states =
|
|
|
|
QTAILQ_HEAD_INITIALIZER(graph_bdrv_states);
|
|
|
|
|
2016-01-29 23:36:11 +08:00
|
|
|
static QTAILQ_HEAD(, BlockDriverState) all_bdrv_states =
|
|
|
|
QTAILQ_HEAD_INITIALIZER(all_bdrv_states);
|
|
|
|
|
2010-04-13 17:29:33 +08:00
|
|
|
static QLIST_HEAD(, BlockDriver) bdrv_drivers =
|
|
|
|
QLIST_HEAD_INITIALIZER(bdrv_drivers);
|
2004-08-02 05:59:26 +08:00
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
|
|
|
|
const char *reference, QDict *options, int flags,
|
|
|
|
BlockDriverState *parent,
|
2015-08-27 01:47:50 +08:00
|
|
|
const BdrvChildRole *child_role, Error **errp);
|
2015-04-08 19:43:47 +08:00
|
|
|
|
2015-04-18 07:50:03 +08:00
|
|
|
static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs);
|
2016-01-29 23:36:01 +08:00
|
|
|
static void bdrv_release_named_dirty_bitmaps(BlockDriverState *bs);
|
|
|
|
|
2009-10-28 01:41:44 +08:00
|
|
|
/* If non-zero, use only whitelisted block drivers */
|
|
|
|
static int use_bdrv_whitelist;
|
|
|
|
|
2016-01-29 23:36:10 +08:00
|
|
|
static void bdrv_close(BlockDriverState *bs);
|
|
|
|
|
2010-12-09 19:53:00 +08:00
|
|
|
#ifdef _WIN32
|
|
|
|
/*
 * Return non-zero if @filename starts with a drive specification, i.e. an
 * ASCII letter immediately followed by a colon (for example "c:").
 * The second character is only inspected when the first one is a letter.
 */
static int is_windows_drive_prefix(const char *filename)
{
    const char letter = filename[0];
    int is_lower = (letter >= 'a' && letter <= 'z');
    int is_upper = (letter >= 'A' && letter <= 'Z');

    if (!is_lower && !is_upper) {
        return 0;
    }
    return filename[1] == ':';
}
|
|
|
|
|
|
|
|
/*
 * Return 1 if @filename names a Windows drive or device rather than a
 * regular file path, 0 otherwise.
 */
int is_windows_drive(const char *filename)
{
    /* A bare drive specification: exactly "<letter>:" and nothing more */
    if (is_windows_drive_prefix(filename) && filename[2] == '\0') {
        return 1;
    }

    /* Device namespace prefix, written with backslashes or with slashes */
    return strstart(filename, "\\\\.\\", NULL) ||
           strstart(filename, "//./", NULL);
}
|
|
|
|
#endif
|
|
|
|
|
2013-11-28 17:23:32 +08:00
|
|
|
/*
 * Return the optimal memory alignment for I/O buffers used with @bs.
 *
 * When @bs is NULL or has no driver attached, fall back to
 * MAX(4096, page size).
 */
size_t bdrv_opt_mem_align(BlockDriverState *bs)
{
    if (bs && bs->drv) {
        return bs->bl.opt_mem_alignment;
    }

    /* page size or 4k (hdd sector size) should be on the safe side */
    return MAX(4096, getpagesize());
}
|
|
|
|
|
2015-05-12 22:30:55 +08:00
|
|
|
/*
 * Return the minimum memory alignment required for I/O buffers used
 * with @bs.
 *
 * When @bs is NULL or has no driver attached, fall back to
 * MAX(4096, page size).
 */
size_t bdrv_min_mem_align(BlockDriverState *bs)
{
    if (bs && bs->drv) {
        return bs->bl.min_mem_alignment;
    }

    /* page size or 4k (hdd sector size) should be on the safe side */
    return MAX(4096, getpagesize());
}
|
|
|
|
|
2010-12-09 19:53:00 +08:00
|
|
|
/*
 * Check whether @path starts with "<protocol>:", i.e. whether a colon
 * occurs before the first path separator.
 *
 * On Windows, drive specifications and device names are never treated as
 * protocols, and a backslash counts as a path separator as well.
 *
 * Returns 1 if a protocol prefix is present, 0 otherwise.
 */
int path_has_protocol(const char *path)
{
    const char *first_delim;
#ifdef _WIN32
    const char *delimiters = ":/\\";

    if (is_windows_drive(path) ||
        is_windows_drive_prefix(path)) {
        return 0;
    }
#else
    const char *delimiters = ":/";
#endif

    /* Points at the first delimiter, or at the terminating NUL if none */
    first_delim = path + strcspn(path, delimiters);

    return *first_delim == ':';
}
|
|
|
|
|
2006-08-02 00:21:11 +08:00
|
|
|
/*
 * Return 1 if @path is absolute, 0 otherwise.
 *
 * A path is absolute when it starts with '/'.  On Windows, a leading
 * backslash, a drive prefix, or a device name also makes it absolute.
 */
int path_is_absolute(const char *path)
{
#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (is_windows_drive(path) || is_windows_drive_prefix(path)) {
        return 1;
    }
    if (path[0] == '\\') {
        return 1;
    }
#endif
    return path[0] == '/';
}
|
|
|
|
|
2006-08-02 00:21:11 +08:00
|
|
|
/*
 * Build in @dest (a buffer of @dest_size bytes) the path of @filename
 * interpreted relative to @base_path.
 *
 * An absolute @filename is copied to @dest as is.  Otherwise the leading
 * part of @base_path, up to and including its last directory separator
 * or its first ':' (whichever lies further right), is copied and
 * @filename is appended to it.  URLs are supported.  Nothing is written
 * when @dest_size is not positive.
 */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
{
    const char *after_colon, *after_sep, *prefix_end;
    int prefix_len;

    if (dest_size <= 0) {
        return;
    }
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
        return;
    }

    /* Position just past the first ':' of the base, if there is one */
    after_colon = strchr(base_path, ':');
    after_colon = after_colon ? after_colon + 1 : base_path;

    /* Position just past the last directory separator, if there is one */
    after_sep = strrchr(base_path, '/');
#ifdef _WIN32
    {
        const char *backslash = strrchr(base_path, '\\');

        if (!after_sep || backslash > after_sep) {
            after_sep = backslash;
        }
    }
#endif
    after_sep = after_sep ? after_sep + 1 : base_path;

    /* Keep whichever prefix reaches further into base_path */
    prefix_end = (after_sep > after_colon) ? after_sep : after_colon;

    prefix_len = prefix_end - base_path;
    if (prefix_len > dest_size - 1) {
        /* Truncate so that the terminating NUL still fits */
        prefix_len = dest_size - 1;
    }
    memcpy(dest, base_path, prefix_len);
    dest[prefix_len] = '\0';
    pstrcat(dest, dest_size, filename);
}
|
|
|
|
|
2014-11-27 00:20:25 +08:00
|
|
|
void bdrv_get_full_backing_filename_from_filename(const char *backed,
|
|
|
|
const char *backing,
|
2014-11-27 00:20:26 +08:00
|
|
|
char *dest, size_t sz,
|
|
|
|
Error **errp)
|
2012-05-08 22:51:50 +08:00
|
|
|
{
|
2014-11-27 00:20:26 +08:00
|
|
|
if (backing[0] == '\0' || path_has_protocol(backing) ||
|
|
|
|
path_is_absolute(backing))
|
|
|
|
{
|
2014-11-27 00:20:25 +08:00
|
|
|
pstrcpy(dest, sz, backing);
|
2014-11-27 00:20:26 +08:00
|
|
|
} else if (backed[0] == '\0' || strstart(backed, "json:", NULL)) {
|
|
|
|
error_setg(errp, "Cannot use relative backing file names for '%s'",
|
|
|
|
backed);
|
2012-05-08 22:51:50 +08:00
|
|
|
} else {
|
2014-11-27 00:20:25 +08:00
|
|
|
path_combine(dest, sz, backed, backing);
|
2012-05-08 22:51:50 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-11-27 00:20:26 +08:00
|
|
|
void bdrv_get_full_backing_filename(BlockDriverState *bs, char *dest, size_t sz,
|
|
|
|
Error **errp)
|
2014-11-27 00:20:25 +08:00
|
|
|
{
|
2014-11-27 00:20:26 +08:00
|
|
|
char *backed = bs->exact_filename[0] ? bs->exact_filename : bs->filename;
|
|
|
|
|
|
|
|
bdrv_get_full_backing_filename_from_filename(backed, bs->backing_file,
|
|
|
|
dest, sz, errp);
|
2014-11-27 00:20:25 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:51 +08:00
|
|
|
/*
 * Register block driver @bdrv: set up its I/O functions and insert it at
 * the head of the list of known drivers.
 */
void bdrv_register(BlockDriver *bdrv)
{
    bdrv_setup_io_funcs(bdrv);

    QLIST_INSERT_HEAD(&bdrv_drivers, bdrv, list);
}
|
2004-03-15 05:38:54 +08:00
|
|
|
|
2014-10-07 19:59:12 +08:00
|
|
|
BlockDriverState *bdrv_new_root(void)
|
2004-03-15 05:38:54 +08:00
|
|
|
{
|
2014-10-07 19:59:12 +08:00
|
|
|
BlockDriverState *bs = bdrv_new();
|
2014-10-07 19:59:03 +08:00
|
|
|
|
|
|
|
QTAILQ_INSERT_TAIL(&bdrv_states, bs, device_list);
|
|
|
|
return bs;
|
|
|
|
}
|
|
|
|
|
|
|
|
BlockDriverState *bdrv_new(void)
|
|
|
|
{
|
|
|
|
BlockDriverState *bs;
|
|
|
|
int i;
|
|
|
|
|
block: Use g_new() & friends where that makes obvious sense
g_new(T, n) is neater than g_malloc(sizeof(T) * n). It's also safer,
for two reasons. One, it catches multiplication overflowing size_t.
Two, it returns T * rather than void *, which lets the compiler catch
more type errors.
Patch created with Coccinelle, with two manual changes on top:
* Add const to bdrv_iterate_format() to keep the types straight
* Convert the allocation in bdrv_drop_intermediate(), which Coccinelle
inexplicably misses
Coccinelle semantic patch:
@@
type T;
@@
-g_malloc(sizeof(T))
+g_new(T, 1)
@@
type T;
@@
-g_try_malloc(sizeof(T))
+g_try_new(T, 1)
@@
type T;
@@
-g_malloc0(sizeof(T))
+g_new0(T, 1)
@@
type T;
@@
-g_try_malloc0(sizeof(T))
+g_try_new0(T, 1)
@@
type T;
expression n;
@@
-g_malloc(sizeof(T) * (n))
+g_new(T, n)
@@
type T;
expression n;
@@
-g_try_malloc(sizeof(T) * (n))
+g_try_new(T, n)
@@
type T;
expression n;
@@
-g_malloc0(sizeof(T) * (n))
+g_new0(T, n)
@@
type T;
expression n;
@@
-g_try_malloc0(sizeof(T) * (n))
+g_try_new0(T, n)
@@
type T;
expression p, n;
@@
-g_realloc(p, sizeof(T) * (n))
+g_renew(T, p, n)
@@
type T;
expression p, n;
@@
-g_try_realloc(p, sizeof(T) * (n))
+g_try_renew(T, p, n)
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Jeff Cody <jcody@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2014-08-19 16:31:08 +08:00
|
|
|
bs = g_new0(BlockDriverState, 1);
|
2013-11-13 18:29:43 +08:00
|
|
|
QLIST_INIT(&bs->dirty_bitmaps);
|
2014-05-23 21:29:42 +08:00
|
|
|
for (i = 0; i < BLOCK_OP_TYPE_MAX; i++) {
|
|
|
|
QLIST_INIT(&bs->op_blockers[i]);
|
|
|
|
}
|
2013-06-24 23:13:10 +08:00
|
|
|
notifier_with_return_list_init(&bs->before_write_notifiers);
|
2013-09-02 20:14:39 +08:00
|
|
|
qemu_co_queue_init(&bs->throttled_reqs[0]);
|
|
|
|
qemu_co_queue_init(&bs->throttled_reqs[1]);
|
2013-08-23 09:14:46 +08:00
|
|
|
bs->refcnt = 1;
|
2014-05-08 22:34:37 +08:00
|
|
|
bs->aio_context = qemu_get_aio_context();
|
2012-08-23 17:20:36 +08:00
|
|
|
|
2016-01-29 23:36:11 +08:00
|
|
|
QTAILQ_INSERT_TAIL(&all_bdrv_states, bs, bs_list);
|
|
|
|
|
2004-03-15 05:38:54 +08:00
|
|
|
return bs;
|
|
|
|
}
|
|
|
|
|
2004-08-02 05:59:26 +08:00
|
|
|
BlockDriver *bdrv_find_format(const char *format_name)
|
|
|
|
{
|
|
|
|
BlockDriver *drv1;
|
2010-04-13 17:29:33 +08:00
|
|
|
QLIST_FOREACH(drv1, &bdrv_drivers, list) {
|
|
|
|
if (!strcmp(drv1->format_name, format_name)) {
|
2004-08-02 05:59:26 +08:00
|
|
|
return drv1;
|
2010-04-13 17:29:33 +08:00
|
|
|
}
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2013-05-29 19:35:40 +08:00
|
|
|
/*
 * Check @drv against the build-time driver whitelists.
 *
 * Returns 1 if both whitelists are empty, if the driver's format name is
 * on the read-write whitelist, or if @read_only is set and the name is on
 * the read-only whitelist.  Returns 0 otherwise.
 */
static int bdrv_is_whitelisted(BlockDriver *drv, bool read_only)
{
    static const char *whitelist_rw[] = {
        CONFIG_BDRV_RW_WHITELIST
    };
    static const char *whitelist_ro[] = {
        CONFIG_BDRV_RO_WHITELIST
    };
    const char **lists[2];
    const char **entry;
    int i;

    if (!whitelist_rw[0] && !whitelist_ro[0]) {
        return 1;               /* no whitelist, anything goes */
    }

    /* The read-only list is consulted only for read-only use, and only
     * after the read-write list */
    lists[0] = whitelist_rw;
    lists[1] = read_only ? whitelist_ro : NULL;

    for (i = 0; i < 2; i++) {
        for (entry = lists[i]; entry && *entry; entry++) {
            if (strcmp(drv->format_name, *entry) == 0) {
                return 1;
            }
        }
    }

    return 0;
}
|
|
|
|
|
2012-05-07 16:50:42 +08:00
|
|
|
typedef struct CreateCo {
|
|
|
|
BlockDriver *drv;
|
|
|
|
char *filename;
|
2014-06-05 17:20:51 +08:00
|
|
|
QemuOpts *opts;
|
2012-05-07 16:50:42 +08:00
|
|
|
int ret;
|
2013-09-06 23:14:26 +08:00
|
|
|
Error *err;
|
2012-05-07 16:50:42 +08:00
|
|
|
} CreateCo;
|
|
|
|
|
|
|
|
/*
 * Coroutine entry point for image creation.
 *
 * @opaque points to a CreateCo.  The driver's bdrv_create callback is
 * invoked; any error it reports is propagated into the CreateCo's err
 * field and its return value is stored in the ret field.
 */
static void coroutine_fn bdrv_create_co_entry(void *opaque)
{
    CreateCo *cco = opaque;
    Error *create_err = NULL;
    int result;

    assert(cco->drv);

    result = cco->drv->bdrv_create(cco->filename, cco->opts, &create_err);
    if (create_err) {
        error_propagate(&cco->err, create_err);
    }

    /* Stored last: bdrv_create() polls on this field to detect completion */
    cco->ret = result;
}
|
|
|
|
|
2009-05-18 22:42:10 +08:00
|
|
|
int bdrv_create(BlockDriver *drv, const char* filename,
|
2014-06-05 17:20:51 +08:00
|
|
|
QemuOpts *opts, Error **errp)
|
2004-08-02 05:59:26 +08:00
|
|
|
{
|
2012-05-07 16:50:42 +08:00
|
|
|
int ret;
|
|
|
|
|
|
|
|
Coroutine *co;
|
|
|
|
CreateCo cco = {
|
|
|
|
.drv = drv,
|
|
|
|
.filename = g_strdup(filename),
|
2014-06-05 17:20:51 +08:00
|
|
|
.opts = opts,
|
2012-05-07 16:50:42 +08:00
|
|
|
.ret = NOT_DONE,
|
2013-09-06 23:14:26 +08:00
|
|
|
.err = NULL,
|
2012-05-07 16:50:42 +08:00
|
|
|
};
|
|
|
|
|
2014-06-05 17:21:11 +08:00
|
|
|
if (!drv->bdrv_create) {
|
2013-09-06 23:14:26 +08:00
|
|
|
error_setg(errp, "Driver '%s' does not support image creation", drv->format_name);
|
2012-10-18 03:45:25 +08:00
|
|
|
ret = -ENOTSUP;
|
|
|
|
goto out;
|
2012-05-07 16:50:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (qemu_in_coroutine()) {
|
|
|
|
/* Fast-path if already in coroutine context */
|
|
|
|
bdrv_create_co_entry(&cco);
|
|
|
|
} else {
|
|
|
|
co = qemu_coroutine_create(bdrv_create_co_entry);
|
|
|
|
qemu_coroutine_enter(co, &cco);
|
|
|
|
while (cco.ret == NOT_DONE) {
|
2014-07-07 21:18:01 +08:00
|
|
|
aio_poll(qemu_get_aio_context(), true);
|
2012-05-07 16:50:42 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = cco.ret;
|
2013-09-06 23:14:26 +08:00
|
|
|
if (ret < 0) {
|
2014-01-30 22:07:28 +08:00
|
|
|
if (cco.err) {
|
2013-09-06 23:14:26 +08:00
|
|
|
error_propagate(errp, cco.err);
|
|
|
|
} else {
|
|
|
|
error_setg_errno(errp, -ret, "Could not create image");
|
|
|
|
}
|
|
|
|
}
|
2009-05-18 22:42:10 +08:00
|
|
|
|
2012-10-18 03:45:25 +08:00
|
|
|
out:
|
|
|
|
g_free(cco.filename);
|
2012-05-07 16:50:42 +08:00
|
|
|
return ret;
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
|
|
|
|
2014-06-05 17:21:11 +08:00
|
|
|
/*
 * Create the image @filename using the protocol driver selected by
 * bdrv_find_protocol().
 *
 * Returns -ENOENT if no protocol driver is found (bdrv_find_protocol() is
 * given @errp for its own error reporting), otherwise the result of
 * bdrv_create(), whose error, if any, is propagated to @errp.
 */
int bdrv_create_file(const char *filename, QemuOpts *opts, Error **errp)
{
    Error *create_err = NULL;
    BlockDriver *proto_drv;
    int ret;

    proto_drv = bdrv_find_protocol(filename, true, errp);
    if (!proto_drv) {
        return -ENOENT;
    }

    ret = bdrv_create(proto_drv, filename, opts, &create_err);
    if (create_err) {
        error_propagate(errp, create_err);
    }

    return ret;
}
|
|
|
|
|
2015-02-16 19:47:54 +08:00
|
|
|
/**
|
|
|
|
* Try to get @bs's logical and physical block size.
|
|
|
|
* On success, store them in @bsz struct and return 0.
|
|
|
|
* On failure return -errno.
|
|
|
|
* @bs must not be empty.
|
|
|
|
*/
|
|
|
|
int bdrv_probe_blocksizes(BlockDriverState *bs, BlockSizes *bsz)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
|
|
|
|
if (drv && drv->bdrv_probe_blocksizes) {
|
|
|
|
return drv->bdrv_probe_blocksizes(bs, bsz);
|
|
|
|
}
|
|
|
|
|
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Try to get @bs's geometry (cyls, heads, sectors).
|
|
|
|
* On success, store them in @geo struct and return 0.
|
|
|
|
* On failure return -errno.
|
|
|
|
* @bs must not be empty.
|
|
|
|
*/
|
|
|
|
int bdrv_probe_geometry(BlockDriverState *bs, HDGeometry *geo)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
|
|
|
|
if (drv && drv->bdrv_probe_geometry) {
|
|
|
|
return drv->bdrv_probe_geometry(bs, geo);
|
|
|
|
}
|
|
|
|
|
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
|
|
|
|
2012-05-28 15:27:54 +08:00
|
|
|
/*
 * Create a uniquely-named empty temporary file.
 *
 * @filename: buffer that receives the name of the created file
 * @size:     size of @filename in bytes (must be at least MAX_PATH on
 *            Windows)
 *
 * On POSIX hosts the file is created in $TMPDIR, or in /var/tmp when
 * TMPDIR is not set.
 *
 * Return 0 upon success, otherwise a negative errno value (-EOVERFLOW if
 * the generated name does not fit into @filename).
 */
int get_tmp_filename(char *filename, int size)
{
#ifdef _WIN32
    char temp_dir[MAX_PATH];
    /* GetTempFileName requires that its output buffer (4th param)
       have length MAX_PATH or greater.  */
    assert(size >= MAX_PATH);
    return (GetTempPath(MAX_PATH, temp_dir)
            && GetTempFileName(temp_dir, "qem", 0, filename)
            ? 0 : -GetLastError());
#else
    int fd;
    int saved_errno;
    const char *tmpdir;

    tmpdir = getenv("TMPDIR");
    if (!tmpdir) {
        tmpdir = "/var/tmp";
    }
    if (snprintf(filename, size, "%s/vl.XXXXXX", tmpdir) >= size) {
        return -EOVERFLOW;
    }
    fd = mkstemp(filename);
    if (fd < 0) {
        return -errno;
    }
    if (close(fd) != 0) {
        /* Capture the close() error first: unlink() may overwrite errno */
        saved_errno = errno;
        unlink(filename);
        return -saved_errno;
    }
    return 0;
#endif
}
|
2003-06-30 18:03:06 +08:00
|
|
|
|
2010-04-08 04:30:24 +08:00
|
|
|
/*
|
|
|
|
* Detect host devices. By convention, /dev/cdrom[N] is always
|
|
|
|
* recognized as a host CDROM.
|
|
|
|
*/
|
|
|
|
static BlockDriver *find_hdev_driver(const char *filename)
|
|
|
|
{
|
|
|
|
int score_max = 0, score;
|
|
|
|
BlockDriver *drv = NULL, *d;
|
|
|
|
|
|
|
|
QLIST_FOREACH(d, &bdrv_drivers, list) {
|
|
|
|
if (d->bdrv_probe_device) {
|
|
|
|
score = d->bdrv_probe_device(filename);
|
|
|
|
if (score > score_max) {
|
|
|
|
score_max = score;
|
|
|
|
drv = d;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return drv;
|
|
|
|
}
|
|
|
|
|
2013-07-10 21:47:39 +08:00
|
|
|
BlockDriver *bdrv_find_protocol(const char *filename,
|
2015-02-06 02:58:12 +08:00
|
|
|
bool allow_protocol_prefix,
|
|
|
|
Error **errp)
|
2006-08-02 00:21:11 +08:00
|
|
|
{
|
|
|
|
BlockDriver *drv1;
|
|
|
|
char protocol[128];
|
2009-07-02 21:12:26 +08:00
|
|
|
int len;
|
2006-08-02 00:21:11 +08:00
|
|
|
const char *p;
|
2006-08-19 19:45:59 +08:00
|
|
|
|
2010-04-14 20:17:38 +08:00
|
|
|
/* TODO Drivers without bdrv_file_open must be specified explicitly */
|
|
|
|
|
2010-06-23 18:25:17 +08:00
|
|
|
/*
|
|
|
|
* XXX(hch): we really should not let host device detection
|
|
|
|
* override an explicit protocol specification, but moving this
|
|
|
|
* later breaks access to device names with colons in them.
|
|
|
|
* Thanks to the brain-dead persistent naming schemes on udev-
|
|
|
|
* based Linux systems those actually are quite common.
|
|
|
|
*/
|
|
|
|
drv1 = find_hdev_driver(filename);
|
|
|
|
if (drv1) {
|
|
|
|
return drv1;
|
|
|
|
}
|
|
|
|
|
2013-07-10 21:47:39 +08:00
|
|
|
if (!path_has_protocol(filename) || !allow_protocol_prefix) {
|
2014-12-03 01:32:42 +08:00
|
|
|
return &bdrv_file;
|
2010-04-08 04:30:24 +08:00
|
|
|
}
|
2013-07-10 21:47:39 +08:00
|
|
|
|
2010-12-09 19:53:00 +08:00
|
|
|
p = strchr(filename, ':');
|
|
|
|
assert(p != NULL);
|
2009-07-02 21:12:26 +08:00
|
|
|
len = p - filename;
|
|
|
|
if (len > sizeof(protocol) - 1)
|
|
|
|
len = sizeof(protocol) - 1;
|
|
|
|
memcpy(protocol, filename, len);
|
|
|
|
protocol[len] = '\0';
|
2010-04-13 17:29:33 +08:00
|
|
|
QLIST_FOREACH(drv1, &bdrv_drivers, list) {
|
2007-09-17 05:08:06 +08:00
|
|
|
if (drv1->protocol_name &&
|
2010-04-13 17:29:33 +08:00
|
|
|
!strcmp(drv1->protocol_name, protocol)) {
|
2006-08-02 00:21:11 +08:00
|
|
|
return drv1;
|
2010-04-13 17:29:33 +08:00
|
|
|
}
|
2006-08-02 00:21:11 +08:00
|
|
|
}
|
2015-02-06 02:58:12 +08:00
|
|
|
|
|
|
|
error_setg(errp, "Unknown protocol '%s'", protocol);
|
2006-08-02 00:21:11 +08:00
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2014-11-20 23:27:10 +08:00
|
|
|
/*
|
|
|
|
* Guess image format by probing its contents.
|
|
|
|
* This is not a good idea when your image is raw (CVE-2008-2004), but
|
|
|
|
* we do it anyway for backward compatibility.
|
|
|
|
*
|
|
|
|
* @buf contains the image's first @buf_size bytes.
|
2014-11-20 23:27:11 +08:00
|
|
|
* @buf_size is the buffer size in bytes (generally BLOCK_PROBE_BUF_SIZE,
|
|
|
|
* but can be smaller if the image file is smaller)
|
2014-11-20 23:27:10 +08:00
|
|
|
* @filename is its filename.
|
|
|
|
*
|
|
|
|
* For all block drivers, call the bdrv_probe() method to get its
|
|
|
|
* probing score.
|
|
|
|
* Return the first block driver with the highest probing score.
|
|
|
|
*/
|
raw: Prohibit dangerous writes for probed images
If the user neglects to specify the image format, QEMU probes the
image to guess it automatically, for convenience.
Relying on format probing is insecure for raw images (CVE-2008-2004).
If the guest writes a suitable header to the device, the next probe
will recognize a format chosen by the guest. A malicious guest can
abuse this to gain access to host files, e.g. by crafting a QCOW2
header with backing file /etc/shadow.
Commit 1e72d3b (April 2008) provided -drive parameter format to let
users disable probing. Commit f965509 (March 2009) extended QCOW2 to
optionally store the backing file format, to let users disable backing
file probing. QED has had a flag to suppress probing since the
beginning (2010), set whenever a raw backing file is assigned.
All of these additions that allow to avoid format probing have to be
specified explicitly. The default still allows the attack.
In order to fix this, commit 79368c8 (July 2010) put probed raw images
in a restricted mode, in which they wouldn't be able to overwrite the
first few bytes of the image so that they would identify as a different
image. If a write to the first sector would write one of the signatures
of another driver, qemu would instead zero out the first four bytes.
This patch was later reverted in commit 8b33d9e (September 2010) because
it didn't get the handling of unaligned qiov members right.
Today's block layer that is based on coroutines and has qiov utility
functions makes it much easier to get this functionality right, so this
patch implements it.
The other differences of this patch to the old one are that it doesn't
silently write something different than the guest requested by zeroing
out some bytes (it fails the request instead) and that it doesn't
maintain a list of signatures in the raw driver (it calls the usual
probe function instead).
Note that this change doesn't introduce new breakage for false positive
cases where the guest legitimately writes data into the first sector
that matches the signatures of an image format (e.g. for nested virt):
These cases were broken before, only the failure mode changes from
corruption after the next restart (when the wrong format is probed) to
failing the problematic write request.
Also note that like in the original patch, the restrictions only apply
if the image format has been guessed by probing. Explicitly specifying a
format allows guests to write anything they like.
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Message-id: 1416497234-29880-8-git-send-email-kwolf@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2014-11-20 23:27:12 +08:00
|
|
|
BlockDriver *bdrv_probe_all(const uint8_t *buf, int buf_size,
|
|
|
|
const char *filename)
|
2014-11-20 23:27:10 +08:00
|
|
|
{
|
|
|
|
int score_max = 0, score;
|
|
|
|
BlockDriver *drv = NULL, *d;
|
|
|
|
|
|
|
|
QLIST_FOREACH(d, &bdrv_drivers, list) {
|
|
|
|
if (d->bdrv_probe) {
|
|
|
|
score = d->bdrv_probe(buf, buf_size, filename);
|
|
|
|
if (score > score_max) {
|
|
|
|
score_max = score;
|
|
|
|
drv = d;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return drv;
|
|
|
|
}
|
|
|
|
|
2012-11-13 00:35:27 +08:00
|
|
|
static int find_image_format(BlockDriverState *bs, const char *filename,
|
2013-09-05 20:45:29 +08:00
|
|
|
BlockDriver **pdrv, Error **errp)
|
2009-06-15 19:55:19 +08:00
|
|
|
{
|
2014-11-20 23:27:10 +08:00
|
|
|
BlockDriver *drv;
|
2014-11-20 23:27:11 +08:00
|
|
|
uint8_t buf[BLOCK_PROBE_BUF_SIZE];
|
2012-11-13 00:35:27 +08:00
|
|
|
int ret = 0;
|
2010-05-18 00:45:57 +08:00
|
|
|
|
2010-06-02 00:37:31 +08:00
|
|
|
/* Return the raw BlockDriver * to scsi-generic devices or empty drives */
|
2015-06-23 18:44:56 +08:00
|
|
|
if (bdrv_is_sg(bs) || !bdrv_is_inserted(bs) || bdrv_getlength(bs) == 0) {
|
2014-12-03 01:32:42 +08:00
|
|
|
*pdrv = &bdrv_raw;
|
2010-07-22 03:51:51 +08:00
|
|
|
return ret;
|
2010-05-27 23:56:28 +08:00
|
|
|
}
|
2010-05-18 00:45:57 +08:00
|
|
|
|
2006-08-02 00:21:11 +08:00
|
|
|
ret = bdrv_pread(bs, 0, buf, sizeof(buf));
|
|
|
|
if (ret < 0) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_setg_errno(errp, -ret, "Could not read image for determining its "
|
|
|
|
"format");
|
2010-07-22 03:51:51 +08:00
|
|
|
*pdrv = NULL;
|
|
|
|
return ret;
|
2006-08-02 00:21:11 +08:00
|
|
|
}
|
|
|
|
|
2014-11-20 23:27:10 +08:00
|
|
|
drv = bdrv_probe_all(buf, ret, filename);
|
2010-07-22 03:51:51 +08:00
|
|
|
if (!drv) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_setg(errp, "Could not determine image format: No compatible "
|
|
|
|
"driver found");
|
2010-07-22 03:51:51 +08:00
|
|
|
ret = -ENOENT;
|
|
|
|
}
|
|
|
|
*pdrv = drv;
|
|
|
|
return ret;
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
|
|
|
|
2010-04-19 23:56:41 +08:00
|
|
|
/**
|
|
|
|
* Set the current 'total_sectors' value
|
2014-06-26 19:23:17 +08:00
|
|
|
* Return 0 on success, -errno on error.
|
2010-04-19 23:56:41 +08:00
|
|
|
*/
|
|
|
|
static int refresh_total_sectors(BlockDriverState *bs, int64_t hint)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
|
2010-05-18 00:46:04 +08:00
|
|
|
/* Do not attempt drv->bdrv_getlength() on scsi-generic devices */
|
2015-06-23 18:44:56 +08:00
|
|
|
if (bdrv_is_sg(bs))
|
2010-05-18 00:46:04 +08:00
|
|
|
return 0;
|
|
|
|
|
2010-04-19 23:56:41 +08:00
|
|
|
/* query actual device if possible, otherwise just trust the hint */
|
|
|
|
if (drv->bdrv_getlength) {
|
|
|
|
int64_t length = drv->bdrv_getlength(bs);
|
|
|
|
if (length < 0) {
|
|
|
|
return length;
|
|
|
|
}
|
2013-11-06 19:48:06 +08:00
|
|
|
hint = DIV_ROUND_UP(length, BDRV_SECTOR_SIZE);
|
2010-04-19 23:56:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bs->total_sectors = hint;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2015-11-16 23:43:27 +08:00
|
|
|
/**
|
|
|
|
* Combines a QDict of new block driver @options with any missing options taken
|
|
|
|
* from @old_options, so that leaving out an option defaults to its old value.
|
|
|
|
*/
|
|
|
|
static void bdrv_join_options(BlockDriverState *bs, QDict *options,
|
|
|
|
QDict *old_options)
|
|
|
|
{
|
|
|
|
if (bs->drv && bs->drv->bdrv_join_options) {
|
|
|
|
bs->drv->bdrv_join_options(options, old_options);
|
|
|
|
} else {
|
|
|
|
qdict_join(options, old_options, false);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-02-08 21:06:11 +08:00
|
|
|
/**
|
|
|
|
* Set open flags for a given discard mode
|
|
|
|
*
|
|
|
|
* Return 0 on success, -1 if the discard mode was invalid.
|
|
|
|
*/
|
|
|
|
int bdrv_parse_discard_flags(const char *mode, int *flags)
|
|
|
|
{
|
|
|
|
*flags &= ~BDRV_O_UNMAP;
|
|
|
|
|
|
|
|
if (!strcmp(mode, "off") || !strcmp(mode, "ignore")) {
|
|
|
|
/* do nothing */
|
|
|
|
} else if (!strcmp(mode, "on") || !strcmp(mode, "unmap")) {
|
|
|
|
*flags |= BDRV_O_UNMAP;
|
|
|
|
} else {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-08-04 19:26:51 +08:00
|
|
|
/**
|
|
|
|
* Set open flags for a given cache mode
|
|
|
|
*
|
|
|
|
* Return 0 on success, -1 if the cache mode was invalid.
|
|
|
|
*/
|
|
|
|
int bdrv_parse_cache_flags(const char *mode, int *flags)
|
|
|
|
{
|
|
|
|
*flags &= ~BDRV_O_CACHE_MASK;
|
|
|
|
|
|
|
|
if (!strcmp(mode, "off") || !strcmp(mode, "none")) {
|
|
|
|
*flags |= BDRV_O_NOCACHE | BDRV_O_CACHE_WB;
|
2011-08-04 19:26:52 +08:00
|
|
|
} else if (!strcmp(mode, "directsync")) {
|
|
|
|
*flags |= BDRV_O_NOCACHE;
|
2011-08-04 19:26:51 +08:00
|
|
|
} else if (!strcmp(mode, "writeback")) {
|
|
|
|
*flags |= BDRV_O_CACHE_WB;
|
|
|
|
} else if (!strcmp(mode, "unsafe")) {
|
|
|
|
*flags |= BDRV_O_CACHE_WB;
|
|
|
|
*flags |= BDRV_O_NO_FLUSH;
|
|
|
|
} else if (!strcmp(mode, "writethrough")) {
|
|
|
|
/* this is the default */
|
|
|
|
} else {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2014-05-06 18:11:42 +08:00
|
|
|
/*
|
|
|
|
* Returns the flags that a temporary snapshot should get, based on the
|
|
|
|
* originally requested flags (the originally requested image will have flags
|
|
|
|
* like a backing file)
|
|
|
|
*/
|
|
|
|
static int bdrv_temp_snapshot_flags(int flags)
|
|
|
|
{
|
|
|
|
return (flags & ~BDRV_O_SNAPSHOT) | BDRV_O_TEMPORARY;
|
|
|
|
}
|
|
|
|
|
2014-04-12 03:29:52 +08:00
|
|
|
/*
|
2015-04-29 23:29:39 +08:00
|
|
|
* Returns the options and flags that bs->file should get if a protocol driver
|
|
|
|
* is expected, based on the given options and flags for the parent BDS
|
2014-04-12 03:29:52 +08:00
|
|
|
*/
|
2015-04-29 23:29:39 +08:00
|
|
|
static void bdrv_inherited_options(int *child_flags, QDict *child_options,
|
|
|
|
int parent_flags, QDict *parent_options)
|
2014-04-12 03:29:52 +08:00
|
|
|
{
|
2015-04-29 23:29:39 +08:00
|
|
|
int flags = parent_flags;
|
|
|
|
|
2014-04-12 03:29:52 +08:00
|
|
|
/* Enable protocol handling, disable format probing for bs->file */
|
|
|
|
flags |= BDRV_O_PROTOCOL;
|
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
/* If the cache mode isn't explicitly set, inherit direct and no-flush from
|
|
|
|
* the parent. */
|
|
|
|
qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
|
|
|
|
qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
|
|
|
|
|
2014-04-12 03:29:52 +08:00
|
|
|
/* Our block drivers take care to send flushes and respect unmap policy,
|
2015-05-08 23:49:53 +08:00
|
|
|
* so we can default to enable both on lower layers regardless of the
|
|
|
|
* corresponding parent options. */
|
|
|
|
qdict_set_default_str(child_options, BDRV_OPT_CACHE_WB, "on");
|
|
|
|
flags |= BDRV_O_UNMAP;
|
2014-04-12 03:29:52 +08:00
|
|
|
|
|
|
|
/* Clear flags that only apply to the top layer */
|
2014-04-12 03:36:45 +08:00
|
|
|
flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_COPY_ON_READ);
|
2014-04-12 03:29:52 +08:00
|
|
|
|
2015-04-29 23:29:39 +08:00
|
|
|
*child_flags = flags;
|
2014-04-12 03:29:52 +08:00
|
|
|
}
|
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
const BdrvChildRole child_file = {
|
2015-04-29 23:29:39 +08:00
|
|
|
.inherit_options = bdrv_inherited_options,
|
2015-04-08 19:43:47 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
2015-04-29 23:29:39 +08:00
|
|
|
* Returns the options and flags that bs->file should get if the use of formats
|
|
|
|
* (and not only protocols) is permitted for it, based on the given options and
|
|
|
|
* flags for the parent BDS
|
2015-04-08 19:43:47 +08:00
|
|
|
*/
|
2015-04-29 23:29:39 +08:00
|
|
|
static void bdrv_inherited_fmt_options(int *child_flags, QDict *child_options,
|
|
|
|
int parent_flags, QDict *parent_options)
|
2015-04-08 19:43:47 +08:00
|
|
|
{
|
2015-04-29 23:29:39 +08:00
|
|
|
child_file.inherit_options(child_flags, child_options,
|
|
|
|
parent_flags, parent_options);
|
|
|
|
|
|
|
|
*child_flags &= ~BDRV_O_PROTOCOL;
|
2015-04-08 19:43:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
const BdrvChildRole child_format = {
|
2015-04-29 23:29:39 +08:00
|
|
|
.inherit_options = bdrv_inherited_fmt_options,
|
2015-04-08 19:43:47 +08:00
|
|
|
};
|
|
|
|
|
2014-04-25 19:27:34 +08:00
|
|
|
/*
|
2015-04-29 23:29:39 +08:00
|
|
|
* Returns the options and flags that bs->backing should get, based on the
|
|
|
|
* given options and flags for the parent BDS
|
2014-04-25 19:27:34 +08:00
|
|
|
*/
|
2015-04-29 23:29:39 +08:00
|
|
|
static void bdrv_backing_options(int *child_flags, QDict *child_options,
|
|
|
|
int parent_flags, QDict *parent_options)
|
2014-04-25 19:27:34 +08:00
|
|
|
{
|
2015-04-29 23:29:39 +08:00
|
|
|
int flags = parent_flags;
|
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
/* The cache mode is inherited unmodified for backing files */
|
|
|
|
qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_WB);
|
|
|
|
qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_DIRECT);
|
|
|
|
qdict_copy_default(child_options, parent_options, BDRV_OPT_CACHE_NO_FLUSH);
|
|
|
|
|
2014-04-25 19:27:34 +08:00
|
|
|
/* backing files always opened read-only */
|
|
|
|
flags &= ~(BDRV_O_RDWR | BDRV_O_COPY_ON_READ);
|
|
|
|
|
|
|
|
/* snapshot=on is handled on the top layer */
|
2014-04-12 01:16:36 +08:00
|
|
|
flags &= ~(BDRV_O_SNAPSHOT | BDRV_O_TEMPORARY);
|
2014-04-25 19:27:34 +08:00
|
|
|
|
2015-04-29 23:29:39 +08:00
|
|
|
*child_flags = flags;
|
2014-04-25 19:27:34 +08:00
|
|
|
}
|
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
static const BdrvChildRole child_backing = {
|
2015-04-29 23:29:39 +08:00
|
|
|
.inherit_options = bdrv_backing_options,
|
2015-04-08 19:43:47 +08:00
|
|
|
};
|
|
|
|
|
2012-11-13 00:05:39 +08:00
|
|
|
/*
 * Compute the flags that are handed to the driver's open function from the
 * flags requested for @bs: BDRV_O_CACHE_WB is always set, flags internal to
 * the block layer are removed, and temporary images are made writable.
 */
static int bdrv_open_flags(BlockDriverState *bs, int flags)
{
    /* Flags that are internal to the block layer; cleared before opening
     * the image. */
    const int internal = BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING | BDRV_O_PROTOCOL;
    int open_flags = (flags | BDRV_O_CACHE_WB) & ~internal;

    /* Snapshots should be writable. */
    if (flags & BDRV_O_TEMPORARY) {
        open_flags |= BDRV_O_RDWR;
    }

    return open_flags;
}
|
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
/*
 * Recompute the cache-related bits of *flags from the boolean cache options
 * in @opts.  All bits in BDRV_O_CACHE_MASK are cleared first; each of the
 * three cache options must be present in @opts (asserted).
 */
static void update_flags_from_options(int *flags, QemuOpts *opts)
{
    *flags &= ~BDRV_O_CACHE_MASK;

    assert(qemu_opt_find(opts, BDRV_OPT_CACHE_WB));
    *flags |= qemu_opt_get_bool(opts, BDRV_OPT_CACHE_WB, false)
              ? BDRV_O_CACHE_WB : 0;

    assert(qemu_opt_find(opts, BDRV_OPT_CACHE_NO_FLUSH));
    *flags |= qemu_opt_get_bool(opts, BDRV_OPT_CACHE_NO_FLUSH, false)
              ? BDRV_O_NO_FLUSH : 0;

    assert(qemu_opt_find(opts, BDRV_OPT_CACHE_DIRECT));
    *flags |= qemu_opt_get_bool(opts, BDRV_OPT_CACHE_DIRECT, false)
              ? BDRV_O_NOCACHE : 0;
}
|
|
|
|
|
|
|
|
/*
 * For each cache option that is not yet present in @options, add it as a
 * boolean whose value reflects the corresponding bit in @flags.  Options
 * that are already present are left untouched.
 */
static void update_options_from_flags(QDict *options, int flags)
{
    const struct {
        const char *key;
        int flag;
    } cache_opts[] = {
        { BDRV_OPT_CACHE_WB,       BDRV_O_CACHE_WB },
        { BDRV_OPT_CACHE_DIRECT,   BDRV_O_NOCACHE },
        { BDRV_OPT_CACHE_NO_FLUSH, BDRV_O_NO_FLUSH },
    };
    size_t i;

    for (i = 0; i < sizeof(cache_opts) / sizeof(cache_opts[0]); i++) {
        if (qdict_haskey(options, cache_opts[i].key)) {
            continue;
        }
        qdict_put(options, cache_opts[i].key,
                  qbool_from_bool(flags & cache_opts[i].flag));
    }
}
|
|
|
|
|
2014-01-24 21:11:52 +08:00
|
|
|
static void bdrv_assign_node_name(BlockDriverState *bs,
|
|
|
|
const char *node_name,
|
|
|
|
Error **errp)
|
2014-01-24 04:31:33 +08:00
|
|
|
{
|
2015-10-13 07:36:50 +08:00
|
|
|
char *gen_node_name = NULL;
|
2014-01-24 04:31:33 +08:00
|
|
|
|
2015-10-13 07:36:50 +08:00
|
|
|
if (!node_name) {
|
|
|
|
node_name = gen_node_name = id_generate(ID_BLOCK);
|
|
|
|
} else if (!id_wellformed(node_name)) {
|
|
|
|
/*
|
|
|
|
* Check for empty string or invalid characters, but not if it is
|
|
|
|
* generated (generated names use characters not available to the user)
|
|
|
|
*/
|
2014-09-25 15:54:02 +08:00
|
|
|
error_setg(errp, "Invalid node name");
|
2014-01-24 21:11:52 +08:00
|
|
|
return;
|
2014-01-24 04:31:33 +08:00
|
|
|
}
|
|
|
|
|
2014-02-13 00:15:07 +08:00
|
|
|
/* takes care of avoiding namespaces collisions */
|
2014-10-07 19:59:12 +08:00
|
|
|
if (blk_by_name(node_name)) {
|
2014-02-13 00:15:07 +08:00
|
|
|
error_setg(errp, "node-name=%s is conflicting with a device id",
|
|
|
|
node_name);
|
2015-10-13 07:36:50 +08:00
|
|
|
goto out;
|
2014-02-13 00:15:07 +08:00
|
|
|
}
|
|
|
|
|
2014-01-24 04:31:33 +08:00
|
|
|
/* takes care of avoiding duplicates node names */
|
|
|
|
if (bdrv_find_node(node_name)) {
|
|
|
|
error_setg(errp, "Duplicate node name");
|
2015-10-13 07:36:50 +08:00
|
|
|
goto out;
|
2014-01-24 04:31:33 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* copy node name into the bs and insert it into the graph list */
|
|
|
|
pstrcpy(bs->node_name, sizeof(bs->node_name), node_name);
|
|
|
|
QTAILQ_INSERT_TAIL(&graph_bdrv_states, bs, node_list);
|
2015-10-13 07:36:50 +08:00
|
|
|
out:
|
|
|
|
g_free(gen_node_name);
|
2014-01-24 04:31:33 +08:00
|
|
|
}
|
|
|
|
|
2015-04-07 23:12:56 +08:00
|
|
|
static QemuOptsList bdrv_runtime_opts = {
|
|
|
|
.name = "bdrv_common",
|
|
|
|
.head = QTAILQ_HEAD_INITIALIZER(bdrv_runtime_opts.head),
|
|
|
|
.desc = {
|
|
|
|
{
|
|
|
|
.name = "node-name",
|
|
|
|
.type = QEMU_OPT_STRING,
|
|
|
|
.help = "Node name of the block device node",
|
|
|
|
},
|
2015-04-24 22:38:02 +08:00
|
|
|
{
|
|
|
|
.name = "driver",
|
|
|
|
.type = QEMU_OPT_STRING,
|
|
|
|
.help = "Block driver to use for the node",
|
|
|
|
},
|
2015-05-08 23:49:53 +08:00
|
|
|
{
|
|
|
|
.name = BDRV_OPT_CACHE_WB,
|
|
|
|
.type = QEMU_OPT_BOOL,
|
|
|
|
.help = "Enable writeback mode",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
.name = BDRV_OPT_CACHE_DIRECT,
|
|
|
|
.type = QEMU_OPT_BOOL,
|
|
|
|
.help = "Bypass software writeback cache on the host",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
.name = BDRV_OPT_CACHE_NO_FLUSH,
|
|
|
|
.type = QEMU_OPT_BOOL,
|
|
|
|
.help = "Ignore flush requests",
|
|
|
|
},
|
2015-04-07 23:12:56 +08:00
|
|
|
{ /* end of list */ }
|
|
|
|
},
|
|
|
|
};
|
|
|
|
|
2010-04-14 21:24:50 +08:00
|
|
|
/*
|
|
|
|
* Common part for opening disk images and files
|
2013-03-15 17:35:04 +08:00
|
|
|
*
|
|
|
|
* Removes all processed options from *options.
|
2010-04-14 21:24:50 +08:00
|
|
|
*/
|
2015-06-16 20:19:22 +08:00
|
|
|
static int bdrv_open_common(BlockDriverState *bs, BdrvChild *file,
|
2016-01-12 02:07:50 +08:00
|
|
|
QDict *options, Error **errp)
|
2010-04-14 21:24:50 +08:00
|
|
|
{
|
|
|
|
int ret, open_flags;
|
2013-04-09 20:34:19 +08:00
|
|
|
const char *filename;
|
2015-04-24 22:38:02 +08:00
|
|
|
const char *driver_name = NULL;
|
2014-01-24 04:31:33 +08:00
|
|
|
const char *node_name = NULL;
|
2015-04-07 23:12:56 +08:00
|
|
|
QemuOpts *opts;
|
2015-04-24 22:38:02 +08:00
|
|
|
BlockDriver *drv;
|
2013-09-05 20:45:29 +08:00
|
|
|
Error *local_err = NULL;
|
2010-04-14 21:24:50 +08:00
|
|
|
|
2012-05-08 22:51:49 +08:00
|
|
|
assert(bs->file == NULL);
|
2013-03-06 19:20:31 +08:00
|
|
|
assert(options != NULL && bs->options != options);
|
2010-04-14 21:24:50 +08:00
|
|
|
|
2015-04-24 22:38:02 +08:00
|
|
|
opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
|
|
|
|
qemu_opts_absorb_qdict(opts, options, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail_opts;
|
|
|
|
}
|
|
|
|
|
|
|
|
driver_name = qemu_opt_get(opts, "driver");
|
|
|
|
drv = bdrv_find_format(driver_name);
|
|
|
|
assert(drv != NULL);
|
|
|
|
|
2013-04-22 23:48:40 +08:00
|
|
|
if (file != NULL) {
|
2015-06-16 20:19:22 +08:00
|
|
|
filename = file->bs->filename;
|
2013-04-22 23:48:40 +08:00
|
|
|
} else {
|
|
|
|
filename = qdict_get_try_str(options, "filename");
|
|
|
|
}
|
|
|
|
|
2014-02-03 21:49:42 +08:00
|
|
|
if (drv->bdrv_needs_filename && !filename) {
|
|
|
|
error_setg(errp, "The '%s' block driver requires a file name",
|
|
|
|
drv->format_name);
|
2015-04-07 23:12:56 +08:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail_opts;
|
2014-01-24 04:31:33 +08:00
|
|
|
}
|
|
|
|
|
2016-01-12 02:07:50 +08:00
|
|
|
trace_bdrv_open_common(bs, filename ?: "", bs->open_flags,
|
|
|
|
drv->format_name);
|
2015-04-24 22:38:02 +08:00
|
|
|
|
2015-04-07 23:12:56 +08:00
|
|
|
node_name = qemu_opt_get(opts, "node-name");
|
2014-01-24 21:11:52 +08:00
|
|
|
bdrv_assign_node_name(bs, node_name, &local_err);
|
2014-04-25 22:50:31 +08:00
|
|
|
if (local_err) {
|
2014-01-24 21:11:52 +08:00
|
|
|
error_propagate(errp, local_err);
|
2015-04-07 23:12:56 +08:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail_opts;
|
2013-03-28 00:28:18 +08:00
|
|
|
}
|
|
|
|
|
2011-11-29 19:42:20 +08:00
|
|
|
bs->request_alignment = 512;
|
2013-08-22 15:24:14 +08:00
|
|
|
bs->zero_beyond_eof = true;
|
2016-01-12 02:07:50 +08:00
|
|
|
bs->read_only = !(bs->open_flags & BDRV_O_RDWR);
|
2013-05-29 19:35:40 +08:00
|
|
|
|
|
|
|
if (use_bdrv_whitelist && !bdrv_is_whitelisted(drv, bs->read_only)) {
|
2013-10-10 17:45:55 +08:00
|
|
|
error_setg(errp,
|
|
|
|
!bs->read_only && bdrv_is_whitelisted(drv, true)
|
|
|
|
? "Driver '%s' can only be used for read-only devices"
|
|
|
|
: "Driver '%s' is not whitelisted",
|
|
|
|
drv->format_name);
|
2015-04-07 23:12:56 +08:00
|
|
|
ret = -ENOTSUP;
|
|
|
|
goto fail_opts;
|
2013-05-29 19:35:40 +08:00
|
|
|
}
|
2010-04-14 21:24:50 +08:00
|
|
|
|
2011-11-29 00:08:47 +08:00
|
|
|
assert(bs->copy_on_read == 0); /* bdrv_new() and bdrv_close() make it so */
|
2016-01-12 02:07:50 +08:00
|
|
|
if (bs->open_flags & BDRV_O_COPY_ON_READ) {
|
2013-09-19 21:12:18 +08:00
|
|
|
if (!bs->read_only) {
|
|
|
|
bdrv_enable_copy_on_read(bs);
|
|
|
|
} else {
|
|
|
|
error_setg(errp, "Can't use copy-on-read on read-only device");
|
2015-04-07 23:12:56 +08:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail_opts;
|
2013-09-19 21:12:18 +08:00
|
|
|
}
|
2011-11-29 00:08:47 +08:00
|
|
|
}
|
|
|
|
|
2013-03-18 23:40:51 +08:00
|
|
|
if (filename != NULL) {
|
|
|
|
pstrcpy(bs->filename, sizeof(bs->filename), filename);
|
|
|
|
} else {
|
|
|
|
bs->filename[0] = '\0';
|
|
|
|
}
|
2014-07-19 02:24:56 +08:00
|
|
|
pstrcpy(bs->exact_filename, sizeof(bs->exact_filename), bs->filename);
|
2010-04-14 21:24:50 +08:00
|
|
|
|
|
|
|
bs->drv = drv;
|
2011-08-21 11:09:37 +08:00
|
|
|
bs->opaque = g_malloc0(drv->instance_size);
|
2010-04-14 21:24:50 +08:00
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
/* Apply cache mode options */
|
|
|
|
update_flags_from_options(&bs->open_flags, opts);
|
|
|
|
bdrv_set_enable_write_cache(bs, bs->open_flags & BDRV_O_CACHE_WB);
|
2011-10-27 17:54:27 +08:00
|
|
|
|
2010-04-14 20:17:38 +08:00
|
|
|
/* Open the image, either directly or using a protocol */
|
2016-01-12 02:07:50 +08:00
|
|
|
open_flags = bdrv_open_flags(bs, bs->open_flags);
|
2010-04-14 20:17:38 +08:00
|
|
|
if (drv->bdrv_file_open) {
|
2013-03-28 00:28:18 +08:00
|
|
|
assert(file == NULL);
|
2013-09-24 23:07:04 +08:00
|
|
|
assert(!drv->bdrv_needs_filename || filename != NULL);
|
2013-09-05 20:45:29 +08:00
|
|
|
ret = drv->bdrv_file_open(bs, options, open_flags, &local_err);
|
2012-11-13 00:35:27 +08:00
|
|
|
} else {
|
2013-04-09 19:19:18 +08:00
|
|
|
if (file == NULL) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_setg(errp, "Can't use '%s' as a block driver for the "
|
|
|
|
"protocol level", drv->format_name);
|
2013-04-09 19:19:18 +08:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto free_and_fail;
|
|
|
|
}
|
2012-11-13 00:35:27 +08:00
|
|
|
bs->file = file;
|
2013-09-05 20:45:29 +08:00
|
|
|
ret = drv->bdrv_open(bs, options, open_flags, &local_err);
|
2010-04-14 20:17:38 +08:00
|
|
|
}
|
|
|
|
|
2010-04-14 21:24:50 +08:00
|
|
|
if (ret < 0) {
|
2014-01-30 22:07:28 +08:00
|
|
|
if (local_err) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_propagate(errp, local_err);
|
2013-09-24 18:14:01 +08:00
|
|
|
} else if (bs->filename[0]) {
|
|
|
|
error_setg_errno(errp, -ret, "Could not open '%s'", bs->filename);
|
2013-09-05 20:45:29 +08:00
|
|
|
} else {
|
|
|
|
error_setg_errno(errp, -ret, "Could not open image");
|
|
|
|
}
|
2010-04-14 21:24:50 +08:00
|
|
|
goto free_and_fail;
|
|
|
|
}
|
|
|
|
|
block: Deprecate QCOW/QCOW2 encryption
We've steered users away from QCOW/QCOW2 encryption for a while,
because it's a flawed design (commit 136cd19 Describe flaws in
qcow/qcow2 encryption in the docs).
In addition to flawed crypto, we have comically bad usability, and
plain old bugs. Let me show you.
= Example images =
I'm going to use a raw image as backing file, and two QCOW2 images,
one encrypted, and one not:
$ qemu-img create -f raw backing.img 4m
Formatting 'backing.img', fmt=raw size=4194304
$ qemu-img create -f qcow2 -o encryption,backing_file=backing.img,backing_fmt=raw geheim.qcow2 4m
Formatting 'geheim.qcow2', fmt=qcow2 size=4194304 backing_file='backing.img' backing_fmt='raw' encryption=on cluster_size=65536 lazy_refcounts=off
$ qemu-img create -f qcow2 -o backing_file=backing.img,backing_fmt=raw normal.qcow2 4m
Formatting 'normal.qcow2', fmt=qcow2 size=4194304 backing_file='backing.img' backing_fmt='raw' encryption=off cluster_size=65536 lazy_refcounts=off
= Usability issues =
== Confusing startup ==
When no image is encrypted, and you don't give -S, QEMU starts the
guest immediately:
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio normal.qcow2
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) info status
VM status: running
But as soon as there's an encrypted image in play, the guest is *not*
started, with no notification whatsoever:
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio geheim.qcow2
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) info status
VM status: paused (prelaunch)
If the user figured out that he needs to type "cont" to enter his
keys, the confusion enters the next level: "cont" asks for at most
*one* key. If more are needed, it then silently does nothing. The
user has to type "cont" once per encrypted image:
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio -drive if=none,file=geheim.qcow2 -drive if=none,file=geheim.qcow2
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) info status
VM status: paused (prelaunch)
(qemu) c
none0 (geheim.qcow2) is encrypted.
Password: ******
(qemu) info status
VM status: paused (prelaunch)
(qemu) c
none1 (geheim.qcow2) is encrypted.
Password: ******
(qemu) info status
VM status: running
== Incorrect passwords not caught ==
All existing encryption schemes give you the GIGO treatment: garbage
password in, garbage data out. Guests usually refuse to mount
garbage, but other usage is prone to data loss.
== Need to stop the guest to add an encrypted image ==
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) info status
VM status: running
(qemu) drive_add "" if=none,file=geheim.qcow2
Guest must be stopped for opening of encrypted image
(qemu) stop
(qemu) drive_add "" if=none,file=geheim.qcow2
OK
Commit c3adb58 added this restriction. Before, we could expose images
lacking an encryption key to guests, with potentially catastrophic
results. See also "Use without key is not always caught".
= Bugs =
== Use without key is not always caught ==
Encrypted images can be in an intermediate state "opened, but no key".
The weird startup behavior and the need to stop the guest are there to
ensure the guest isn't exposed to that state. But other things still
are!
* drive_backup
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio geheim.qcow2
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) drive_backup -f ide0-hd0 out.img raw
Formatting 'out.img', fmt=raw size=4194304
I guess this writes encrypted data to raw image out.img. Good luck
with figuring out how to decrypt that again.
* commit
$ qemu-system-x86_64 -nodefaults -display none -monitor stdio geheim.qcow2
QEMU 2.2.50 monitor - type 'help' for more information
(qemu) commit ide0-hd0
I guess this writes encrypted data into the unencrypted raw backing
image, effectively destroying it.
== QMP device_add of usb-storage fails when it shouldn't ==
When the image is encrypted, device_add creates the device, defers
actually attaching it to when the key becomes available, then fails.
This is wrong. device_add must either create the device and succeed,
or do nothing and fail.
$ qemu-system-x86_64 -nodefaults -display none -usb -qmp stdio -drive if=none,id=foo,file=geheim.qcow2
{"QMP": {"version": {"qemu": {"micro": 50, "minor": 2, "major": 2}, "package": ""}, "capabilities": []}}
{ "execute": "qmp_capabilities" }
{"return": {}}
{ "execute": "device_add", "arguments": { "driver": "usb-storage", "id": "bar", "drive": "foo" } }
{"error": {"class": "DeviceEncrypted", "desc": "'foo' (geheim.qcow2) is encrypted"}}
{"execute":"device_del","arguments": { "id": "bar" } }
{"timestamp": {"seconds": 1426003440, "microseconds": 237181}, "event": "DEVICE_DELETED", "data": {"path": "/machine/peripheral/bar/bar.0/legacy[0]"}}
{"timestamp": {"seconds": 1426003440, "microseconds": 238231}, "event": "DEVICE_DELETED", "data": {"device": "bar", "path": "/machine/peripheral/bar"}}
{"return": {}}
This stuff is worse than useless, it's a trap for users.
If people become sufficiently interested in encrypted images to
contribute a cryptographically sane implementation for QCOW2 (or
whatever other format), then rewriting the necessary support around it
from scratch will likely be easier and yield better results than
fixing up the existing mess.
Let's deprecate the mess now, drop it after a grace period, and move
on.
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-03-14 04:09:40 +08:00
|
|
|
if (bs->encrypted) {
|
|
|
|
error_report("Encrypted images are deprecated");
|
|
|
|
error_printf("Support for them will be removed in a future release.\n"
|
|
|
|
"You can use 'qemu-img convert' to convert your image"
|
|
|
|
" to an unencrypted one.\n");
|
|
|
|
}
|
|
|
|
|
2010-04-19 23:56:41 +08:00
|
|
|
ret = refresh_total_sectors(bs, bs->total_sectors);
|
|
|
|
if (ret < 0) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_setg_errno(errp, -ret, "Could not refresh total sector count");
|
2010-04-19 23:56:41 +08:00
|
|
|
goto free_and_fail;
|
2010-04-14 21:24:50 +08:00
|
|
|
}
|
2010-04-19 23:56:41 +08:00
|
|
|
|
2014-07-16 23:48:16 +08:00
|
|
|
bdrv_refresh_limits(bs, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto free_and_fail;
|
|
|
|
}
|
|
|
|
|
2011-11-29 19:42:20 +08:00
|
|
|
assert(bdrv_opt_mem_align(bs) != 0);
|
2015-05-12 22:30:55 +08:00
|
|
|
assert(bdrv_min_mem_align(bs) != 0);
|
2015-06-23 18:44:56 +08:00
|
|
|
assert((bs->request_alignment != 0) || bdrv_is_sg(bs));
|
2015-04-07 23:12:56 +08:00
|
|
|
|
|
|
|
qemu_opts_del(opts);
|
2010-04-14 21:24:50 +08:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
free_and_fail:
|
2012-11-13 00:35:27 +08:00
|
|
|
bs->file = NULL;
|
2011-08-21 11:09:37 +08:00
|
|
|
g_free(bs->opaque);
|
2010-04-14 21:24:50 +08:00
|
|
|
bs->opaque = NULL;
|
|
|
|
bs->drv = NULL;
|
2015-04-07 23:12:56 +08:00
|
|
|
fail_opts:
|
|
|
|
qemu_opts_del(opts);
|
2010-04-14 21:24:50 +08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-05-26 17:45:08 +08:00
|
|
|
/*
 * Parse a "json:"-prefixed filename into a flattened options QDict.
 *
 * @filename must start with "json:" (asserted).  Returns the new QDict, or
 * NULL with @errp set if the text after the prefix is not valid JSON or is
 * not a JSON object.
 */
static QDict *parse_json_filename(const char *filename, Error **errp)
{
    const char *json_text = filename;
    QObject *parsed;
    QDict *dict;
    int ret;

    /* Skip the pseudo-protocol prefix */
    ret = strstart(filename, "json:", &json_text);
    assert(ret);

    parsed = qobject_from_json(json_text);
    if (!parsed) {
        error_setg(errp, "Could not parse the JSON options");
        return NULL;
    }

    if (qobject_type(parsed) != QTYPE_QDICT) {
        qobject_decref(parsed);
        error_setg(errp, "Invalid JSON object given");
        return NULL;
    }

    dict = qobject_to_qdict(parsed);
    qdict_flatten(dict);

    return dict;
}
|
|
|
|
|
2015-10-29 22:24:41 +08:00
|
|
|
static void parse_json_protocol(QDict *options, const char **pfilename,
|
|
|
|
Error **errp)
|
|
|
|
{
|
|
|
|
QDict *json_options;
|
|
|
|
Error *local_err = NULL;
|
|
|
|
|
|
|
|
/* Parse json: pseudo-protocol */
|
|
|
|
if (!*pfilename || !g_str_has_prefix(*pfilename, "json:")) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
json_options = parse_json_filename(*pfilename, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Options given in the filename have lower priority than options
|
|
|
|
* specified directly */
|
|
|
|
qdict_join(options, json_options, false);
|
|
|
|
QDECREF(json_options);
|
|
|
|
*pfilename = NULL;
|
|
|
|
}
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
/*
|
2014-05-26 17:09:59 +08:00
|
|
|
* Fills in default options for opening images and converts the legacy
|
|
|
|
* filename/flags pair to option QDict entries.
|
block: driver should override flags in bdrv_open()
The BDRV_O_PROTOCOL flag should have an impact only if no driver is
specified explicitly. Therefore, if bdrv_open() is called with an
explicit block driver argument (either through the options QDict or
through the drv parameter) and that block driver is a protocol block
driver, BDRV_O_PROTOCOL should be set; if it is a format block driver,
BDRV_O_PROTOCOL should be unset.
While there was code to unset the flag in case a format block driver
has been selected, it only followed the bdrv_fill_options() function
call whereas the flag in fact needs to be adjusted before it is used
there.
With that change, BDRV_O_PROTOCOL will always be set if the BDS should
be a protocol driver; if the driver has been specified explicitly, the
new code will set it; and bdrv_fill_options() will only "probe" a
protocol driver if BDRV_O_PROTOCOL is set. The probing after
bdrv_fill_options() cannot select a protocol driver.
Thus, bdrv_open_image() to open BDS.file is never called if a protocol
BDS is about to be created. With that change in turn it is impossible to
call bdrv_open_common() with a protocol drv and file != NULL, which
allows us to remove the bdrv_swap() call.
This change breaks a test case in qemu-iotest 051:
"-drive file=t.qcow2,file.driver=qcow2" now works because the explicitly
specified "qcow2" overrides the BDRV_O_PROTOCOL which is automatically
set for the "file" BDS (and the filename is just passed down).
Therefore, this patch removes that test case.
Signed-off-by: Max Reitz <mreitz@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-03-20 02:53:16 +08:00
|
|
|
* The BDRV_O_PROTOCOL flag in *flags will be set or cleared accordingly if a
|
|
|
|
* block driver has been specified explicitly.
|
2010-04-12 22:37:13 +08:00
|
|
|
*/
|
2015-10-29 22:24:41 +08:00
|
|
|
static int bdrv_fill_options(QDict **options, const char *filename,
                             int *flags, Error **errp)
{
    const char *drvname;
    /* Start from the caller's flag; an explicit "driver" option overrides it */
    bool protocol = *flags & BDRV_O_PROTOCOL;
    /* Set only when @filename was copied into *options by this function */
    bool parse_filename = false;
    BlockDriver *drv = NULL;
    Error *local_err = NULL;

    drvname = qdict_get_try_str(*options, "driver");
    if (drvname) {
        drv = bdrv_find_format(drvname);
        if (!drv) {
            error_setg(errp, "Unknown driver '%s'", drvname);
            return -ENOENT;
        }
        /* If the user has explicitly specified the driver, this choice should
         * override the BDRV_O_PROTOCOL flag */
        protocol = drv->bdrv_file_open;
    }

    /* Write the (possibly overridden) decision back to the caller's flags */
    if (protocol) {
        *flags |= BDRV_O_PROTOCOL;
    } else {
        *flags &= ~BDRV_O_PROTOCOL;
    }

    /* Translate cache options from flags into options */
    update_options_from_flags(*options, *flags);

    /* Fetch the file name from the options QDict if necessary */
    if (protocol && filename) {
        if (!qdict_haskey(*options, "filename")) {
            qdict_put(*options, "filename", qstring_from_str(filename));
            parse_filename = true;
        } else {
            error_setg(errp, "Can't specify 'file' and 'filename' options at "
                             "the same time");
            return -EINVAL;
        }
    }

    /* Find the right block driver */
    /* From here on, filename refers to the string stored in *options (or is
     * NULL if there is no "filename" entry) */
    filename = qdict_get_try_str(*options, "filename");

    if (!drvname && protocol) {
        if (filename) {
            drv = bdrv_find_protocol(filename, parse_filename, errp);
            if (!drv) {
                return -EINVAL;
            }

            /* Record the chosen protocol driver in the options */
            drvname = drv->format_name;
            qdict_put(*options, "driver", qstring_from_str(drvname));
        } else {
            error_setg(errp, "Must specify either driver or file");
            return -EINVAL;
        }
    }

    /* A protocol BDS always has its driver determined at this point */
    assert(drv || !protocol);

    /* Driver-specific filename parsing */
    if (drv && drv->bdrv_parse_filename && parse_filename) {
        drv->bdrv_parse_filename(filename, *options, &local_err);
        if (local_err) {
            error_propagate(errp, local_err);
            return -EINVAL;
        }

        /* Drop the raw filename unless the driver asks to keep it */
        if (!drv->bdrv_needs_filename) {
            qdict_del(*options, "filename");
        }
    }

    if (runstate_check(RUN_STATE_INMIGRATE)) {
        *flags |= BDRV_O_INACTIVE;
    }

    return 0;
}
|
|
|
|
|
2015-06-15 19:24:19 +08:00
|
|
|
static BdrvChild *bdrv_attach_child(BlockDriverState *parent_bs,
|
|
|
|
BlockDriverState *child_bs,
|
2015-04-27 19:46:22 +08:00
|
|
|
const char *child_name,
|
2015-06-15 19:24:19 +08:00
|
|
|
const BdrvChildRole *child_role)
|
2015-06-15 17:53:47 +08:00
|
|
|
{
|
|
|
|
BdrvChild *child = g_new(BdrvChild, 1);
|
|
|
|
*child = (BdrvChild) {
|
|
|
|
.bs = child_bs,
|
2015-04-27 19:46:22 +08:00
|
|
|
.name = g_strdup(child_name),
|
2015-06-15 17:53:47 +08:00
|
|
|
.role = child_role,
|
|
|
|
};
|
|
|
|
|
|
|
|
QLIST_INSERT_HEAD(&parent_bs->children, child, next);
|
2015-09-17 19:18:23 +08:00
|
|
|
QLIST_INSERT_HEAD(&child_bs->parents, child, next_parent);
|
2015-06-15 19:24:19 +08:00
|
|
|
|
|
|
|
return child;
|
2015-06-15 17:53:47 +08:00
|
|
|
}
|
|
|
|
|
2015-09-15 17:58:23 +08:00
|
|
|
/*
 * Unlinks @child from both lists it is a member of (via its next and
 * next_parent links) and frees it together with its name.
 *
 * @child must not be used after this call. The BlockDriverState it pointed
 * to is not unreferenced here.
 */
static void bdrv_detach_child(BdrvChild *child)
{
    QLIST_REMOVE(child, next);
    QLIST_REMOVE(child, next_parent);
    g_free(child->name);
    g_free(child);
}
|
|
|
|
|
|
|
|
/*
 * Detaches @child and drops one reference to the BlockDriverState it points
 * to. If that BDS was marked as inheriting from @parent, the marker is
 * cleared first.
 *
 * Passing a NULL @child is allowed and does nothing.
 */
void bdrv_unref_child(BlockDriverState *parent, BdrvChild *child)
{
    BlockDriverState *child_bs;

    if (child == NULL) {
        return;
    }

    if (child->bs->inherits_from == parent) {
        child->bs->inherits_from = NULL;
    }

    /* bdrv_detach_child() frees @child, so remember the BDS beforehand */
    child_bs = child->bs;
    bdrv_detach_child(child);
    bdrv_unref(child_bs);
}
|
|
|
|
|
2015-09-14 21:33:33 +08:00
|
|
|
/*
|
|
|
|
* Sets the backing file link of a BDS. A new reference is created; callers
|
|
|
|
* which don't need their own reference any more must call bdrv_unref().
|
|
|
|
*/
|
2014-05-23 21:29:45 +08:00
|
|
|
void bdrv_set_backing_hd(BlockDriverState *bs, BlockDriverState *backing_hd)
|
|
|
|
{
|
2015-09-14 21:33:33 +08:00
|
|
|
if (backing_hd) {
|
|
|
|
bdrv_ref(backing_hd);
|
|
|
|
}
|
2014-05-23 21:29:45 +08:00
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bs->backing) {
|
2014-05-23 21:29:47 +08:00
|
|
|
assert(bs->backing_blocker);
|
2015-06-17 20:55:21 +08:00
|
|
|
bdrv_op_unblock_all(bs->backing->bs, bs->backing_blocker);
|
2015-09-14 21:33:33 +08:00
|
|
|
bdrv_unref_child(bs, bs->backing);
|
2014-05-23 21:29:47 +08:00
|
|
|
} else if (backing_hd) {
|
|
|
|
error_setg(&bs->backing_blocker,
|
2015-04-08 17:29:19 +08:00
|
|
|
"node is used as backing hd of '%s'",
|
|
|
|
bdrv_get_device_or_node_name(bs));
|
2014-05-23 21:29:47 +08:00
|
|
|
}
|
|
|
|
|
2014-05-23 21:29:45 +08:00
|
|
|
if (!backing_hd) {
|
2014-05-23 21:29:47 +08:00
|
|
|
error_free(bs->backing_blocker);
|
|
|
|
bs->backing_blocker = NULL;
|
2015-06-17 20:55:21 +08:00
|
|
|
bs->backing = NULL;
|
2014-05-23 21:29:45 +08:00
|
|
|
goto out;
|
|
|
|
}
|
2015-04-27 19:46:22 +08:00
|
|
|
bs->backing = bdrv_attach_child(bs, backing_hd, "backing", &child_backing);
|
2014-05-23 21:29:45 +08:00
|
|
|
bs->open_flags &= ~BDRV_O_NO_BACKING;
|
|
|
|
pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_hd->filename);
|
|
|
|
pstrcpy(bs->backing_format, sizeof(bs->backing_format),
|
|
|
|
backing_hd->drv ? backing_hd->drv->format_name : "");
|
2014-05-23 21:29:47 +08:00
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
bdrv_op_block_all(backing_hd, bs->backing_blocker);
|
2014-05-23 21:29:47 +08:00
|
|
|
/* Otherwise we won't be able to commit due to check in bdrv_commit */
|
2015-06-17 20:55:21 +08:00
|
|
|
bdrv_op_unblock(backing_hd, BLOCK_OP_TYPE_COMMIT_TARGET,
|
2014-05-23 21:29:47 +08:00
|
|
|
bs->backing_blocker);
|
2014-05-23 21:29:45 +08:00
|
|
|
out:
|
2014-07-16 23:48:16 +08:00
|
|
|
bdrv_refresh_limits(bs, NULL);
|
2014-05-23 21:29:45 +08:00
|
|
|
}
|
|
|
|
|
2013-03-28 22:29:24 +08:00
|
|
|
/*
|
|
|
|
* Opens the backing file for a BlockDriverState if not yet open
|
|
|
|
*
|
2015-01-17 01:23:41 +08:00
|
|
|
* bdref_key specifies the key for the image's BlockdevRef in the options QDict.
|
|
|
|
* That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
|
|
|
|
* itself, all options starting with "${bdref_key}." are considered part of the
|
|
|
|
* BlockdevRef.
|
|
|
|
*
|
|
|
|
* TODO Can this be unified with bdrv_open_image()?
|
2013-03-28 22:29:24 +08:00
|
|
|
*/
|
2015-01-17 01:23:41 +08:00
|
|
|
int bdrv_open_backing_file(BlockDriverState *bs, QDict *parent_options,
|
|
|
|
const char *bdref_key, Error **errp)
|
2012-10-18 22:49:17 +08:00
|
|
|
{
|
2014-04-22 23:05:27 +08:00
|
|
|
char *backing_filename = g_malloc0(PATH_MAX);
|
2015-01-17 01:23:41 +08:00
|
|
|
char *bdref_key_dot;
|
|
|
|
const char *reference = NULL;
|
2014-04-25 19:27:34 +08:00
|
|
|
int ret = 0;
|
2014-05-23 21:29:45 +08:00
|
|
|
BlockDriverState *backing_hd;
|
2015-01-17 01:23:41 +08:00
|
|
|
QDict *options;
|
|
|
|
QDict *tmp_parent_options = NULL;
|
2013-09-05 20:45:29 +08:00
|
|
|
Error *local_err = NULL;
|
2012-10-18 22:49:17 +08:00
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bs->backing != NULL) {
|
2014-04-22 23:05:27 +08:00
|
|
|
goto free_exit;
|
2012-10-18 22:49:17 +08:00
|
|
|
}
|
|
|
|
|
2013-03-28 22:29:24 +08:00
|
|
|
/* NULL means an empty set of options */
|
2015-01-17 01:23:41 +08:00
|
|
|
if (parent_options == NULL) {
|
|
|
|
tmp_parent_options = qdict_new();
|
|
|
|
parent_options = tmp_parent_options;
|
2013-03-28 22:29:24 +08:00
|
|
|
}
|
|
|
|
|
2012-10-18 22:49:17 +08:00
|
|
|
bs->open_flags &= ~BDRV_O_NO_BACKING;
|
2015-01-17 01:23:41 +08:00
|
|
|
|
|
|
|
bdref_key_dot = g_strdup_printf("%s.", bdref_key);
|
|
|
|
qdict_extract_subqdict(parent_options, &options, bdref_key_dot);
|
|
|
|
g_free(bdref_key_dot);
|
|
|
|
|
|
|
|
reference = qdict_get_try_str(parent_options, bdref_key);
|
|
|
|
if (reference || qdict_haskey(options, "file.filename")) {
|
2013-04-13 02:27:07 +08:00
|
|
|
backing_filename[0] = '\0';
|
|
|
|
} else if (bs->backing_file[0] == '\0' && qdict_size(options) == 0) {
|
2013-03-28 22:29:24 +08:00
|
|
|
QDECREF(options);
|
2014-04-22 23:05:27 +08:00
|
|
|
goto free_exit;
|
2013-09-22 20:05:06 +08:00
|
|
|
} else {
|
2014-11-27 00:20:26 +08:00
|
|
|
bdrv_get_full_backing_filename(bs, backing_filename, PATH_MAX,
|
|
|
|
&local_err);
|
|
|
|
if (local_err) {
|
|
|
|
ret = -EINVAL;
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
QDECREF(options);
|
|
|
|
goto free_exit;
|
|
|
|
}
|
2012-10-18 22:49:17 +08:00
|
|
|
}
|
|
|
|
|
2014-06-04 21:09:35 +08:00
|
|
|
if (!bs->drv || !bs->drv->supports_backing) {
|
|
|
|
ret = -EINVAL;
|
|
|
|
error_setg(errp, "Driver doesn't support backing files");
|
|
|
|
QDECREF(options);
|
|
|
|
goto free_exit;
|
|
|
|
}
|
|
|
|
|
2014-11-26 01:12:42 +08:00
|
|
|
if (bs->backing_format[0] != '\0' && !qdict_haskey(options, "driver")) {
|
|
|
|
qdict_put(options, "driver", qstring_from_str(bs->backing_format));
|
2012-10-18 22:49:17 +08:00
|
|
|
}
|
|
|
|
|
2015-01-17 01:23:41 +08:00
|
|
|
backing_hd = NULL;
|
2015-04-08 19:43:47 +08:00
|
|
|
ret = bdrv_open_inherit(&backing_hd,
|
|
|
|
*backing_filename ? backing_filename : NULL,
|
2015-01-17 01:23:41 +08:00
|
|
|
reference, options, 0, bs, &child_backing,
|
error: Use error_prepend() where it makes obvious sense
Done with this Coccinelle semantic patch
@@
expression FMT, E1, E2;
expression list ARGS;
@@
- error_setg(E1, FMT, ARGS, error_get_pretty(E2));
+ error_propagate(E1, E2);/*###*/
+ error_prepend(E1, FMT/*@@@*/, ARGS);
followed by manual cleanup, first because I can't figure out how to
make Coccinelle transform strings, and second to get rid of now
superfluous error_propagate().
We now use or propagate the original error whole instead of just its
message obtained with error_get_pretty(). This avoids suppressing its
hint (see commit 50b7b00), but I can't see how the errors touched in
this commit could come with hints. It also improves the message
printed with &error_abort when we screw up (see commit 1e9b65b).
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
2015-12-18 23:35:15 +08:00
|
|
|
errp);
|
2012-10-18 22:49:17 +08:00
|
|
|
if (ret < 0) {
|
|
|
|
bs->open_flags |= BDRV_O_NO_BACKING;
|
error: Use error_prepend() where it makes obvious sense
Done with this Coccinelle semantic patch
@@
expression FMT, E1, E2;
expression list ARGS;
@@
- error_setg(E1, FMT, ARGS, error_get_pretty(E2));
+ error_propagate(E1, E2);/*###*/
+ error_prepend(E1, FMT/*@@@*/, ARGS);
followed by manual cleanup, first because I can't figure out how to
make Coccinelle transform strings, and second to get rid of now
superfluous error_propagate().
We now use or propagate the original error whole instead of just its
message obtained with error_get_pretty(). This avoids suppressing its
hint (see commit 50b7b00), but I can't see how the errors touched in
this commit could come with hints. It also improves the message
printed with &error_abort when we screw up (see commit 1e9b65b).
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
2015-12-18 23:35:15 +08:00
|
|
|
error_prepend(errp, "Could not open backing file: ");
|
2014-04-22 23:05:27 +08:00
|
|
|
goto free_exit;
|
2012-10-18 22:49:17 +08:00
|
|
|
}
|
2015-06-15 17:53:47 +08:00
|
|
|
|
2015-09-14 21:33:33 +08:00
|
|
|
/* Hook up the backing file link; drop our reference, bs owns the
|
|
|
|
* backing_hd reference now */
|
2014-05-23 21:29:45 +08:00
|
|
|
bdrv_set_backing_hd(bs, backing_hd);
|
2015-09-14 21:33:33 +08:00
|
|
|
bdrv_unref(backing_hd);
|
2014-01-09 03:43:25 +08:00
|
|
|
|
2015-01-17 01:23:41 +08:00
|
|
|
qdict_del(parent_options, bdref_key);
|
|
|
|
|
2014-04-22 23:05:27 +08:00
|
|
|
free_exit:
|
|
|
|
g_free(backing_filename);
|
2015-01-17 01:23:41 +08:00
|
|
|
QDECREF(tmp_parent_options);
|
2014-04-22 23:05:27 +08:00
|
|
|
return ret;
|
2012-10-18 22:49:17 +08:00
|
|
|
}
|
|
|
|
|
2013-12-21 02:28:11 +08:00
|
|
|
/*
|
|
|
|
* Opens a disk image whose options are given as BlockdevRef in another block
|
|
|
|
* device's options.
|
|
|
|
*
|
|
|
|
* If allow_none is true, no image will be opened if filename is false and no
|
2015-06-15 19:24:19 +08:00
|
|
|
* BlockdevRef is given. NULL will be returned, but errp remains unset.
|
2013-12-21 02:28:11 +08:00
|
|
|
*
|
|
|
|
* bdrev_key specifies the key for the image's BlockdevRef in the options QDict.
|
|
|
|
* That QDict has to be flattened; therefore, if the BlockdevRef is a QDict
|
|
|
|
* itself, all options starting with "${bdref_key}." are considered part of the
|
|
|
|
* BlockdevRef.
|
|
|
|
*
|
|
|
|
* The BlockdevRef will be removed from the options QDict.
|
|
|
|
*/
|
2015-06-15 19:24:19 +08:00
|
|
|
BdrvChild *bdrv_open_child(const char *filename,
|
|
|
|
QDict *options, const char *bdref_key,
|
|
|
|
BlockDriverState* parent,
|
|
|
|
const BdrvChildRole *child_role,
|
|
|
|
bool allow_none, Error **errp)
|
2013-12-21 02:28:11 +08:00
|
|
|
{
|
2015-06-15 19:24:19 +08:00
|
|
|
BdrvChild *c = NULL;
|
|
|
|
BlockDriverState *bs;
|
2013-12-21 02:28:11 +08:00
|
|
|
QDict *image_options;
|
|
|
|
int ret;
|
|
|
|
char *bdref_key_dot;
|
|
|
|
const char *reference;
|
|
|
|
|
2015-06-15 17:53:47 +08:00
|
|
|
assert(child_role != NULL);
|
2014-02-19 01:33:05 +08:00
|
|
|
|
2013-12-21 02:28:11 +08:00
|
|
|
bdref_key_dot = g_strdup_printf("%s.", bdref_key);
|
|
|
|
qdict_extract_subqdict(options, &image_options, bdref_key_dot);
|
|
|
|
g_free(bdref_key_dot);
|
|
|
|
|
|
|
|
reference = qdict_get_try_str(options, bdref_key);
|
|
|
|
if (!filename && !reference && !qdict_size(image_options)) {
|
2015-06-15 19:24:19 +08:00
|
|
|
if (!allow_none) {
|
2013-12-21 02:28:11 +08:00
|
|
|
error_setg(errp, "A block device must be specified for \"%s\"",
|
|
|
|
bdref_key);
|
|
|
|
}
|
2014-05-28 17:16:57 +08:00
|
|
|
QDECREF(image_options);
|
2013-12-21 02:28:11 +08:00
|
|
|
goto done;
|
|
|
|
}
|
|
|
|
|
2015-06-15 19:24:19 +08:00
|
|
|
bs = NULL;
|
|
|
|
ret = bdrv_open_inherit(&bs, filename, reference, image_options, 0,
|
2015-08-27 01:47:50 +08:00
|
|
|
parent, child_role, errp);
|
2015-06-15 17:53:47 +08:00
|
|
|
if (ret < 0) {
|
|
|
|
goto done;
|
|
|
|
}
|
|
|
|
|
2015-04-27 19:46:22 +08:00
|
|
|
c = bdrv_attach_child(parent, bs, bdref_key, child_role);
|
2013-12-21 02:28:11 +08:00
|
|
|
|
|
|
|
done:
|
|
|
|
qdict_del(options, bdref_key);
|
2015-06-15 19:24:19 +08:00
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
2014-06-23 23:28:23 +08:00
|
|
|
/*
 * Creates a temporary qcow2 image with the same virtual size as @bs, opens it
 * with @flags and puts it on top of @bs using bdrv_append().
 *
 * Returns 0 on success; on failure a negative value is returned and errp is
 * set.
 */
int bdrv_append_temp_snapshot(BlockDriverState *bs, int flags, Error **errp)
{
    /* TODO: extra byte is a hack to ensure MAX_PATH space on Windows. */
    char *tmp_filename = g_malloc0(PATH_MAX + 1);
    int64_t total_size;
    QemuOpts *opts = NULL;
    QDict *snapshot_options;
    BlockDriverState *bs_snapshot;
    Error *local_err = NULL;
    int ret;

    /* if snapshot, we create a temporary backing file and open it
       instead of opening 'filename' directly */

    /* Get the required size from the image */
    total_size = bdrv_getlength(bs);
    if (total_size < 0) {
        /* A negative length is passed on as the error code */
        ret = total_size;
        error_setg_errno(errp, -total_size, "Could not get image size");
        goto out;
    }

    /* Create the temporary image */
    ret = get_tmp_filename(tmp_filename, PATH_MAX + 1);
    if (ret < 0) {
        error_setg_errno(errp, -ret, "Could not get temporary filename");
        goto out;
    }

    opts = qemu_opts_create(bdrv_qcow2.create_opts, NULL, 0,
                            &error_abort);
    qemu_opt_set_number(opts, BLOCK_OPT_SIZE, total_size, &error_abort);
    ret = bdrv_create(&bdrv_qcow2, tmp_filename, opts, errp);
    qemu_opts_del(opts);
    if (ret < 0) {
        error_prepend(errp, "Could not create temporary overlay '%s': ",
                      tmp_filename);
        goto out;
    }

    /* Prepare a new options QDict for the temporary file */
    snapshot_options = qdict_new();
    qdict_put(snapshot_options, "file.driver",
              qstring_from_str("file"));
    qdict_put(snapshot_options, "file.filename",
              qstring_from_str(tmp_filename));
    qdict_put(snapshot_options, "driver",
              qstring_from_str("qcow2"));

    bs_snapshot = bdrv_new();

    ret = bdrv_open(&bs_snapshot, NULL, NULL, snapshot_options,
                    flags, &local_err);
    if (ret < 0) {
        /* NOTE(review): bs_snapshot is not released on this path - confirm
         * whether bdrv_open() disposes of a caller-provided BDS on failure */
        error_propagate(errp, local_err);
        goto out;
    }

    bdrv_append(bs_snapshot, bs);

out:
    g_free(tmp_filename);
    return ret;
}
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
/*
|
|
|
|
* Opens a disk image (raw, qcow2, vmdk, ...)
|
2013-03-15 17:35:02 +08:00
|
|
|
*
|
|
|
|
* options is a QDict of options to pass to the block drivers, or NULL for an
|
|
|
|
* empty set of options. The reference to the QDict belongs to the block layer
|
|
|
|
* after the call (even on failure), so if the caller intends to reuse the
|
|
|
|
* dictionary, it needs to use QINCREF() before calling bdrv_open.
|
2014-02-19 01:33:05 +08:00
|
|
|
*
|
|
|
|
* If *pbs is NULL, a new BDS will be created with a pointer to it stored there.
|
|
|
|
* If it is not NULL, the referenced BDS will be reused.
|
2014-02-19 01:33:06 +08:00
|
|
|
*
|
|
|
|
* The reference parameter may be used to specify an existing block device which
|
|
|
|
* should be opened. If specified, neither options nor a filename may be given,
|
|
|
|
* nor can an existing BDS be reused (that is, *pbs has to be NULL).
|
2010-04-12 22:37:13 +08:00
|
|
|
*/
|
2015-04-08 19:43:47 +08:00
|
|
|
static int bdrv_open_inherit(BlockDriverState **pbs, const char *filename,
|
|
|
|
const char *reference, QDict *options, int flags,
|
|
|
|
BlockDriverState *parent,
|
2015-08-27 01:47:50 +08:00
|
|
|
const BdrvChildRole *child_role, Error **errp)
|
2004-08-02 05:59:26 +08:00
|
|
|
{
|
2010-04-12 22:37:13 +08:00
|
|
|
int ret;
|
2015-06-16 20:19:22 +08:00
|
|
|
BdrvChild *file = NULL;
|
|
|
|
BlockDriverState *bs;
|
2015-08-27 01:47:50 +08:00
|
|
|
BlockDriver *drv = NULL;
|
2013-07-09 17:09:02 +08:00
|
|
|
const char *drvname;
|
2015-10-26 20:27:15 +08:00
|
|
|
const char *backing;
|
2013-09-05 20:45:29 +08:00
|
|
|
Error *local_err = NULL;
|
2014-05-06 18:11:42 +08:00
|
|
|
int snapshot_flags = 0;
|
2005-04-29 05:09:32 +08:00
|
|
|
|
2014-02-19 01:33:05 +08:00
|
|
|
assert(pbs);
|
2015-04-08 19:43:47 +08:00
|
|
|
assert(!child_role || !flags);
|
|
|
|
assert(!child_role == !parent);
|
2014-02-19 01:33:05 +08:00
|
|
|
|
2014-02-19 01:33:06 +08:00
|
|
|
if (reference) {
|
|
|
|
bool options_non_empty = options ? qdict_size(options) : false;
|
|
|
|
QDECREF(options);
|
|
|
|
|
|
|
|
if (*pbs) {
|
|
|
|
error_setg(errp, "Cannot reuse an existing BDS when referencing "
|
|
|
|
"another block device");
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (filename || options_non_empty) {
|
|
|
|
error_setg(errp, "Cannot reference an existing block device with "
|
|
|
|
"additional options or a new filename");
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
bs = bdrv_lookup_bs(reference, reference, errp);
|
|
|
|
if (!bs) {
|
|
|
|
return -ENODEV;
|
|
|
|
}
|
|
|
|
bdrv_ref(bs);
|
|
|
|
*pbs = bs;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2014-02-19 01:33:05 +08:00
|
|
|
if (*pbs) {
|
|
|
|
bs = *pbs;
|
|
|
|
} else {
|
2014-10-07 19:59:03 +08:00
|
|
|
bs = bdrv_new();
|
2014-02-19 01:33:05 +08:00
|
|
|
}
|
|
|
|
|
2013-03-15 17:35:02 +08:00
|
|
|
/* NULL means an empty set of options */
|
|
|
|
if (options == NULL) {
|
|
|
|
options = qdict_new();
|
|
|
|
}
|
|
|
|
|
2015-05-08 22:15:03 +08:00
|
|
|
/* json: syntax counts as explicit options, as if in the QDict */
|
2015-10-29 22:24:41 +08:00
|
|
|
parse_json_protocol(options, &filename, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
|
2015-05-08 22:15:03 +08:00
|
|
|
bs->explicit_options = qdict_clone_shallow(options);
|
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
if (child_role) {
|
2015-04-10 00:47:50 +08:00
|
|
|
bs->inherits_from = parent;
|
2015-04-29 23:29:39 +08:00
|
|
|
child_role->inherit_options(&flags, options,
|
|
|
|
parent->open_flags, parent->options);
|
2015-04-08 19:43:47 +08:00
|
|
|
}
|
|
|
|
|
2015-10-29 22:24:41 +08:00
|
|
|
ret = bdrv_fill_options(&options, filename, &flags, &local_err);
|
2014-05-26 17:39:55 +08:00
|
|
|
if (local_err) {
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
|
2015-04-24 22:38:02 +08:00
|
|
|
bs->open_flags = flags;
|
|
|
|
bs->options = options;
|
|
|
|
options = qdict_clone_shallow(options);
|
|
|
|
|
2014-06-04 20:19:44 +08:00
|
|
|
/* Find the right image format driver */
|
|
|
|
drvname = qdict_get_try_str(options, "driver");
|
|
|
|
if (drvname) {
|
|
|
|
drv = bdrv_find_format(drvname);
|
|
|
|
if (!drv) {
|
|
|
|
error_setg(errp, "Unknown driver: '%s'", drvname);
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
assert(drvname || !(flags & BDRV_O_PROTOCOL));
|
|
|
|
|
2015-10-26 20:27:15 +08:00
|
|
|
backing = qdict_get_try_str(options, "backing");
|
|
|
|
if (backing && *backing == '\0') {
|
|
|
|
flags |= BDRV_O_NO_BACKING;
|
|
|
|
qdict_del(options, "backing");
|
|
|
|
}
|
|
|
|
|
2012-11-13 00:35:27 +08:00
|
|
|
/* Open image file without format layer */
|
2014-06-03 22:44:19 +08:00
|
|
|
if ((flags & BDRV_O_PROTOCOL) == 0) {
|
|
|
|
if (flags & BDRV_O_RDWR) {
|
|
|
|
flags |= BDRV_O_ALLOW_RDWR;
|
|
|
|
}
|
|
|
|
if (flags & BDRV_O_SNAPSHOT) {
|
|
|
|
snapshot_flags = bdrv_temp_snapshot_flags(flags);
|
2015-04-29 23:29:39 +08:00
|
|
|
bdrv_backing_options(&flags, options, flags, options);
|
2014-06-03 22:44:19 +08:00
|
|
|
}
|
2012-11-13 00:35:27 +08:00
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
bs->open_flags = flags;
|
2015-06-15 20:11:51 +08:00
|
|
|
|
2015-06-16 20:19:22 +08:00
|
|
|
file = bdrv_open_child(filename, options, "file", bs,
|
|
|
|
&child_file, true, &local_err);
|
2015-06-15 20:11:51 +08:00
|
|
|
if (local_err) {
|
|
|
|
ret = -EINVAL;
|
2014-06-03 22:44:19 +08:00
|
|
|
goto fail;
|
|
|
|
}
|
2012-11-13 00:35:27 +08:00
|
|
|
}
|
|
|
|
|
2014-06-04 20:19:44 +08:00
|
|
|
/* Image format probing */
|
raw: Prohibit dangerous writes for probed images
If the user neglects to specify the image format, QEMU probes the
image to guess it automatically, for convenience.
Relying on format probing is insecure for raw images (CVE-2008-2004).
If the guest writes a suitable header to the device, the next probe
will recognize a format chosen by the guest. A malicious guest can
abuse this to gain access to host files, e.g. by crafting a QCOW2
header with backing file /etc/shadow.
Commit 1e72d3b (April 2008) provided -drive parameter format to let
users disable probing. Commit f965509 (March 2009) extended QCOW2 to
optionally store the backing file format, to let users disable backing
file probing. QED has had a flag to suppress probing since the
beginning (2010), set whenever a raw backing file is assigned.
All of these additions that allow to avoid format probing have to be
specified explicitly. The default still allows the attack.
In order to fix this, commit 79368c8 (July 2010) put probed raw images
in a restricted mode, in which they wouldn't be able to overwrite the
first few bytes of the image so that they would identify as a different
image. If a write to the first sector would write one of the signatures
of another driver, qemu would instead zero out the first four bytes.
This patch was later reverted in commit 8b33d9e (September 2010) because
it didn't get the handling of unaligned qiov members right.
Today's block layer that is based on coroutines and has qiov utility
functions makes it much easier to get this functionality right, so this
patch implements it.
The other differences of this patch to the old one are that it doesn't
silently write something different than the guest requested by zeroing
out some bytes (it fails the request instead) and that it doesn't
maintain a list of signatures in the raw driver (it calls the usual
probe function instead).
Note that this change doesn't introduce new breakage for false positive
cases where the guest legitimately writes data into the first sector
that matches the signatures of an image format (e.g. for nested virt):
These cases were broken before, only the failure mode changes from
corruption after the next restart (when the wrong format is probed) to
failing the problematic write request.
Also note that like in the original patch, the restrictions only apply
if the image format has been guessed by probing. Explicitly specifying a
format allows guests to write anything they like.
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Message-id: 1416497234-29880-8-git-send-email-kwolf@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2014-11-20 23:27:12 +08:00
|
|
|
bs->probed = !drv;
|
2014-06-04 20:19:44 +08:00
|
|
|
if (!drv && file) {
|
2015-06-16 20:19:22 +08:00
|
|
|
ret = find_image_format(file->bs, filename, &drv, &local_err);
|
2014-05-27 16:50:29 +08:00
|
|
|
if (ret < 0) {
|
2014-04-12 01:16:36 +08:00
|
|
|
goto fail;
|
2013-12-21 02:28:10 +08:00
|
|
|
}
|
2015-04-24 22:38:02 +08:00
|
|
|
/*
|
|
|
|
* This option update would logically belong in bdrv_fill_options(),
|
|
|
|
* but we first need to open bs->file for the probing to work, while
|
|
|
|
* opening bs->file already requires the (mostly) final set of options
|
|
|
|
* so that cache mode etc. can be inherited.
|
|
|
|
*
|
|
|
|
* Adding the driver later is somewhat ugly, but it's not an option
|
|
|
|
* that would ever be inherited, so it's correct. We just need to make
|
|
|
|
* sure to update both bs->options (which has the full effective
|
|
|
|
* options for bs) and options (which has file.* already removed).
|
|
|
|
*/
|
|
|
|
qdict_put(bs->options, "driver", qstring_from_str(drv->format_name));
|
|
|
|
qdict_put(options, "driver", qstring_from_str(drv->format_name));
|
2014-06-04 20:19:44 +08:00
|
|
|
} else if (!drv) {
|
2014-05-27 16:50:29 +08:00
|
|
|
error_setg(errp, "Must specify either driver or file");
|
|
|
|
ret = -EINVAL;
|
2014-04-12 01:16:36 +08:00
|
|
|
goto fail;
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
2010-04-12 22:37:13 +08:00
|
|
|
|
block: driver should override flags in bdrv_open()
The BDRV_O_PROTOCOL flag should have an impact only if no driver is
specified explicitly. Therefore, if bdrv_open() is called with an
explicit block driver argument (either through the options QDict or
through the drv parameter) and that block driver is a protocol block
driver, BDRV_O_PROTOCOL should be set; if it is a format block driver,
BDRV_O_PROTOCOL should be unset.
While there was code to unset the flag in case a format block driver
has been selected, it only followed the bdrv_fill_options() function
call whereas the flag in fact needs to be adjusted before it is used
there.
With that change, BDRV_O_PROTOCOL will always be set if the BDS should
be a protocol driver; if the driver has been specified explicitly, the
new code will set it; and bdrv_fill_options() will only "probe" a
protocol driver if BDRV_O_PROTOCOL is set. The probing after
bdrv_fill_options() cannot select a protocol driver.
Thus, bdrv_open_image() to open BDS.file is never called if a protocol
BDS is about to be created. With that change in turn it is impossible to
call bdrv_open_common() with a protocol drv and file != NULL, which
allows us to remove the bdrv_swap() call.
This change breaks a test case in qemu-iotest 051:
"-drive file=t.qcow2,file.driver=qcow2" now works because the explicitly
specified "qcow2" overrides the BDRV_O_PROTOCOL which is automatically
set for the "file" BDS (and the filename is just passed down).
Therefore, this patch removes that test case.
Signed-off-by: Max Reitz <mreitz@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-03-20 02:53:16 +08:00
|
|
|
/* BDRV_O_PROTOCOL must be set iff a protocol BDS is about to be created */
|
|
|
|
assert(!!(flags & BDRV_O_PROTOCOL) == !!drv->bdrv_file_open);
|
|
|
|
/* file must be NULL if a protocol BDS is about to be created
|
|
|
|
* (the inverse results in an error message from bdrv_open_common()) */
|
|
|
|
assert(!(flags & BDRV_O_PROTOCOL) || !file);
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
/* Open the image */
|
2016-01-12 02:07:50 +08:00
|
|
|
ret = bdrv_open_common(bs, file, options, &local_err);
|
2010-04-12 22:37:13 +08:00
|
|
|
if (ret < 0) {
|
2014-04-12 01:16:36 +08:00
|
|
|
goto fail;
|
2010-01-21 01:13:25 +08:00
|
|
|
}
|
|
|
|
|
2013-12-21 02:28:10 +08:00
|
|
|
if (file && (bs->file != file)) {
|
2015-06-16 20:19:22 +08:00
|
|
|
bdrv_unref_child(bs, file);
|
2012-11-13 00:35:27 +08:00
|
|
|
file = NULL;
|
|
|
|
}
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
/* If there is a backing file, use it */
|
2012-10-18 22:49:17 +08:00
|
|
|
if ((flags & BDRV_O_NO_BACKING) == 0) {
|
2015-01-17 01:23:41 +08:00
|
|
|
ret = bdrv_open_backing_file(bs, options, "backing", &local_err);
|
2010-04-12 22:37:13 +08:00
|
|
|
if (ret < 0) {
|
2013-03-15 17:35:04 +08:00
|
|
|
goto close_and_fail;
|
2010-04-12 22:37:13 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-19 02:24:56 +08:00
|
|
|
bdrv_refresh_filename(bs);
|
|
|
|
|
2013-03-15 17:35:04 +08:00
|
|
|
/* Check if any unknown options were used */
|
2014-02-19 01:33:11 +08:00
|
|
|
if (options && (qdict_size(options) != 0)) {
|
2013-03-15 17:35:04 +08:00
|
|
|
const QDictEntry *entry = qdict_first(options);
|
2014-02-19 01:33:11 +08:00
|
|
|
if (flags & BDRV_O_PROTOCOL) {
|
|
|
|
error_setg(errp, "Block protocol '%s' doesn't support the option "
|
|
|
|
"'%s'", drv->format_name, entry->key);
|
|
|
|
} else {
|
|
|
|
error_setg(errp, "Block format '%s' used by device '%s' doesn't "
|
|
|
|
"support the option '%s'", drv->format_name,
|
2014-10-07 19:59:11 +08:00
|
|
|
bdrv_get_device_name(bs), entry->key);
|
2014-02-19 01:33:11 +08:00
|
|
|
}
|
2013-03-15 17:35:04 +08:00
|
|
|
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto close_and_fail;
|
|
|
|
}
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
if (!bdrv_key_required(bs)) {
|
2014-10-07 19:59:25 +08:00
|
|
|
if (bs->blk) {
|
|
|
|
blk_dev_change_media_cb(bs->blk, true);
|
|
|
|
}
|
2014-03-14 16:22:48 +08:00
|
|
|
} else if (!runstate_check(RUN_STATE_PRELAUNCH)
|
|
|
|
&& !runstate_check(RUN_STATE_INMIGRATE)
|
|
|
|
&& !runstate_check(RUN_STATE_PAUSED)) { /* HACK */
|
|
|
|
error_setg(errp,
|
|
|
|
"Guest must be stopped for opening of encrypted image");
|
|
|
|
ret = -EBUSY;
|
|
|
|
goto close_and_fail;
|
2010-04-12 22:37:13 +08:00
|
|
|
}
|
|
|
|
|
2014-03-14 16:22:48 +08:00
|
|
|
QDECREF(options);
|
2014-02-19 01:33:05 +08:00
|
|
|
*pbs = bs;
|
2015-06-18 20:09:57 +08:00
|
|
|
|
|
|
|
/* For snapshot=on, create a temporary qcow2 overlay. bs points to the
|
|
|
|
* temporary snapshot afterwards. */
|
|
|
|
if (snapshot_flags) {
|
|
|
|
ret = bdrv_append_temp_snapshot(bs, snapshot_flags, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
goto close_and_fail;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-04-12 22:37:13 +08:00
|
|
|
return 0;
|
|
|
|
|
2014-04-12 01:16:36 +08:00
|
|
|
fail:
|
2012-11-13 00:35:27 +08:00
|
|
|
if (file != NULL) {
|
2015-06-16 20:19:22 +08:00
|
|
|
bdrv_unref_child(bs, file);
|
2012-11-13 00:35:27 +08:00
|
|
|
}
|
2015-05-08 22:15:03 +08:00
|
|
|
QDECREF(bs->explicit_options);
|
2013-03-15 17:35:02 +08:00
|
|
|
QDECREF(bs->options);
|
2013-03-15 17:35:04 +08:00
|
|
|
QDECREF(options);
|
2013-03-15 17:35:02 +08:00
|
|
|
bs->options = NULL;
|
2014-02-19 01:33:05 +08:00
|
|
|
if (!*pbs) {
|
|
|
|
/* If *pbs is NULL, a new BDS has been created in this function and
|
|
|
|
needs to be freed now. Otherwise, it does not need to be closed,
|
|
|
|
since it has not really been opened yet. */
|
|
|
|
bdrv_unref(bs);
|
|
|
|
}
|
2014-01-30 22:07:28 +08:00
|
|
|
if (local_err) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_propagate(errp, local_err);
|
|
|
|
}
|
2013-03-15 17:35:04 +08:00
|
|
|
return ret;
|
2013-03-15 17:35:02 +08:00
|
|
|
|
2013-03-15 17:35:04 +08:00
|
|
|
close_and_fail:
|
2014-02-19 01:33:05 +08:00
|
|
|
/* See fail path, but now the BDS has to be always closed */
|
|
|
|
if (*pbs) {
|
|
|
|
bdrv_close(bs);
|
|
|
|
} else {
|
|
|
|
bdrv_unref(bs);
|
|
|
|
}
|
2013-03-15 17:35:04 +08:00
|
|
|
QDECREF(options);
|
2014-01-30 22:07:28 +08:00
|
|
|
if (local_err) {
|
2013-09-05 20:45:29 +08:00
|
|
|
error_propagate(errp, local_err);
|
|
|
|
}
|
2010-04-12 22:37:13 +08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2015-04-08 19:43:47 +08:00
|
|
|
/*
 * Public entry point for opening a block device.
 *
 * All arguments are forwarded unchanged to bdrv_open_inherit(). The two
 * additional arguments that bdrv_open_inherit() takes before errp are
 * passed as NULL (presumably "no parent" and "no child role"; the
 * declaration is not visible in this part of the file -- TODO confirm).
 *
 * Returns whatever bdrv_open_inherit() returns.
 */
int bdrv_open(BlockDriverState **pbs, const char *filename,
              const char *reference, QDict *options, int flags, Error **errp)
{
    int ret;

    ret = bdrv_open_inherit(pbs, filename, reference, options, flags,
                            NULL, NULL, errp);
    return ret;
}
|
|
|
|
|
2012-09-21 03:13:19 +08:00
|
|
|
typedef struct BlockReopenQueueEntry {
|
|
|
|
bool prepared;
|
|
|
|
BDRVReopenState state;
|
|
|
|
QSIMPLEQ_ENTRY(BlockReopenQueueEntry) entry;
|
|
|
|
} BlockReopenQueueEntry;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Adds a BlockDriverState to a simple queue for an atomic, transactional
|
|
|
|
* reopen of multiple devices.
|
|
|
|
*
|
|
|
|
* bs_queue can either be an existing BlockReopenQueue that has had QSIMPLE_INIT
|
|
|
|
* already performed, or alternatively may be NULL a new BlockReopenQueue will
|
|
|
|
* be created and initialized. This newly created BlockReopenQueue should be
|
|
|
|
* passed back in for subsequent calls that are intended to be of the same
|
|
|
|
* atomic 'set'.
|
|
|
|
*
|
|
|
|
* bs is the BlockDriverState to add to the reopen queue.
|
|
|
|
*
|
2015-04-10 23:50:50 +08:00
|
|
|
* options contains the changed options for the associated bs
|
|
|
|
* (the BlockReopenQueue takes ownership)
|
|
|
|
*
|
2012-09-21 03:13:19 +08:00
|
|
|
* flags contains the open flags for the associated bs
|
|
|
|
*
|
|
|
|
* returns a pointer to bs_queue, which is either the newly allocated
|
|
|
|
* bs_queue, or the existing bs_queue being used.
|
|
|
|
*
|
|
|
|
*/
|
2015-05-08 23:07:31 +08:00
|
|
|
static BlockReopenQueue *bdrv_reopen_queue_child(BlockReopenQueue *bs_queue,
|
|
|
|
BlockDriverState *bs,
|
|
|
|
QDict *options,
|
|
|
|
int flags,
|
|
|
|
const BdrvChildRole *role,
|
|
|
|
QDict *parent_options,
|
|
|
|
int parent_flags)
|
2012-09-21 03:13:19 +08:00
|
|
|
{
|
|
|
|
assert(bs != NULL);
|
|
|
|
|
|
|
|
BlockReopenQueueEntry *bs_entry;
|
2015-04-10 00:54:04 +08:00
|
|
|
BdrvChild *child;
|
2015-05-08 22:15:03 +08:00
|
|
|
QDict *old_options, *explicit_options;
|
2015-04-10 00:54:04 +08:00
|
|
|
|
2012-09-21 03:13:19 +08:00
|
|
|
if (bs_queue == NULL) {
|
|
|
|
bs_queue = g_new0(BlockReopenQueue, 1);
|
|
|
|
QSIMPLEQ_INIT(bs_queue);
|
|
|
|
}
|
|
|
|
|
2015-04-10 23:50:50 +08:00
|
|
|
if (!options) {
|
|
|
|
options = qdict_new();
|
|
|
|
}
|
|
|
|
|
2015-05-08 23:07:31 +08:00
|
|
|
/*
|
|
|
|
* Precedence of options:
|
|
|
|
* 1. Explicitly passed in options (highest)
|
2015-05-08 23:49:53 +08:00
|
|
|
* 2. Set in flags (only for top level)
|
2015-05-08 22:15:03 +08:00
|
|
|
* 3. Retained from explicitly set options of bs
|
2015-04-29 23:29:39 +08:00
|
|
|
* 4. Inherited from parent node
|
2015-05-08 23:07:31 +08:00
|
|
|
* 5. Retained from effective options of bs
|
|
|
|
*/
|
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
if (!parent_options) {
|
|
|
|
/*
|
|
|
|
* Any setting represented by flags is always updated. If the
|
|
|
|
* corresponding QDict option is set, it takes precedence. Otherwise
|
|
|
|
* the flag is translated into a QDict option. The old setting of bs is
|
|
|
|
* not considered.
|
|
|
|
*/
|
|
|
|
update_options_from_flags(options, flags);
|
|
|
|
}
|
|
|
|
|
2015-05-08 22:15:03 +08:00
|
|
|
/* Old explicitly set values (don't overwrite by inherited value) */
|
|
|
|
old_options = qdict_clone_shallow(bs->explicit_options);
|
|
|
|
bdrv_join_options(bs, options, old_options);
|
|
|
|
QDECREF(old_options);
|
|
|
|
|
|
|
|
explicit_options = qdict_clone_shallow(options);
|
|
|
|
|
2015-05-08 23:07:31 +08:00
|
|
|
/* Inherit from parent node */
|
|
|
|
if (parent_options) {
|
|
|
|
assert(!flags);
|
2015-04-29 23:29:39 +08:00
|
|
|
role->inherit_options(&flags, options, parent_flags, parent_options);
|
2015-05-08 23:07:31 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Old values are used for options that aren't set yet */
|
2015-04-10 23:50:50 +08:00
|
|
|
old_options = qdict_clone_shallow(bs->options);
|
2015-11-16 23:43:27 +08:00
|
|
|
bdrv_join_options(bs, options, old_options);
|
2015-04-10 23:50:50 +08:00
|
|
|
QDECREF(old_options);
|
|
|
|
|
2014-04-26 01:04:55 +08:00
|
|
|
/* bdrv_open() masks this flag out */
|
|
|
|
flags &= ~BDRV_O_PROTOCOL;
|
|
|
|
|
2015-04-10 00:54:04 +08:00
|
|
|
QLIST_FOREACH(child, &bs->children, next) {
|
2015-05-08 21:14:15 +08:00
|
|
|
QDict *new_child_options;
|
|
|
|
char *child_key_dot;
|
2015-04-10 00:54:04 +08:00
|
|
|
|
2015-05-08 21:14:15 +08:00
|
|
|
/* reopen can only change the options of block devices that were
|
|
|
|
* implicitly created and inherited options. For other (referenced)
|
|
|
|
* block devices, a syntax like "backing.foo" results in an error. */
|
2015-04-10 00:54:04 +08:00
|
|
|
if (child->bs->inherits_from != bs) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2015-05-08 21:14:15 +08:00
|
|
|
child_key_dot = g_strdup_printf("%s.", child->name);
|
|
|
|
qdict_extract_subqdict(options, &new_child_options, child_key_dot);
|
|
|
|
g_free(child_key_dot);
|
|
|
|
|
2015-05-08 23:07:31 +08:00
|
|
|
bdrv_reopen_queue_child(bs_queue, child->bs, new_child_options, 0,
|
|
|
|
child->role, options, flags);
|
2012-09-21 03:13:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bs_entry = g_new0(BlockReopenQueueEntry, 1);
|
|
|
|
QSIMPLEQ_INSERT_TAIL(bs_queue, bs_entry, entry);
|
|
|
|
|
|
|
|
bs_entry->state.bs = bs;
|
2015-04-10 23:50:50 +08:00
|
|
|
bs_entry->state.options = options;
|
2015-05-08 22:15:03 +08:00
|
|
|
bs_entry->state.explicit_options = explicit_options;
|
2012-09-21 03:13:19 +08:00
|
|
|
bs_entry->state.flags = flags;
|
|
|
|
|
|
|
|
return bs_queue;
|
|
|
|
}
|
|
|
|
|
2015-05-08 23:07:31 +08:00
|
|
|
BlockReopenQueue *bdrv_reopen_queue(BlockReopenQueue *bs_queue,
|
|
|
|
BlockDriverState *bs,
|
|
|
|
QDict *options, int flags)
|
|
|
|
{
|
|
|
|
return bdrv_reopen_queue_child(bs_queue, bs, options, flags,
|
|
|
|
NULL, NULL, 0);
|
|
|
|
}
|
|
|
|
|
2012-09-21 03:13:19 +08:00
|
|
|
/*
|
|
|
|
* Reopen multiple BlockDriverStates atomically & transactionally.
|
|
|
|
*
|
|
|
|
* The queue passed in (bs_queue) must have been built up previous
|
|
|
|
* via bdrv_reopen_queue().
|
|
|
|
*
|
|
|
|
* Reopens all BDS specified in the queue, with the appropriate
|
|
|
|
* flags. All devices are prepared for reopen, and failure of any
|
|
|
|
* device will cause all device changes to be abandonded, and intermediate
|
|
|
|
* data cleaned up.
|
|
|
|
*
|
|
|
|
* If all devices prepare successfully, then the changes are committed
|
|
|
|
* to all devices.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
int bdrv_reopen_multiple(BlockReopenQueue *bs_queue, Error **errp)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
BlockReopenQueueEntry *bs_entry, *next;
|
|
|
|
Error *local_err = NULL;
|
|
|
|
|
|
|
|
assert(bs_queue != NULL);
|
|
|
|
|
|
|
|
bdrv_drain_all();
|
|
|
|
|
|
|
|
QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
|
|
|
|
if (bdrv_reopen_prepare(&bs_entry->state, bs_queue, &local_err)) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
bs_entry->prepared = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If we reach this point, we have success and just need to apply the
|
|
|
|
* changes
|
|
|
|
*/
|
|
|
|
QSIMPLEQ_FOREACH(bs_entry, bs_queue, entry) {
|
|
|
|
bdrv_reopen_commit(&bs_entry->state);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
|
|
|
cleanup:
|
|
|
|
QSIMPLEQ_FOREACH_SAFE(bs_entry, bs_queue, entry, next) {
|
|
|
|
if (ret && bs_entry->prepared) {
|
|
|
|
bdrv_reopen_abort(&bs_entry->state);
|
2015-05-08 22:15:03 +08:00
|
|
|
} else if (ret) {
|
|
|
|
QDECREF(bs_entry->state.explicit_options);
|
2012-09-21 03:13:19 +08:00
|
|
|
}
|
2015-04-10 23:50:50 +08:00
|
|
|
QDECREF(bs_entry->state.options);
|
2012-09-21 03:13:19 +08:00
|
|
|
g_free(bs_entry);
|
|
|
|
}
|
|
|
|
g_free(bs_queue);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* Reopen a single BlockDriverState with the specified flags. */
|
|
|
|
int bdrv_reopen(BlockDriverState *bs, int bdrv_flags, Error **errp)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
Error *local_err = NULL;
|
2015-04-10 23:50:50 +08:00
|
|
|
BlockReopenQueue *queue = bdrv_reopen_queue(NULL, bs, NULL, bdrv_flags);
|
2012-09-21 03:13:19 +08:00
|
|
|
|
|
|
|
ret = bdrv_reopen_multiple(queue, &local_err);
|
|
|
|
if (local_err != NULL) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Prepares a BlockDriverState for reopen. All changes are staged in the
|
|
|
|
* 'opaque' field of the BDRVReopenState, which is used and allocated by
|
|
|
|
* the block driver layer .bdrv_reopen_prepare()
|
|
|
|
*
|
|
|
|
* bs is the BlockDriverState to reopen
|
|
|
|
* flags are the new open flags
|
|
|
|
* queue is the reopen queue
|
|
|
|
*
|
|
|
|
* Returns 0 on success, non-zero on error. On error errp will be set
|
|
|
|
* as well.
|
|
|
|
*
|
|
|
|
* On failure, bdrv_reopen_abort() will be called to clean up any data.
|
|
|
|
* It is the responsibility of the caller to then call the abort() or
|
|
|
|
* commit() for any other BDS that have been left in a prepare() state
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
int bdrv_reopen_prepare(BDRVReopenState *reopen_state, BlockReopenQueue *queue,
|
|
|
|
Error **errp)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
Error *local_err = NULL;
|
|
|
|
BlockDriver *drv;
|
2015-05-08 23:24:56 +08:00
|
|
|
QemuOpts *opts;
|
|
|
|
const char *value;
|
2012-09-21 03:13:19 +08:00
|
|
|
|
|
|
|
assert(reopen_state != NULL);
|
|
|
|
assert(reopen_state->bs->drv != NULL);
|
|
|
|
drv = reopen_state->bs->drv;
|
|
|
|
|
2015-05-08 23:24:56 +08:00
|
|
|
/* Process generic block layer options */
|
|
|
|
opts = qemu_opts_create(&bdrv_runtime_opts, NULL, 0, &error_abort);
|
|
|
|
qemu_opts_absorb_qdict(opts, reopen_state->options, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2015-05-08 23:49:53 +08:00
|
|
|
update_flags_from_options(&reopen_state->flags, opts);
|
|
|
|
|
|
|
|
/* If a guest device is attached, it owns WCE */
|
|
|
|
if (reopen_state->bs->blk && blk_get_attached_dev(reopen_state->bs->blk)) {
|
|
|
|
bool old_wce = bdrv_enable_write_cache(reopen_state->bs);
|
|
|
|
bool new_wce = (reopen_state->flags & BDRV_O_CACHE_WB);
|
|
|
|
if (old_wce != new_wce) {
|
|
|
|
error_setg(errp, "Cannot change cache.writeback: Device attached");
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-05-08 23:24:56 +08:00
|
|
|
/* node-name and driver must be unchanged. Put them back into the QDict, so
|
|
|
|
* that they are checked at the end of this function. */
|
|
|
|
value = qemu_opt_get(opts, "node-name");
|
|
|
|
if (value) {
|
|
|
|
qdict_put(reopen_state->options, "node-name", qstring_from_str(value));
|
|
|
|
}
|
|
|
|
|
|
|
|
value = qemu_opt_get(opts, "driver");
|
|
|
|
if (value) {
|
|
|
|
qdict_put(reopen_state->options, "driver", qstring_from_str(value));
|
|
|
|
}
|
|
|
|
|
2012-09-21 03:13:19 +08:00
|
|
|
/* if we are to stay read-only, do not allow permission change
|
|
|
|
* to r/w */
|
|
|
|
if (!(reopen_state->bs->open_flags & BDRV_O_ALLOW_RDWR) &&
|
|
|
|
reopen_state->flags & BDRV_O_RDWR) {
|
2015-04-08 17:29:19 +08:00
|
|
|
error_setg(errp, "Node '%s' is read only",
|
|
|
|
bdrv_get_device_or_node_name(reopen_state->bs));
|
2012-09-21 03:13:19 +08:00
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
ret = bdrv_flush(reopen_state->bs);
|
|
|
|
if (ret) {
|
2015-11-11 14:51:20 +08:00
|
|
|
error_setg_errno(errp, -ret, "Error flushing drive");
|
2012-09-21 03:13:19 +08:00
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (drv->bdrv_reopen_prepare) {
|
|
|
|
ret = drv->bdrv_reopen_prepare(reopen_state, queue, &local_err);
|
|
|
|
if (ret) {
|
|
|
|
if (local_err != NULL) {
|
|
|
|
error_propagate(errp, local_err);
|
|
|
|
} else {
|
2013-06-10 23:29:27 +08:00
|
|
|
error_setg(errp, "failed while preparing to reopen image '%s'",
|
|
|
|
reopen_state->bs->filename);
|
2012-09-21 03:13:19 +08:00
|
|
|
}
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* It is currently mandatory to have a bdrv_reopen_prepare()
|
|
|
|
* handler for each supported drv. */
|
2015-04-08 17:29:19 +08:00
|
|
|
error_setg(errp, "Block format '%s' used by node '%s' "
|
|
|
|
"does not support reopening files", drv->format_name,
|
|
|
|
bdrv_get_device_or_node_name(reopen_state->bs));
|
2012-09-21 03:13:19 +08:00
|
|
|
ret = -1;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2015-04-10 23:50:50 +08:00
|
|
|
/* Options that are not handled are only okay if they are unchanged
|
|
|
|
* compared to the old state. It is expected that some options are only
|
|
|
|
* used for the initial open, but not reopen (e.g. filename) */
|
|
|
|
if (qdict_size(reopen_state->options)) {
|
|
|
|
const QDictEntry *entry = qdict_first(reopen_state->options);
|
|
|
|
|
|
|
|
do {
|
|
|
|
QString *new_obj = qobject_to_qstring(entry->value);
|
|
|
|
const char *new = qstring_get_str(new_obj);
|
|
|
|
const char *old = qdict_get_try_str(reopen_state->bs->options,
|
|
|
|
entry->key);
|
|
|
|
|
|
|
|
if (!old || strcmp(new, old)) {
|
|
|
|
error_setg(errp, "Cannot change the option '%s'", entry->key);
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
} while ((entry = qdict_next(reopen_state->options, entry)));
|
|
|
|
}
|
|
|
|
|
2012-09-21 03:13:19 +08:00
|
|
|
ret = 0;
|
|
|
|
|
|
|
|
error:
|
2015-05-08 23:24:56 +08:00
|
|
|
qemu_opts_del(opts);
|
2012-09-21 03:13:19 +08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Takes the staged changes for the reopen from bdrv_reopen_prepare(), and
|
|
|
|
* makes them final by swapping the staging BlockDriverState contents into
|
|
|
|
* the active BlockDriverState contents.
|
|
|
|
*/
|
|
|
|
void bdrv_reopen_commit(BDRVReopenState *reopen_state)
|
|
|
|
{
|
|
|
|
BlockDriver *drv;
|
|
|
|
|
|
|
|
assert(reopen_state != NULL);
|
|
|
|
drv = reopen_state->bs->drv;
|
|
|
|
assert(drv != NULL);
|
|
|
|
|
|
|
|
/* If there are any driver level actions to take */
|
|
|
|
if (drv->bdrv_reopen_commit) {
|
|
|
|
drv->bdrv_reopen_commit(reopen_state);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* set BDS specific flags now */
|
2015-05-08 22:15:03 +08:00
|
|
|
QDECREF(reopen_state->bs->explicit_options);
|
|
|
|
|
|
|
|
reopen_state->bs->explicit_options = reopen_state->explicit_options;
|
2012-09-21 03:13:19 +08:00
|
|
|
reopen_state->bs->open_flags = reopen_state->flags;
|
|
|
|
reopen_state->bs->enable_write_cache = !!(reopen_state->flags &
|
|
|
|
BDRV_O_CACHE_WB);
|
|
|
|
reopen_state->bs->read_only = !(reopen_state->flags & BDRV_O_RDWR);
|
2013-12-12 03:14:09 +08:00
|
|
|
|
2014-07-16 23:48:16 +08:00
|
|
|
bdrv_refresh_limits(reopen_state->bs, NULL);
|
2012-09-21 03:13:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Abort the reopen, and delete and free the staged changes in
|
|
|
|
* reopen_state
|
|
|
|
*/
|
|
|
|
void bdrv_reopen_abort(BDRVReopenState *reopen_state)
|
|
|
|
{
|
|
|
|
BlockDriver *drv;
|
|
|
|
|
|
|
|
assert(reopen_state != NULL);
|
|
|
|
drv = reopen_state->bs->drv;
|
|
|
|
assert(drv != NULL);
|
|
|
|
|
|
|
|
if (drv->bdrv_reopen_abort) {
|
|
|
|
drv->bdrv_reopen_abort(reopen_state);
|
|
|
|
}
|
2015-05-08 22:15:03 +08:00
|
|
|
|
|
|
|
QDECREF(reopen_state->explicit_options);
|
2012-09-21 03:13:19 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2016-01-29 23:36:10 +08:00
|
|
|
/*
 * Closes bs without freeing the BlockDriverState itself.
 *
 * Pending I/O is completed and flushed, named dirty bitmaps are released
 * and an attached BlockBackend is notified of the media change. If a
 * driver is still set, the driver's close callback runs, the backing file,
 * bs->file and all remaining children are detached, and the per-image
 * state (opaque data, option dicts, size, encryption flags, ...) is reset.
 * Finally all AIO notifiers are freed.
 *
 * bs must not have a block job attached.
 */
static void bdrv_close(BlockDriverState *bs)
{
    BdrvAioNotifier *ban, *ban_next;

    assert(!bs->job);

    /* Disable I/O limits and drain all pending throttled requests */
    if (bs->throttle_state) {
        bdrv_io_limits_disable(bs);
    }

    bdrv_drained_begin(bs); /* complete I/O */
    bdrv_flush(bs);
    bdrv_drain(bs); /* in case flush left pending I/O */

    bdrv_release_named_dirty_bitmaps(bs);
    assert(QLIST_EMPTY(&bs->dirty_bitmaps));

    if (bs->blk) {
        blk_dev_change_media_cb(bs->blk, false);
    }

    if (bs->drv) {
        BdrvChild *child, *next;

        bs->drv->bdrv_close(bs);
        bs->drv = NULL;

        bdrv_set_backing_hd(bs, NULL);

        if (bs->file != NULL) {
            bdrv_unref_child(bs, bs->file);
            bs->file = NULL;
        }

        QLIST_FOREACH_SAFE(child, &bs->children, next, next) {
            /* TODO Remove bdrv_unref() from drivers' close function and use
             * bdrv_unref_child() here */
            if (child->bs->inherits_from == bs) {
                child->bs->inherits_from = NULL;
            }
            bdrv_detach_child(child);
        }

        g_free(bs->opaque);
        bs->opaque = NULL;
        bs->copy_on_read = 0;
        bs->backing_file[0] = '\0';
        bs->backing_format[0] = '\0';
        bs->total_sectors = 0;
        bs->encrypted = 0;
        bs->valid_key = 0;
        bs->sg = 0;
        bs->zero_beyond_eof = false;

        /* Drop the option dicts and clear every pointer afterwards: the
         * BDS may stay alive after being closed, and explicit_options is
         * read again e.g. by bdrv_reopen_queue_child(), so it must not be
         * left dangling. */
        QDECREF(bs->options);
        bs->options = NULL;
        QDECREF(bs->explicit_options);
        bs->explicit_options = NULL;
        QDECREF(bs->full_open_options);
        bs->full_open_options = NULL;
    }

    QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
        g_free(ban);
    }
    QLIST_INIT(&bs->aio_notifiers);
    bdrv_drained_end(bs);
}
|
|
|
|
|
2010-05-28 10:44:57 +08:00
|
|
|
void bdrv_close_all(void)
|
|
|
|
{
|
|
|
|
BlockDriverState *bs;
|
2016-01-29 23:36:14 +08:00
|
|
|
AioContext *aio_context;
|
|
|
|
|
|
|
|
/* Drop references from requests still in flight, such as canceled block
|
|
|
|
* jobs whose AIO context has not been polled yet */
|
|
|
|
bdrv_drain_all();
|
2010-05-28 10:44:57 +08:00
|
|
|
|
2016-01-29 23:36:14 +08:00
|
|
|
blk_remove_all_bs();
|
|
|
|
blockdev_close_all_bdrv_states();
|
2014-05-08 22:34:35 +08:00
|
|
|
|
2016-01-29 23:36:14 +08:00
|
|
|
/* Cancel all block jobs */
|
|
|
|
while (!QTAILQ_EMPTY(&all_bdrv_states)) {
|
|
|
|
QTAILQ_FOREACH(bs, &all_bdrv_states, bs_list) {
|
|
|
|
aio_context = bdrv_get_aio_context(bs);
|
|
|
|
|
|
|
|
aio_context_acquire(aio_context);
|
|
|
|
if (bs->job) {
|
|
|
|
block_job_cancel_sync(bs->job);
|
|
|
|
aio_context_release(aio_context);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
aio_context_release(aio_context);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* All the remaining BlockDriverStates are referenced directly or
|
|
|
|
* indirectly from block jobs, so there needs to be at least one BDS
|
|
|
|
* directly used by a block job */
|
|
|
|
assert(bs);
|
2010-05-28 10:44:57 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-02 09:33:10 +08:00
|
|
|
/* Note that bs->device_list.tqe_prev is initially null,
|
|
|
|
* and gets set to non-null by QTAILQ_INSERT_TAIL(). Establish
|
|
|
|
* the useful invariant "bs in bdrv_states iff bs->tqe_prev" by
|
|
|
|
* resetting it to null on remove. */
|
|
|
|
void bdrv_device_remove(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
QTAILQ_REMOVE(&bdrv_states, bs, device_list);
|
|
|
|
bs->device_list.tqe_prev = NULL;
|
|
|
|
}
|
|
|
|
|
2014-01-24 04:31:32 +08:00
|
|
|
/* make a BlockDriverState anonymous by removing from bdrv_state and
|
|
|
|
* graph_bdrv_state list.
|
Do not delete BlockDriverState when deleting the drive
When removing a drive from the host-side via drive_del we currently have
the following path:
drive_del
qemu_aio_flush()
bdrv_close() // zaps bs->drv, which makes any subsequent I/O get
// dropped. Works as designed
drive_uninit()
bdrv_delete() // frees the bs. Since the device is still connected to
// bs, any subsequent I/O is a use-after-free.
The value of bs->drv becomes unpredictable on free. As long as it
remains null, I/O still gets dropped, however it could become non-null
at any point after the free resulting SEGVs or other QEMU state
corruption.
To resolve this issue as simply as possible, we can choose not to
actually delete the BlockDriverState pointer. Since bdrv_close()
handles setting the drv pointer to NULL, we just need to remove the
BlockDriverState from the QLIST that is used to enumerate the block
devices. This is currently handled within bdrv_delete, so move this
into its own function, bdrv_make_anon().
The result is that we can now invoke drive_del, this closes the file
descriptors and sets BlockDriverState->drv to NULL which prevents further
IO to the device, and since we do not free BlockDriverState, we don't
have to worry about the copy retained in the block devices.
We also don't attempt to remove the qdev property since we are no longer
deleting the BlockDriverState on drives with associated drives. This
also allows for removing Drives with no devices associated either.
Reported-by: Markus Armbruster <armbru@redhat.com>
Signed-off-by: Ryan Harper <ryanh@us.ibm.com>
Acked-by: Markus Armbruster <armbru@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2011-03-30 09:51:47 +08:00
|
|
|
Also, NULL terminate the device_name to prevent double remove */
|
|
|
|
void bdrv_make_anon(BlockDriverState *bs)
{
    /* Only unlink bs from the device list when it is actually linked in
     * (tqe_prev is set). */
    if (bs->device_list.tqe_prev != NULL) {
        bdrv_device_remove(bs);
    }

    /* A non-empty node name is what guards removal from
     * graph_bdrv_states; clear it afterwards so that a second call does
     * not try to unlink the node again. */
    if (bs->node_name[0] != '\0') {
        QTAILQ_REMOVE(&graph_bdrv_states, bs, node_list);
        bs->node_name[0] = '\0';
    }
}
|
|
|
|
|
2015-09-16 22:18:38 +08:00
|
|
|
/* Fields that need to stay with the top-level BDS */
|
2012-06-14 22:55:02 +08:00
|
|
|
static void bdrv_move_feature_fields(BlockDriverState *bs_dest,
|
|
|
|
BlockDriverState *bs_src)
|
2012-02-29 04:54:06 +08:00
|
|
|
{
|
2012-06-14 22:55:02 +08:00
|
|
|
/* move some fields that need to stay attached to the device */
|
2012-02-29 04:54:06 +08:00
|
|
|
|
|
|
|
/* dev info */
|
2012-06-14 22:55:02 +08:00
|
|
|
bs_dest->copy_on_read = bs_src->copy_on_read;
|
2012-02-29 04:54:06 +08:00
|
|
|
|
2012-06-14 22:55:02 +08:00
|
|
|
bs_dest->enable_write_cache = bs_src->enable_write_cache;
|
2012-06-06 06:04:51 +08:00
|
|
|
|
2012-06-14 22:55:01 +08:00
|
|
|
/* dirty bitmap */
|
2013-11-13 18:29:43 +08:00
|
|
|
bs_dest->dirty_bitmaps = bs_src->dirty_bitmaps;
|
2015-09-17 18:33:26 +08:00
|
|
|
}
|
2012-06-14 22:55:01 +08:00
|
|
|
|
2015-06-18 20:09:57 +08:00
|
|
|
/*
 * Re-point every parent link of @from at @to, moving one reference from
 * @from to @to per link.  If @from is attached to a BlockBackend, that
 * backend is switched over to @to as well and @to takes @from's place in
 * the device list.
 *
 * None of the parent links may have the child_backing role.
 */
static void change_parent_backing_link(BlockDriverState *from,
                                       BlockDriverState *to)
{
    BdrvChild *child, *next_child;

    /* The _SAFE variant is needed because each child is unlinked from the
     * list that is being walked. */
    QLIST_FOREACH_SAFE(child, &from->parents, next_parent, next_child) {
        assert(child->role != &child_backing);

        child->bs = to;
        QLIST_REMOVE(child, next_parent);
        QLIST_INSERT_HEAD(&to->parents, child, next_parent);

        bdrv_ref(to);
        bdrv_unref(from);
    }

    if (!from->blk) {
        return;
    }

    blk_set_bs(from->blk, to);
    /* Insert @to right before @from unless it is already in the list */
    if (!to->device_list.tqe_prev) {
        QTAILQ_INSERT_BEFORE(from, to, device_list);
    }
    bdrv_device_remove(from);
}
|
|
|
|
|
|
|
|
/*
 * Exchange the feature fields (see bdrv_move_feature_fields()) of
 * @bs_top and @bs_new, and move @bs_top's throttling configuration, if
 * any, over to @bs_new.  @bs_new must not have a throttle state of its
 * own.
 */
static void swap_feature_fields(BlockDriverState *bs_top,
                                BlockDriverState *bs_new)
{
    /* Scratch copy; only the feature fields of it are ever written/read */
    BlockDriverState saved;

    bdrv_move_feature_fields(&saved, bs_top);
    bdrv_move_feature_fields(bs_top, bs_new);
    bdrv_move_feature_fields(bs_new, &saved);

    assert(!bs_new->throttle_state);
    if (!bs_top->throttle_state) {
        return;
    }

    assert(bs_top->io_limits_enabled);
    /* Enable on the new node first, using the group name of the old one,
     * and only then disable limits on the old node. */
    bdrv_io_limits_enable(bs_new, throttle_group_get_name(bs_top));
    bdrv_io_limits_disable(bs_top);
}
|
|
|
|
|
2012-06-14 22:55:02 +08:00
|
|
|
/*
|
|
|
|
* Add new bs contents at the top of an image chain while the chain is
|
|
|
|
* live, while keeping required fields on the top layer.
|
|
|
|
*
|
|
|
|
* This will modify the BlockDriverState fields, and swap contents
|
|
|
|
* between bs_new and bs_top. Both bs_new and bs_top are modified.
|
|
|
|
*
|
2014-10-07 19:59:11 +08:00
|
|
|
* bs_new must not be attached to a BlockBackend.
|
2012-06-14 22:55:02 +08:00
|
|
|
*
|
|
|
|
* This function does not create any image files.
|
2015-06-18 20:09:57 +08:00
|
|
|
*
|
|
|
|
* bdrv_append() takes ownership of a bs_new reference and unrefs it because
|
|
|
|
* that's what the callers commonly need. bs_new will be referenced by the old
|
|
|
|
* parents of bs_top after bdrv_append() returns. If the caller needs to keep a
|
|
|
|
* reference of its own, it must call bdrv_ref().
|
2012-06-14 22:55:02 +08:00
|
|
|
*/
|
|
|
|
void bdrv_append(BlockDriverState *bs_new, BlockDriverState *bs_top)
|
|
|
|
{
|
2015-06-18 20:09:57 +08:00
|
|
|
assert(!bdrv_requests_pending(bs_top));
|
|
|
|
assert(!bdrv_requests_pending(bs_new));
|
|
|
|
|
|
|
|
bdrv_ref(bs_top);
|
|
|
|
change_parent_backing_link(bs_top, bs_new);
|
|
|
|
|
|
|
|
/* Some fields always stay on top of the backing file chain */
|
|
|
|
swap_feature_fields(bs_top, bs_new);
|
|
|
|
|
|
|
|
bdrv_set_backing_hd(bs_new, bs_top);
|
|
|
|
bdrv_unref(bs_top);
|
2012-06-14 22:55:02 +08:00
|
|
|
|
2015-06-18 20:09:57 +08:00
|
|
|
/* bs_new is now referenced by its new parents, we don't need the
|
|
|
|
* additional reference any more. */
|
|
|
|
bdrv_unref(bs_new);
|
2012-02-29 04:54:06 +08:00
|
|
|
}
|
|
|
|
|
2015-09-15 17:58:23 +08:00
|
|
|
/*
 * Make @new take the place of @old: all parents of @old are redirected
 * to @new and, if @old is attached to a BlockBackend, the feature fields
 * of the two nodes are swapped.  Neither node may have pending requests.
 */
void bdrv_replace_in_backing_chain(BlockDriverState *old, BlockDriverState *new)
{
    BlockDriverState *old_backing;

    assert(!bdrv_requests_pending(old));
    assert(!bdrv_requests_pending(new));

    /* Keep @old referenced while its parent links are moved to @new */
    bdrv_ref(old);

    if (old->blk) {
        /* While these fields live in the top-level BlockDriverState
         * rather than in BlockBackend, a BDS cannot have two BBs.
         *
         * What is wanted is a copy of the fields from old to new; a swap
         * is done instead so that no pointer ends up duplicated.
         * (bdrv_swap() used to behave the same way.) */
        assert(!new->blk);
        swap_feature_fields(old, new);
    }
    change_parent_backing_link(old, new);

    /* If a previously independent node is being added to the chain, its
     * backing file has to be set up.  For active commit, top is replaced
     * by its own (indirect) backing file; nothing is done in that case so
     * that no loop is created. */
    old_backing = backing_bs(old);
    if (!new->backing) {
        if (!bdrv_chain_contains(old_backing, new)) {
            bdrv_set_backing_hd(new, old_backing);
            bdrv_set_backing_hd(old, NULL);
        }
    }

    bdrv_unref(old);
}
|
|
|
|
|
2013-08-23 09:14:47 +08:00
|
|
|
/*
 * Close and free @bs.  The node must have no block job, no op blockers
 * and a reference count of zero.
 */
static void bdrv_delete(BlockDriverState *bs)
{
    assert(!bs->job);
    assert(bdrv_op_blocker_is_empty(bs));
    assert(!bs->refcnt);

    bdrv_close(bs);

    /* Unlink from the named lists (if bs is in them) ... */
    bdrv_make_anon(bs);
    /* ... and from the list of all BlockDriverStates */
    QTAILQ_REMOVE(&all_bdrv_states, bs, bs_list);

    g_free(bs);
}
|
|
|
|
|
2009-04-22 07:11:50 +08:00
|
|
|
/*
|
|
|
|
* Run consistency checks on an image
|
|
|
|
*
|
2010-06-29 17:43:13 +08:00
|
|
|
* Returns 0 if the check could be completed (it doesn't mean that the image is
|
2011-04-28 23:20:38 +08:00
|
|
|
* free of errors) or -errno when an internal error occurred. The results of the
|
2010-06-29 17:43:13 +08:00
|
|
|
* check are stored in res.
|
2009-04-22 07:11:50 +08:00
|
|
|
*/
|
2012-05-11 22:07:02 +08:00
|
|
|
int bdrv_check(BlockDriverState *bs, BdrvCheckResult *res, BdrvCheckMode fix)
|
2009-04-22 07:11:50 +08:00
|
|
|
{
|
2014-08-08 04:47:55 +08:00
|
|
|
if (bs->drv == NULL) {
|
|
|
|
return -ENOMEDIUM;
|
|
|
|
}
|
2009-04-22 07:11:50 +08:00
|
|
|
if (bs->drv->bdrv_check == NULL) {
|
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
|
|
|
|
2010-06-29 17:43:13 +08:00
|
|
|
memset(res, 0, sizeof(*res));
|
2012-05-11 22:07:02 +08:00
|
|
|
return bs->drv->bdrv_check(bs, res, fix);
|
2009-04-22 07:11:50 +08:00
|
|
|
}
|
|
|
|
|
2010-07-16 23:17:01 +08:00
|
|
|
#define COMMIT_BUF_SECTORS 2048
|
|
|
|
|
2003-07-07 01:15:21 +08:00
|
|
|
/* commit COW file into the raw image */
|
|
|
|
int bdrv_commit(BlockDriverState *bs)
|
|
|
|
{
|
2006-08-19 19:45:59 +08:00
|
|
|
BlockDriver *drv = bs->drv;
|
2014-01-24 22:02:35 +08:00
|
|
|
int64_t sector, total_sectors, length, backing_length;
|
2010-07-16 23:17:01 +08:00
|
|
|
int n, ro, open_flags;
|
2012-09-21 03:13:34 +08:00
|
|
|
int ret = 0;
|
2014-01-24 22:02:35 +08:00
|
|
|
uint8_t *buf = NULL;
|
2003-07-07 01:15:21 +08:00
|
|
|
|
2006-08-19 19:45:59 +08:00
|
|
|
if (!drv)
|
|
|
|
return -ENOMEDIUM;
|
2014-09-01 13:35:21 +08:00
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
if (!bs->backing) {
|
2010-02-14 19:39:18 +08:00
|
|
|
return -ENOTSUP;
|
2003-07-07 01:15:21 +08:00
|
|
|
}
|
|
|
|
|
2014-09-11 13:14:00 +08:00
|
|
|
if (bdrv_op_is_blocked(bs, BLOCK_OP_TYPE_COMMIT_SOURCE, NULL) ||
|
2015-06-17 20:55:21 +08:00
|
|
|
bdrv_op_is_blocked(bs->backing->bs, BLOCK_OP_TYPE_COMMIT_TARGET, NULL)) {
|
2012-01-18 22:40:41 +08:00
|
|
|
return -EBUSY;
|
|
|
|
}
|
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
ro = bs->backing->bs->read_only;
|
|
|
|
open_flags = bs->backing->bs->open_flags;
|
2010-02-14 19:39:18 +08:00
|
|
|
|
|
|
|
if (ro) {
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bdrv_reopen(bs->backing->bs, open_flags | BDRV_O_RDWR, NULL)) {
|
2012-09-21 03:13:34 +08:00
|
|
|
return -EACCES;
|
2010-02-14 19:39:18 +08:00
|
|
|
}
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
2003-07-07 01:15:21 +08:00
|
|
|
|
2014-01-24 22:02:35 +08:00
|
|
|
length = bdrv_getlength(bs);
|
|
|
|
if (length < 0) {
|
|
|
|
ret = length;
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
backing_length = bdrv_getlength(bs->backing->bs);
|
2014-01-24 22:02:35 +08:00
|
|
|
if (backing_length < 0) {
|
|
|
|
ret = backing_length;
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If our top snapshot is larger than the backing file image,
|
|
|
|
* grow the backing file image if possible. If not possible,
|
|
|
|
* we must return an error */
|
|
|
|
if (length > backing_length) {
|
2015-06-17 20:55:21 +08:00
|
|
|
ret = bdrv_truncate(bs->backing->bs, length);
|
2014-01-24 22:02:35 +08:00
|
|
|
if (ret < 0) {
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
total_sectors = length >> BDRV_SECTOR_BITS;
|
2014-05-20 19:16:51 +08:00
|
|
|
|
|
|
|
/* qemu_try_blockalign() for bs will choose an alignment that works for
|
2015-06-17 20:55:21 +08:00
|
|
|
* bs->backing->bs as well, so no need to compare the alignment manually. */
|
2014-05-20 19:16:51 +08:00
|
|
|
buf = qemu_try_blockalign(bs, COMMIT_BUF_SECTORS * BDRV_SECTOR_SIZE);
|
|
|
|
if (buf == NULL) {
|
|
|
|
ret = -ENOMEM;
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
2010-07-16 23:17:01 +08:00
|
|
|
|
|
|
|
for (sector = 0; sector < total_sectors; sector += n) {
|
2013-09-05 01:00:25 +08:00
|
|
|
ret = bdrv_is_allocated(bs, sector, COMMIT_BUF_SECTORS, &n);
|
|
|
|
if (ret < 0) {
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
|
|
|
if (ret) {
|
2014-01-24 21:00:43 +08:00
|
|
|
ret = bdrv_read(bs, sector, buf, n);
|
|
|
|
if (ret < 0) {
|
2010-07-16 23:17:01 +08:00
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
ret = bdrv_write(bs->backing->bs, sector, buf, n);
|
2014-01-24 21:00:43 +08:00
|
|
|
if (ret < 0) {
|
2010-07-16 23:17:01 +08:00
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
2004-08-02 05:59:26 +08:00
|
|
|
}
|
2003-07-07 01:15:21 +08:00
|
|
|
}
|
2005-12-19 02:28:15 +08:00
|
|
|
|
2010-01-17 19:32:30 +08:00
|
|
|
if (drv->bdrv_make_empty) {
|
|
|
|
ret = drv->bdrv_make_empty(bs);
|
2014-01-24 21:00:43 +08:00
|
|
|
if (ret < 0) {
|
|
|
|
goto ro_cleanup;
|
|
|
|
}
|
2010-01-17 19:32:30 +08:00
|
|
|
bdrv_flush(bs);
|
|
|
|
}
|
2005-12-19 02:28:15 +08:00
|
|
|
|
2010-01-12 20:49:23 +08:00
|
|
|
/*
|
|
|
|
* Make sure all data we wrote to the backing device is actually
|
|
|
|
* stable on disk.
|
|
|
|
*/
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bs->backing) {
|
|
|
|
bdrv_flush(bs->backing->bs);
|
2014-01-24 21:00:43 +08:00
|
|
|
}
|
2010-02-14 19:39:18 +08:00
|
|
|
|
2014-01-24 21:00:43 +08:00
|
|
|
ret = 0;
|
2010-02-14 19:39:18 +08:00
|
|
|
ro_cleanup:
|
2014-05-20 19:16:51 +08:00
|
|
|
qemu_vfree(buf);
|
2010-02-14 19:39:18 +08:00
|
|
|
|
|
|
|
if (ro) {
|
2012-09-21 03:13:34 +08:00
|
|
|
/* ignoring error return here */
|
2015-06-17 20:55:21 +08:00
|
|
|
bdrv_reopen(bs->backing->bs, open_flags & ~BDRV_O_RDWR, NULL);
|
2010-02-14 19:39:18 +08:00
|
|
|
}
|
|
|
|
|
2010-01-17 19:32:30 +08:00
|
|
|
return ret;
|
2003-07-07 01:15:21 +08:00
|
|
|
}
|
|
|
|
|
2012-03-06 02:10:11 +08:00
|
|
|
int bdrv_commit_all(void)
|
2010-06-03 00:55:18 +08:00
|
|
|
{
|
|
|
|
BlockDriverState *bs;
|
|
|
|
|
2014-01-24 04:31:32 +08:00
|
|
|
QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
|
2014-05-08 22:34:35 +08:00
|
|
|
AioContext *aio_context = bdrv_get_aio_context(bs);
|
|
|
|
|
|
|
|
aio_context_acquire(aio_context);
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bs->drv && bs->backing) {
|
2013-02-26 22:55:48 +08:00
|
|
|
int ret = bdrv_commit(bs);
|
|
|
|
if (ret < 0) {
|
2014-05-08 22:34:35 +08:00
|
|
|
aio_context_release(aio_context);
|
2013-02-26 22:55:48 +08:00
|
|
|
return ret;
|
|
|
|
}
|
2012-03-06 02:10:11 +08:00
|
|
|
}
|
2014-05-08 22:34:35 +08:00
|
|
|
aio_context_release(aio_context);
|
2010-06-03 00:55:18 +08:00
|
|
|
}
|
2012-03-06 02:10:11 +08:00
|
|
|
return 0;
|
2010-06-03 00:55:18 +08:00
|
|
|
}
|
|
|
|
|
2010-01-12 19:55:17 +08:00
|
|
|
/*
|
|
|
|
* Return values:
|
|
|
|
* 0 - success
|
|
|
|
* -EINVAL - backing format specified, but no file
|
|
|
|
* -ENOSPC - can't update the backing file because no space is left in the
|
|
|
|
* image file header
|
|
|
|
* -ENOTSUP - format driver doesn't support changing the backing file
|
|
|
|
*/
|
|
|
|
int bdrv_change_backing_file(BlockDriverState *bs,
|
|
|
|
const char *backing_file, const char *backing_fmt)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
2012-04-12 20:01:02 +08:00
|
|
|
int ret;
|
2010-01-12 19:55:17 +08:00
|
|
|
|
2012-04-12 20:01:01 +08:00
|
|
|
/* Backing file format doesn't make sense without a backing file */
|
|
|
|
if (backing_fmt && !backing_file) {
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
2010-01-12 19:55:17 +08:00
|
|
|
if (drv->bdrv_change_backing_file != NULL) {
|
2012-04-12 20:01:02 +08:00
|
|
|
ret = drv->bdrv_change_backing_file(bs, backing_file, backing_fmt);
|
2010-01-12 19:55:17 +08:00
|
|
|
} else {
|
2012-04-12 20:01:02 +08:00
|
|
|
ret = -ENOTSUP;
|
2010-01-12 19:55:17 +08:00
|
|
|
}
|
2012-04-12 20:01:02 +08:00
|
|
|
|
|
|
|
if (ret == 0) {
|
|
|
|
pstrcpy(bs->backing_file, sizeof(bs->backing_file), backing_file ?: "");
|
|
|
|
pstrcpy(bs->backing_format, sizeof(bs->backing_format), backing_fmt ?: "");
|
|
|
|
}
|
|
|
|
return ret;
|
2010-01-12 19:55:17 +08:00
|
|
|
}
|
|
|
|
|
2012-09-28 01:29:12 +08:00
|
|
|
/*
|
|
|
|
* Finds the image layer in the chain that has 'bs' as its backing file.
|
|
|
|
*
|
|
|
|
* active is the current topmost image.
|
|
|
|
*
|
|
|
|
* Returns NULL if bs is not found in active's image chain,
|
|
|
|
* or if active == bs.
|
2014-06-26 03:35:26 +08:00
|
|
|
*
|
|
|
|
* Returns the bottommost base image if bs == NULL.
|
2012-09-28 01:29:12 +08:00
|
|
|
*/
|
|
|
|
BlockDriverState *bdrv_find_overlay(BlockDriverState *active,
|
|
|
|
BlockDriverState *bs)
|
|
|
|
{
|
2015-06-17 20:55:21 +08:00
|
|
|
while (active && bs != backing_bs(active)) {
|
|
|
|
active = backing_bs(active);
|
2012-09-28 01:29:12 +08:00
|
|
|
}
|
|
|
|
|
2014-06-26 03:35:26 +08:00
|
|
|
return active;
|
|
|
|
}
|
2012-09-28 01:29:12 +08:00
|
|
|
|
2014-06-26 03:35:26 +08:00
|
|
|
/* Given a BDS, searches for the base layer. */
|
|
|
|
BlockDriverState *bdrv_find_base(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
return bdrv_find_overlay(bs, NULL);
|
2012-09-28 01:29:12 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Drops images above 'base' up to and including 'top', and sets the image
|
|
|
|
* above 'top' to have base as its backing file.
|
|
|
|
*
|
|
|
|
* Requires that the overlay to 'top' is opened r/w, so that the backing file
|
|
|
|
* information in 'bs' can be properly updated.
|
|
|
|
*
|
|
|
|
* E.g., this will convert the following chain:
|
|
|
|
* bottom <- base <- intermediate <- top <- active
|
|
|
|
*
|
|
|
|
* to
|
|
|
|
*
|
|
|
|
* bottom <- base <- active
|
|
|
|
*
|
|
|
|
* It is allowed for bottom==base, in which case it converts:
|
|
|
|
*
|
|
|
|
* base <- intermediate <- top <- active
|
|
|
|
*
|
|
|
|
* to
|
|
|
|
*
|
|
|
|
* base <- active
|
|
|
|
*
|
block: extend block-commit to accept a string for the backing file
On some image chains, QEMU may not always be able to resolve the
filenames properly, when updating the backing file of an image
after a block commit.
For instance, certain relative pathnames may fail, or drives may
have been specified originally by file descriptor (e.g. /dev/fd/???),
or a relative protocol pathname may have been used.
In these instances, QEMU may lack the information to be able to make
the correct choice, but the user or management layer most likely does
have that knowledge.
With this extension to the block-commit api, the user is able to change
the backing file of the overlay image as part of the block-commit
operation.
This allows the change to be 'safe', in the sense that if the attempt
to write the overlay image metadata fails, then the block-commit
operation returns failure, without disrupting the guest.
If the commit top is the active layer, then specifying the backing
file string will be treated as an error (there is no overlay image
to modify in that case).
If a backing file string is not specified in the command, the backing
file string to use is determined in the same manner as it was
previously.
Reviewed-by: Eric Blake <eblake@redhat.com>
Signed-off-by: Jeff Cody <jcody@redhat.com>
Reviewed-by: Kevin Wolf <kwolf@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
2014-06-26 03:40:10 +08:00
|
|
|
* If backing_file_str is non-NULL, it will be used when modifying top's
|
|
|
|
* overlay image metadata.
|
|
|
|
*
|
2012-09-28 01:29:12 +08:00
|
|
|
* Error conditions:
|
|
|
|
* if active == top, that is considered an error
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
int bdrv_drop_intermediate(BlockDriverState *active, BlockDriverState *top,
|
block: extend block-commit to accept a string for the backing file
On some image chains, QEMU may not always be able to resolve the
filenames properly, when updating the backing file of an image
after a block commit.
For instance, certain relative pathnames may fail, or drives may
have been specified originally by file descriptor (e.g. /dev/fd/???),
or a relative protocol pathname may have been used.
In these instances, QEMU may lack the information to be able to make
the correct choice, but the user or management layer most likely does
have that knowledge.
With this extension to the block-commit api, the user is able to change
the backing file of the overlay image as part of the block-commit
operation.
This allows the change to be 'safe', in the sense that if the attempt
to write the overlay image metadata fails, then the block-commit
operation returns failure, without disrupting the guest.
If the commit top is the active layer, then specifying the backing
file string will be treated as an error (there is no overlay image
to modify in that case).
If a backing file string is not specified in the command, the backing
file string to use is determined in the same manner as it was
previously.
Reviewed-by: Eric Blake <eblake@redhat.com>
Signed-off-by: Jeff Cody <jcody@redhat.com>
Reviewed-by: Kevin Wolf <kwolf@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
2014-06-26 03:40:10 +08:00
|
|
|
BlockDriverState *base, const char *backing_file_str)
|
2012-09-28 01:29:12 +08:00
|
|
|
{
|
|
|
|
BlockDriverState *new_top_bs = NULL;
|
|
|
|
int ret = -EIO;
|
|
|
|
|
|
|
|
if (!top->drv || !base->drv) {
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
|
|
|
new_top_bs = bdrv_find_overlay(active, top);
|
|
|
|
|
|
|
|
if (new_top_bs == NULL) {
|
|
|
|
/* we could not find the image above 'top', this is an error */
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
/* special case of new_top_bs->backing->bs already pointing to base - nothing
|
2012-09-28 01:29:12 +08:00
|
|
|
* to do, no intermediate images */
|
2015-06-17 20:55:21 +08:00
|
|
|
if (backing_bs(new_top_bs) == base) {
|
2012-09-28 01:29:12 +08:00
|
|
|
ret = 0;
|
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
2015-09-14 21:33:33 +08:00
|
|
|
/* Make sure that base is in the backing chain of top */
|
|
|
|
if (!bdrv_chain_contains(top, base)) {
|
2012-09-28 01:29:12 +08:00
|
|
|
goto exit;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* success - we can delete the intermediate states, and link top->base */
|
2015-09-14 21:33:33 +08:00
|
|
|
backing_file_str = backing_file_str ? backing_file_str : base->filename;
|
block: extend block-commit to accept a string for the backing file
On some image chains, QEMU may not always be able to resolve the
filenames properly, when updating the backing file of an image
after a block commit.
For instance, certain relative pathnames may fail, or drives may
have been specified originally by file descriptor (e.g. /dev/fd/???),
or a relative protocol pathname may have been used.
In these instances, QEMU may lack the information to be able to make
the correct choice, but the user or management layer most likely does
have that knowledge.
With this extension to the block-commit api, the user is able to change
the backing file of the overlay image as part of the block-commit
operation.
This allows the change to be 'safe', in the sense that if the attempt
to write the overlay image metadata fails, then the block-commit
operation returns failure, without disrupting the guest.
If the commit top is the active layer, then specifying the backing
file string will be treated as an error (there is no overlay image
to modify in that case).
If a backing file string is not specified in the command, the backing
file string to use is determined in the same manner as it was
previously.
Reviewed-by: Eric Blake <eblake@redhat.com>
Signed-off-by: Jeff Cody <jcody@redhat.com>
Reviewed-by: Kevin Wolf <kwolf@redhat.com>
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
2014-06-26 03:40:10 +08:00
|
|
|
ret = bdrv_change_backing_file(new_top_bs, backing_file_str,
|
2015-09-14 21:33:33 +08:00
|
|
|
base->drv ? base->drv->format_name : "");
|
2012-09-28 01:29:12 +08:00
|
|
|
if (ret) {
|
|
|
|
goto exit;
|
|
|
|
}
|
2015-09-14 21:33:33 +08:00
|
|
|
bdrv_set_backing_hd(new_top_bs, base);
|
2012-09-28 01:29:12 +08:00
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
exit:
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/**
|
|
|
|
* Truncate file to 'offset' bytes (needed only for file protocols)
|
|
|
|
*/
|
|
|
|
int bdrv_truncate(BlockDriverState *bs, int64_t offset)
|
2009-03-04 01:37:16 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
int ret;
|
|
|
|
if (!drv)
|
2009-03-04 01:37:16 +08:00
|
|
|
return -ENOMEDIUM;
|
2015-04-28 21:27:52 +08:00
|
|
|
if (!drv->bdrv_truncate)
|
|
|
|
return -ENOTSUP;
|
|
|
|
if (bs->read_only)
|
|
|
|
return -EACCES;
|
2009-03-04 01:37:16 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
ret = drv->bdrv_truncate(bs, offset);
|
|
|
|
if (ret == 0) {
|
|
|
|
ret = refresh_total_sectors(bs, offset >> BDRV_SECTOR_BITS);
|
|
|
|
bdrv_dirty_bitmap_truncate(bs);
|
|
|
|
if (bs->blk) {
|
|
|
|
blk_dev_resize_cb(bs->blk);
|
|
|
|
}
|
2015-02-06 02:58:24 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
return ret;
|
2009-03-04 01:37:16 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/**
|
|
|
|
* Length of a allocated file in bytes. Sparse files are counted by actual
|
|
|
|
* allocated space. Return < 0 if error or unknown.
|
|
|
|
*/
|
|
|
|
int64_t bdrv_get_allocated_file_size(BlockDriverState *bs)
|
2009-03-04 01:37:16 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
if (!drv) {
|
|
|
|
return -ENOMEDIUM;
|
2014-03-26 20:06:02 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
if (drv->bdrv_get_allocated_file_size) {
|
|
|
|
return drv->bdrv_get_allocated_file_size(bs);
|
|
|
|
}
|
|
|
|
if (bs->file) {
|
2015-06-16 20:19:22 +08:00
|
|
|
return bdrv_get_allocated_file_size(bs->file->bs);
|
2011-10-13 20:08:22 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
return -ENOTSUP;
|
2011-10-13 20:08:22 +08:00
|
|
|
}
|
2011-07-15 22:05:00 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/**
|
|
|
|
* Return number of sectors on success, -errno on error.
|
2011-10-13 20:08:22 +08:00
|
|
|
*/
|
2015-04-28 21:27:52 +08:00
|
|
|
int64_t bdrv_nb_sectors(BlockDriverState *bs)
|
2011-10-13 20:08:22 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDriver *drv = bs->drv;
|
2012-04-02 18:59:34 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (!drv)
|
|
|
|
return -ENOMEDIUM;
|
2014-05-08 22:34:34 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (drv->has_variable_length) {
|
|
|
|
int ret = refresh_total_sectors(bs, bs->total_sectors);
|
|
|
|
if (ret < 0) {
|
|
|
|
return ret;
|
2011-10-13 20:08:22 +08:00
|
|
|
}
|
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
return bs->total_sectors;
|
2011-10-13 20:08:22 +08:00
|
|
|
}
|
2004-03-15 05:38:54 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/**
|
|
|
|
* Return length in bytes on success, -errno on error.
|
|
|
|
* The length is always a multiple of BDRV_SECTOR_SIZE.
|
2013-04-06 03:27:55 +08:00
|
|
|
*/
|
2015-04-28 21:27:52 +08:00
|
|
|
int64_t bdrv_getlength(BlockDriverState *bs)
|
2013-04-06 03:27:55 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
int64_t ret = bdrv_nb_sectors(bs);
|
2013-04-06 03:27:55 +08:00
|
|
|
|
2015-05-15 16:36:05 +08:00
|
|
|
ret = ret > INT64_MAX / BDRV_SECTOR_SIZE ? -EFBIG : ret;
|
2015-04-28 21:27:52 +08:00
|
|
|
return ret < 0 ? ret : ret * BDRV_SECTOR_SIZE;
|
2003-06-30 18:03:06 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* return 0 as number of sectors if no device present or error */
|
|
|
|
void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
|
2012-06-29 23:34:29 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
int64_t nb_sectors = bdrv_nb_sectors(bs);
|
2012-06-29 23:34:29 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
*nb_sectors_ptr = nb_sectors < 0 ? 0 : nb_sectors;
|
2012-06-29 23:34:29 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return the read_only field of @bs. */
int bdrv_is_read_only(BlockDriverState *bs)
{
    int read_only = bs->read_only;

    return read_only;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return the sg field of @bs. */
int bdrv_is_sg(BlockDriverState *bs)
{
    int sg = bs->sg;

    return sg;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return the enable_write_cache field of @bs. */
int bdrv_enable_write_cache(BlockDriverState *bs)
{
    int wce = bs->enable_write_cache;

    return wce;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Set the write cache mode of @bs to @wce and keep BDRV_O_CACHE_WB in
 * bs->open_flags in sync with it.
 */
void bdrv_set_enable_write_cache(BlockDriverState *bs, bool wce)
{
    bs->enable_write_cache = wce;

    /* Mirror the setting in the open flags so a reopen() preserves wce */
    bs->open_flags = wce ? (bs->open_flags | BDRV_O_CACHE_WB)
                         : (bs->open_flags & ~BDRV_O_CACHE_WB);
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return 1 if the backing image of @bs is encrypted; otherwise return
 * the encrypted field of @bs itself. */
int bdrv_is_encrypted(BlockDriverState *bs)
{
    BdrvChild *backing = bs->backing;

    if (backing) {
        if (backing->bs->encrypted) {
            return 1;
        }
    }

    return bs->encrypted;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return non-zero if a key still has to be supplied: either the immediate
 * backing node or @bs itself is encrypted and has no valid key yet.
 */
int bdrv_key_required(BlockDriverState *bs)
{
    if (bs->backing) {
        BlockDriverState *backing_bs = bs->backing->bs;

        if (backing_bs->encrypted && !backing_bs->valid_key) {
            return 1;
        }
    }

    return bs->encrypted && !bs->valid_key;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Hand @key to the driver of @bs and, first, to an encrypted backing node.
 *
 * Returns:
 *   a negative value from the backing node's bdrv_set_key() if that fails;
 *   0 if only the backing node is encrypted and it accepted the key;
 *   -EINVAL if @bs is not encrypted;
 *   -ENOMEDIUM if @bs has no driver or the driver has no bdrv_set_key;
 *   otherwise the result of the driver's bdrv_set_key callback.
 *
 * bs->valid_key is cleared when the driver rejects the key.  When the key
 * becomes valid for the first time and a BlockBackend is attached, the
 * media change callback is invoked.
 */
int bdrv_set_key(BlockDriverState *bs, const char *key)
{
    BdrvChild *backing = bs->backing;
    int ret;

    if (backing && backing->bs->encrypted) {
        ret = bdrv_set_key(backing->bs, key);
        if (ret < 0) {
            return ret;
        }
        if (!bs->encrypted) {
            return 0;
        }
    }

    if (!bs->encrypted) {
        return -EINVAL;
    }
    if (!bs->drv || !bs->drv->bdrv_set_key) {
        return -ENOMEDIUM;
    }

    ret = bs->drv->bdrv_set_key(bs, key);
    if (ret < 0) {
        bs->valid_key = 0;
        return ret;
    }

    if (!bs->valid_key) {
        bs->valid_key = 1;
        if (bs->blk) {
            /* call the change callback now, we skipped it on open */
            blk_dev_change_media_cb(bs->blk, true);
        }
    }

    return ret;
}
|
2012-02-07 21:27:25 +08:00
|
|
|
|
2011-10-06 00:17:03 +08:00
|
|
|
/*
|
2015-04-28 21:27:52 +08:00
|
|
|
* Provide an encryption key for @bs.
|
|
|
|
* If @key is non-null:
|
|
|
|
* If @bs is not encrypted, fail.
|
|
|
|
* Else if the key is invalid, fail.
|
|
|
|
* Else set @bs's key to @key, replacing the existing key, if any.
|
|
|
|
* If @key is null:
|
|
|
|
* If @bs is encrypted and still lacks a key, fail.
|
|
|
|
* Else do nothing.
|
|
|
|
* On failure, store an error object through @errp if non-null.
|
2011-10-06 00:17:03 +08:00
|
|
|
*/
|
2015-04-28 21:27:52 +08:00
|
|
|
void bdrv_add_key(BlockDriverState *bs, const char *key, Error **errp)
|
2011-10-06 00:17:03 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
if (key) {
|
|
|
|
if (!bdrv_is_encrypted(bs)) {
|
|
|
|
error_setg(errp, "Node '%s' is not encrypted",
|
|
|
|
bdrv_get_device_or_node_name(bs));
|
|
|
|
} else if (bdrv_set_key(bs, key) < 0) {
|
2015-03-17 18:54:50 +08:00
|
|
|
error_setg(errp, QERR_INVALID_PASSWORD);
|
2015-01-29 17:37:00 +08:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if (bdrv_key_required(bs)) {
|
2015-01-29 17:37:01 +08:00
|
|
|
error_set(errp, ERROR_CLASS_DEVICE_ENCRYPTED,
|
|
|
|
"'%s' (%s) is encrypted",
|
2015-04-08 17:29:19 +08:00
|
|
|
bdrv_get_device_or_node_name(bs),
|
2015-01-29 17:37:00 +08:00
|
|
|
bdrv_get_encrypted_filename(bs));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the format name of the driver attached to @bs, or NULL if @bs has
 * no driver.
 */
const char *bdrv_get_format_name(BlockDriverState *bs)
{
    if (!bs->drv) {
        return NULL;
    }

    return bs->drv->format_name;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * qsort() comparison callback for an array of C strings.
 *
 * qsort() passes pointers to the array *elements*, so @a and @b each point
 * to a 'const char *' and must be dereferenced once before being handed to
 * strcmp().  Passing them to strcmp() directly would compare the raw bytes
 * of the pointers instead of the strings.
 *
 * Returns a value less than, equal to, or greater than zero, as strcmp()
 * does for the two strings.
 */
static int qsort_strcmp(const void *a, const void *b)
{
    const char *const *lhs = a;
    const char *const *rhs = b;

    return strcmp(*lhs, *rhs);
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
|
|
|
|
void *opaque)
|
2009-09-09 23:53:37 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDriver *drv;
|
|
|
|
int count = 0;
|
|
|
|
int i;
|
|
|
|
const char **formats = NULL;
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
QLIST_FOREACH(drv, &bdrv_drivers, list) {
|
|
|
|
if (drv->format_name) {
|
|
|
|
bool found = false;
|
|
|
|
int i = count;
|
|
|
|
while (formats && i && !found) {
|
|
|
|
found = !strcmp(formats[--i], drv->format_name);
|
|
|
|
}
|
2010-01-26 21:49:08 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (!found) {
|
|
|
|
formats = g_renew(const char *, formats, count + 1);
|
|
|
|
formats[count++] = drv->format_name;
|
|
|
|
}
|
2014-10-27 17:18:46 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
}
|
2014-10-27 17:18:46 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
qsort(formats, count, sizeof(formats[0]), qsort_strcmp);
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
for (i = 0; i < count; i++) {
|
|
|
|
it(opaque, formats[i]);
|
|
|
|
}
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
g_free(formats);
|
|
|
|
}
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* This function is to find a node in the bs graph */
|
|
|
|
BlockDriverState *bdrv_find_node(const char *node_name)
|
|
|
|
{
|
|
|
|
BlockDriverState *bs;
|
2014-07-30 16:53:30 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
assert(node_name);
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
|
|
|
|
if (!strcmp(node_name, bs->node_name)) {
|
|
|
|
return bs;
|
2009-09-09 23:53:37 +08:00
|
|
|
}
|
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
return NULL;
|
2009-09-09 23:53:37 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Put this QMP function here so it can access the static graph_bdrv_states. */
|
|
|
|
BlockDeviceInfoList *bdrv_named_nodes_list(Error **errp)
|
2009-09-09 23:53:37 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDeviceInfoList *list, *entry;
|
|
|
|
BlockDriverState *bs;
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
list = NULL;
|
|
|
|
QTAILQ_FOREACH(bs, &graph_bdrv_states, node_list) {
|
|
|
|
BlockDeviceInfo *info = bdrv_block_device_info(bs, errp);
|
|
|
|
if (!info) {
|
|
|
|
qapi_free_BlockDeviceInfoList(list);
|
|
|
|
return NULL;
|
2011-03-08 00:01:04 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
entry = g_malloc0(sizeof(*entry));
|
|
|
|
entry->value = info;
|
|
|
|
entry->next = list;
|
|
|
|
list = entry;
|
2011-03-08 00:01:04 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
return list;
|
|
|
|
}
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
BlockDriverState *bdrv_lookup_bs(const char *device,
|
|
|
|
const char *node_name,
|
|
|
|
Error **errp)
|
|
|
|
{
|
|
|
|
BlockBackend *blk;
|
|
|
|
BlockDriverState *bs;
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (device) {
|
|
|
|
blk = blk_by_name(device);
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (blk) {
|
2015-10-26 22:46:49 +08:00
|
|
|
bs = blk_bs(blk);
|
|
|
|
if (!bs) {
|
2015-10-19 23:53:29 +08:00
|
|
|
error_setg(errp, "Device '%s' has no medium", device);
|
|
|
|
}
|
|
|
|
|
2015-10-26 22:46:49 +08:00
|
|
|
return bs;
|
2015-04-28 21:27:52 +08:00
|
|
|
}
|
|
|
|
}
|
2009-09-09 23:53:37 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (node_name) {
|
|
|
|
bs = bdrv_find_node(node_name);
|
2010-05-23 01:15:08 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (bs) {
|
|
|
|
return bs;
|
|
|
|
}
|
2009-09-09 23:53:37 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
error_setg(errp, "Cannot find device=%s nor node_name=%s",
|
|
|
|
device ? device : "",
|
|
|
|
node_name ? node_name : "");
|
|
|
|
return NULL;
|
2009-09-09 23:53:37 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* If 'base' is in the same chain as 'top', return true. Otherwise,
|
|
|
|
* return false. If either argument is NULL, return false. */
|
|
|
|
bool bdrv_chain_contains(BlockDriverState *top, BlockDriverState *base)
|
2006-08-02 00:21:11 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
while (top && top != base) {
|
2015-06-17 20:55:21 +08:00
|
|
|
top = backing_bs(top);
|
2014-09-11 13:41:09 +08:00
|
|
|
}
|
2015-04-28 21:27:52 +08:00
|
|
|
|
|
|
|
return top != NULL;
|
2014-09-11 13:41:09 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Iterate over graph_bdrv_states: a NULL @bs yields the first node, any
 * other @bs yields the node following it on node_list.
 */
BlockDriverState *bdrv_next_node(BlockDriverState *bs)
{
    return bs ? QTAILQ_NEXT(bs, node_list)
              : QTAILQ_FIRST(&graph_bdrv_states);
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Iterate over bdrv_states: a NULL @bs yields the first entry, any other
 * @bs yields the entry following it on device_list.
 */
BlockDriverState *bdrv_next(BlockDriverState *bs)
{
    return bs ? QTAILQ_NEXT(bs, device_list)
              : QTAILQ_FIRST(&bdrv_states);
}
|
2006-06-27 04:08:57 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
const char *bdrv_get_node_name(const BlockDriverState *bs)
|
2006-08-02 00:21:11 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
return bs->node_name;
|
2006-06-27 04:08:57 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* TODO check what callers really want: bs->node_name or blk_name() */
|
|
|
|
const char *bdrv_get_device_name(const BlockDriverState *bs)
|
2006-06-27 04:08:57 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
return bs->blk ? blk_name(bs->blk) : "";
|
2009-04-08 02:43:24 +08:00
|
|
|
}
|
2006-08-02 00:21:11 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* This can be used to identify nodes that might not have a device
|
|
|
|
* name associated. Since node and device names live in the same
|
|
|
|
* namespace, the result is unambiguous. The exception is if both are
|
|
|
|
* absent, then this returns an empty (non-null) string. */
|
|
|
|
const char *bdrv_get_device_or_node_name(const BlockDriverState *bs)
|
2009-04-08 02:43:24 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
return bs->blk ? blk_name(bs->blk) : bs->node_name;
|
2006-06-27 04:08:57 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return the open_flags field of @bs. */
int bdrv_get_flags(BlockDriverState *bs)
{
    return bs->open_flags;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Always return 1, regardless of @bs.  The signature matches the driver
 * bdrv_has_zero_init callback as invoked by bdrv_has_zero_init().
 */
int bdrv_has_zero_init_1(BlockDriverState *bs)
{
    return 1;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the driver's answer on whether @bs reads as zeroes after creation.
 *
 * @bs must have a driver.  Returns 0 if @bs has a backing file or if the
 * driver provides no bdrv_has_zero_init callback.
 */
int bdrv_has_zero_init(BlockDriverState *bs)
{
    assert(bs->drv);

    /* If BS is a copy on write image, it is initialized to
       the contents of the base image, which may not be zeroes.  */
    if (bs->backing) {
        return 0;
    }

    if (!bs->drv->bdrv_has_zero_init) {
        /* safe default */
        return 0;
    }

    return bs->drv->bdrv_has_zero_init(bs);
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the unallocated_blocks_are_zero flag reported by bdrv_get_info().
 *
 * Returns false if @bs has a backing file (bdrv_get_info() is not called in
 * that case) or if bdrv_get_info() fails.
 */
bool bdrv_unallocated_blocks_are_zero(BlockDriverState *bs)
{
    BlockDriverInfo bdi;

    if (bs->backing || bdrv_get_info(bs, &bdi) != 0) {
        return false;
    }

    return bdi.unallocated_blocks_are_zero;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the can_write_zeroes_with_unmap flag reported by bdrv_get_info().
 *
 * Returns false if @bs has a backing file, if BDRV_O_UNMAP is not set in
 * its open flags, or if bdrv_get_info() fails.
 */
bool bdrv_can_write_zeroes_with_unmap(BlockDriverState *bs)
{
    BlockDriverInfo bdi;

    if (bs->backing || !(bs->open_flags & BDRV_O_UNMAP)) {
        return false;
    }

    if (bdrv_get_info(bs, &bdi) != 0) {
        return false;
    }

    return bdi.can_write_zeroes_with_unmap;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the file name of the encrypted image associated with @bs:
 * bs->backing_file if the immediate backing node is encrypted, else
 * bs->filename if @bs itself is encrypted, else NULL.
 */
const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
{
    if (bs->backing && bs->backing->bs->encrypted) {
        return bs->backing_file;
    }

    if (bs->encrypted) {
        return bs->filename;
    }

    return NULL;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Copy bs->backing_file into @filename using pstrcpy(), with
 * @filename_size as the destination buffer size.
 */
void bdrv_get_backing_filename(BlockDriverState *bs,
                               char *filename, int filename_size)
{
    pstrcpy(filename, filename_size, bs->backing_file);
}
|
2012-11-13 23:35:08 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Fill *@bdi with information from the driver of @bs.
 *
 * Returns -ENOMEDIUM if @bs has no driver and -ENOTSUP if the driver has no
 * bdrv_get_info callback; *@bdi is left untouched in both cases.  Otherwise
 * *@bdi is zeroed first and the callback's return value is passed on.
 */
int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
{
    BlockDriver *drv = bs->drv;

    if (!drv) {
        return -ENOMEDIUM;
    }
    if (!drv->bdrv_get_info) {
        return -ENOTSUP;
    }

    memset(bdi, 0, sizeof(*bdi));
    return drv->bdrv_get_info(bs, bdi);
}
|
2010-05-26 23:51:49 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Return the result of the driver's bdrv_get_specific_info callback, or
 * NULL if @bs has no driver or the driver does not implement it.
 */
ImageInfoSpecific *bdrv_get_specific_info(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;

    if (!drv || !drv->bdrv_get_specific_info) {
        return NULL;
    }

    return drv->bdrv_get_specific_info(bs);
}
|
|
|
|
|
2015-11-18 16:52:54 +08:00
|
|
|
/*
 * Forward @event to the driver's bdrv_debug_event callback.  Does nothing
 * if @bs is NULL, has no driver, or the driver has no such callback.
 */
void bdrv_debug_event(BlockDriverState *bs, BlkdebugEvent event)
{
    if (bs && bs->drv && bs->drv->bdrv_debug_event) {
        bs->drv->bdrv_debug_event(bs, event);
    }
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Starting at @bs and descending through bs->file, find the first node
 * whose driver implements bdrv_debug_breakpoint and call it with @event
 * and @tag.
 *
 * The walk stops at a NULL node or a node without a driver.  Returns the
 * callback's result, or -ENOTSUP if no node implements it.
 */
int bdrv_debug_breakpoint(BlockDriverState *bs, const char *event,
                          const char *tag)
{
    for (; bs && bs->drv; bs = bs->file ? bs->file->bs : NULL) {
        if (bs->drv->bdrv_debug_breakpoint) {
            return bs->drv->bdrv_debug_breakpoint(bs, event, tag);
        }
    }

    return -ENOTSUP;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Starting at @bs and descending through bs->file, find the first node
 * whose driver implements bdrv_debug_remove_breakpoint and call it with
 * @tag.
 *
 * The walk stops at a NULL node or a node without a driver.  Returns the
 * callback's result, or -ENOTSUP if no node implements it.
 */
int bdrv_debug_remove_breakpoint(BlockDriverState *bs, const char *tag)
{
    for (; bs && bs->drv; bs = bs->file ? bs->file->bs : NULL) {
        if (bs->drv->bdrv_debug_remove_breakpoint) {
            return bs->drv->bdrv_debug_remove_breakpoint(bs, tag);
        }
    }

    return -ENOTSUP;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Starting at @bs and descending through bs->file, find the first node
 * whose driver implements bdrv_debug_resume and call it with @tag.
 *
 * A node without a driver is skipped rather than ending the walk; the walk
 * ends only at a NULL node.  Returns the callback's result, or -ENOTSUP if
 * no node implements it.
 */
int bdrv_debug_resume(BlockDriverState *bs, const char *tag)
{
    for (; bs; bs = bs->file ? bs->file->bs : NULL) {
        if (bs->drv && bs->drv->bdrv_debug_resume) {
            return bs->drv->bdrv_debug_resume(bs, tag);
        }
    }

    return -ENOTSUP;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/*
 * Starting at @bs and descending through bs->file, find the first node
 * whose driver implements bdrv_debug_is_suspended and return its answer
 * for @tag.
 *
 * The walk stops at a NULL node or a node without a driver.  Returns false
 * if no node implements the callback.
 */
bool bdrv_debug_is_suspended(BlockDriverState *bs, const char *tag)
{
    for (; bs && bs->drv; bs = bs->file ? bs->file->bs : NULL) {
        if (bs->drv->bdrv_debug_is_suspended) {
            return bs->drv->bdrv_debug_is_suspended(bs, tag);
        }
    }

    return false;
}
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* Return 1 if BDRV_O_SNAPSHOT is set in the open flags of @bs, else 0. */
int bdrv_is_snapshot(BlockDriverState *bs)
{
    return (bs->open_flags & BDRV_O_SNAPSHOT) != 0;
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* backing_file can either be relative, or absolute, or a protocol. If it is
|
|
|
|
* relative, it must be relative to the chain. So, passing in bs->filename
|
|
|
|
* from a BDS as backing_file should not be done, as that may be relative to
|
|
|
|
* the CWD rather than the chain. */
|
|
|
|
BlockDriverState *bdrv_find_backing_image(BlockDriverState *bs,
|
|
|
|
const char *backing_file)
|
2011-07-15 19:50:26 +08:00
|
|
|
{
|
2015-04-28 21:27:52 +08:00
|
|
|
char *filename_full = NULL;
|
|
|
|
char *backing_file_full = NULL;
|
|
|
|
char *filename_tmp = NULL;
|
|
|
|
int is_protocol = 0;
|
|
|
|
BlockDriverState *curr_bs = NULL;
|
|
|
|
BlockDriverState *retval = NULL;
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (!bs || !bs->drv || !backing_file) {
|
|
|
|
return NULL;
|
2011-07-15 19:50:26 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
filename_full = g_malloc(PATH_MAX);
|
|
|
|
backing_file_full = g_malloc(PATH_MAX);
|
|
|
|
filename_tmp = g_malloc(PATH_MAX);
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
is_protocol = path_has_protocol(backing_file);
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
for (curr_bs = bs; curr_bs->backing; curr_bs = curr_bs->backing->bs) {
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* If either of the filename paths is actually a protocol, then
|
|
|
|
* compare unmodified paths; otherwise make paths relative */
|
|
|
|
if (is_protocol || path_has_protocol(curr_bs->backing_file)) {
|
|
|
|
if (strcmp(backing_file, curr_bs->backing_file) == 0) {
|
2015-06-17 20:55:21 +08:00
|
|
|
retval = curr_bs->backing->bs;
|
2015-04-28 21:27:52 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* If not an absolute filename path, make it relative to the current
|
|
|
|
* image's filename path */
|
|
|
|
path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
|
|
|
|
backing_file);
|
2011-07-15 19:50:26 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* We are going to compare absolute pathnames */
|
|
|
|
if (!realpath(filename_tmp, filename_full)) {
|
|
|
|
continue;
|
|
|
|
}
|
2011-10-17 18:32:12 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
/* We need to make sure the backing filename we are comparing against
|
|
|
|
* is relative to the current image filename (or absolute) */
|
|
|
|
path_combine(filename_tmp, PATH_MAX, curr_bs->filename,
|
|
|
|
curr_bs->backing_file);
|
2011-10-17 18:32:12 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (!realpath(filename_tmp, backing_file_full)) {
|
|
|
|
continue;
|
|
|
|
}
|
2011-11-11 01:10:11 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
if (strcmp(backing_file_full, filename_full) == 0) {
|
2015-06-17 20:55:21 +08:00
|
|
|
retval = curr_bs->backing->bs;
|
2015-04-28 21:27:52 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2011-11-11 01:10:11 +08:00
|
|
|
}
|
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
g_free(filename_full);
|
|
|
|
g_free(backing_file_full);
|
|
|
|
g_free(filename_tmp);
|
|
|
|
return retval;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Return the number of backing links below @bs.  Counting stops at the
 * first node that has no driver or no backing child.
 */
int bdrv_get_backing_file_depth(BlockDriverState *bs)
{
    int depth = 0;

    while (bs->drv && bs->backing) {
        depth++;
        bs = bs->backing->bs;
    }

    return depth;
}
|
2011-10-17 18:32:12 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
void bdrv_init(void)
|
|
|
|
{
|
|
|
|
module_call_init(MODULE_INIT_BLOCK);
|
|
|
|
}
|
2012-03-13 01:26:01 +08:00
|
|
|
|
2015-04-28 21:27:52 +08:00
|
|
|
void bdrv_init_with_whitelist(void)
|
|
|
|
{
|
|
|
|
use_bdrv_whitelist = 1;
|
|
|
|
bdrv_init();
|
2011-10-17 18:32:12 +08:00
|
|
|
}
|
|
|
|
|
2014-03-12 22:59:16 +08:00
|
|
|
/*
 * Re-activate @bs if it is currently marked BDRV_O_INACTIVE.
 *
 * Does nothing if @bs has no driver or is not inactive.  Otherwise the flag
 * is cleared and the driver's bdrv_invalidate_cache callback is invoked;
 * if the driver has none, the call recurses into bs->file when present.
 * Finally the total sector count is refreshed.
 *
 * If either step fails, BDRV_O_INACTIVE is set again and the error is
 * reported through @errp.
 */
void bdrv_invalidate_cache(BlockDriverState *bs, Error **errp)
{
    Error *local_err = NULL;
    int ret;

    if (!bs->drv || !(bs->open_flags & BDRV_O_INACTIVE)) {
        return;
    }
    bs->open_flags &= ~BDRV_O_INACTIVE;

    if (bs->drv->bdrv_invalidate_cache) {
        bs->drv->bdrv_invalidate_cache(bs, &local_err);
    } else if (bs->file) {
        bdrv_invalidate_cache(bs->file->bs, &local_err);
    }
    if (local_err) {
        /* activation failed: restore the inactive state */
        bs->open_flags |= BDRV_O_INACTIVE;
        error_propagate(errp, local_err);
        return;
    }

    ret = refresh_total_sectors(bs, bs->total_sectors);
    if (ret < 0) {
        bs->open_flags |= BDRV_O_INACTIVE;
        error_setg_errno(errp, -ret, "Could not refresh total sector count");
    }
}
|
|
|
|
|
2014-03-12 22:59:16 +08:00
|
|
|
/*
 * Call bdrv_invalidate_cache() on every entry of bdrv_states, holding the
 * entry's AioContext around each call.
 *
 * Stops at the first failure and propagates that error through @errp.
 */
void bdrv_invalidate_cache_all(Error **errp)
{
    BlockDriverState *bs;
    Error *local_err = NULL;

    QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
        AioContext *ctx = bdrv_get_aio_context(bs);

        aio_context_acquire(ctx);
        bdrv_invalidate_cache(bs, &local_err);
        aio_context_release(ctx);

        if (local_err) {
            error_propagate(errp, local_err);
            return;
        }
    }
}
|
|
|
|
|
2015-12-22 21:07:08 +08:00
|
|
|
/*
 * Mark @bs inactive.
 *
 * If the driver has a bdrv_inactivate callback it is called first; a
 * negative result is returned as-is and BDRV_O_INACTIVE is left unset.
 * On success BDRV_O_INACTIVE is set and 0 is returned.
 *
 * NOTE(review): bs->drv is dereferenced without a NULL check here, unlike
 * bdrv_invalidate_cache() -- confirm callers never pass a driverless node.
 */
static int bdrv_inactivate(BlockDriverState *bs)
{
    if (bs->drv->bdrv_inactivate) {
        int ret = bs->drv->bdrv_inactivate(bs);

        if (ret < 0) {
            return ret;
        }
    }

    bs->open_flags |= BDRV_O_INACTIVE;
    return 0;
}
|
|
|
|
|
|
|
|
int bdrv_inactivate_all(void)
|
|
|
|
{
|
|
|
|
BlockDriverState *bs;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
|
|
|
|
AioContext *aio_context = bdrv_get_aio_context(bs);
|
|
|
|
|
|
|
|
aio_context_acquire(aio_context);
|
|
|
|
ret = bdrv_inactivate(bs);
|
|
|
|
aio_context_release(aio_context);
|
|
|
|
if (ret < 0) {
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2006-08-19 19:45:59 +08:00
|
|
|
/**************************************************************/
|
|
|
|
/* removable device support */
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Return TRUE if the media is present
|
|
|
|
*/
|
2015-10-19 23:53:11 +08:00
|
|
|
bool bdrv_is_inserted(BlockDriverState *bs)
|
2006-08-19 19:45:59 +08:00
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
2015-10-19 23:53:13 +08:00
|
|
|
BdrvChild *child;
|
2011-09-07 00:58:41 +08:00
|
|
|
|
2015-10-19 23:53:11 +08:00
|
|
|
if (!drv) {
|
|
|
|
return false;
|
|
|
|
}
|
2015-10-19 23:53:13 +08:00
|
|
|
if (drv->bdrv_is_inserted) {
|
|
|
|
return drv->bdrv_is_inserted(bs);
|
|
|
|
}
|
|
|
|
QLIST_FOREACH(child, &bs->children, next) {
|
|
|
|
if (!bdrv_is_inserted(child->bs)) {
|
|
|
|
return false;
|
|
|
|
}
|
2015-10-19 23:53:11 +08:00
|
|
|
}
|
2015-10-19 23:53:13 +08:00
|
|
|
return true;
|
2006-08-19 19:45:59 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2011-08-03 21:08:08 +08:00
|
|
|
* Return whether the media changed since the last call to this
|
|
|
|
* function, or -ENOTSUP if we don't know. Most drivers don't know.
|
2006-08-19 19:45:59 +08:00
|
|
|
*/
|
|
|
|
int bdrv_media_changed(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
|
2011-08-03 21:08:08 +08:00
|
|
|
if (drv && drv->bdrv_media_changed) {
|
|
|
|
return drv->bdrv_media_changed(bs);
|
|
|
|
}
|
|
|
|
return -ENOTSUP;
|
2006-08-19 19:45:59 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* If eject_flag is TRUE, eject the media. Otherwise, close the tray
|
|
|
|
*/
|
2012-02-04 02:24:53 +08:00
|
|
|
void bdrv_eject(BlockDriverState *bs, bool eject_flag)
|
2006-08-19 19:45:59 +08:00
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
2014-10-07 19:59:11 +08:00
|
|
|
const char *device_name;
|
2006-08-19 19:45:59 +08:00
|
|
|
|
2011-07-21 00:23:42 +08:00
|
|
|
if (drv && drv->bdrv_eject) {
|
|
|
|
drv->bdrv_eject(bs, eject_flag);
|
2006-08-19 19:45:59 +08:00
|
|
|
}
|
2012-02-14 23:41:13 +08:00
|
|
|
|
2014-10-07 19:59:11 +08:00
|
|
|
device_name = bdrv_get_device_name(bs);
|
|
|
|
if (device_name[0] != '\0') {
|
|
|
|
qapi_event_send_device_tray_moved(device_name,
|
2014-06-18 14:43:44 +08:00
|
|
|
eject_flag, &error_abort);
|
2012-02-14 23:41:13 +08:00
|
|
|
}
|
2006-08-19 19:45:59 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Lock or unlock the media (if it is locked, the user won't be able
|
|
|
|
* to eject it manually).
|
|
|
|
*/
|
2011-09-07 00:58:47 +08:00
|
|
|
void bdrv_lock_medium(BlockDriverState *bs, bool locked)
|
2006-08-19 19:45:59 +08:00
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
|
2011-09-07 00:58:47 +08:00
|
|
|
trace_bdrv_lock_medium(bs, locked);
|
2011-03-30 03:04:40 +08:00
|
|
|
|
2011-09-07 00:58:47 +08:00
|
|
|
if (drv && drv->bdrv_lock_medium) {
|
|
|
|
drv->bdrv_lock_medium(bs, locked);
|
2006-08-19 19:45:59 +08:00
|
|
|
}
|
|
|
|
}
|
2007-12-25 00:10:43 +08:00
|
|
|
|
2015-04-18 07:49:50 +08:00
|
|
|
/*
 * Return the dirty bitmap of @bs whose name equals @name, or NULL if there
 * is none.  Bitmaps without a name are never matched.  @name must not be
 * NULL.
 */
BdrvDirtyBitmap *bdrv_find_dirty_bitmap(BlockDriverState *bs, const char *name)
{
    BdrvDirtyBitmap *candidate;

    assert(name);

    QLIST_FOREACH(candidate, &bs->dirty_bitmaps, list) {
        if (!candidate->name) {
            continue;
        }
        if (strcmp(name, candidate->name) == 0) {
            return candidate;
        }
    }

    return NULL;
}
|
|
|
|
|
2015-04-18 07:50:02 +08:00
|
|
|
/*
 * Make @bitmap anonymous by freeing its name and setting it to NULL.
 * The bitmap must not be frozen.
 */
void bdrv_dirty_bitmap_make_anon(BdrvDirtyBitmap *bitmap)
{
    char *old_name;

    assert(!bdrv_dirty_bitmap_frozen(bitmap));

    old_name = bitmap->name;
    bitmap->name = NULL;
    g_free(old_name);
}
|
|
|
|
|
|
|
|
BdrvDirtyBitmap *bdrv_create_dirty_bitmap(BlockDriverState *bs,
|
2015-04-18 07:49:51 +08:00
|
|
|
uint32_t granularity,
|
2015-04-18 07:49:50 +08:00
|
|
|
const char *name,
|
2014-04-16 09:34:30 +08:00
|
|
|
Error **errp)
|
2009-11-02 21:40:41 +08:00
|
|
|
{
|
|
|
|
int64_t bitmap_size;
|
2013-11-13 18:29:43 +08:00
|
|
|
BdrvDirtyBitmap *bitmap;
|
2015-04-18 07:49:51 +08:00
|
|
|
uint32_t sector_granularity;
|
2009-12-01 01:21:19 +08:00
|
|
|
|
2013-01-22 00:09:45 +08:00
|
|
|
assert((granularity & (granularity - 1)) == 0);
|
|
|
|
|
2015-04-18 07:49:50 +08:00
|
|
|
if (name && bdrv_find_dirty_bitmap(bs, name)) {
|
|
|
|
error_setg(errp, "Bitmap already exists: %s", name);
|
|
|
|
return NULL;
|
|
|
|
}
|
2015-04-18 07:49:51 +08:00
|
|
|
sector_granularity = granularity >> BDRV_SECTOR_BITS;
|
|
|
|
assert(sector_granularity);
|
2014-06-26 19:23:22 +08:00
|
|
|
bitmap_size = bdrv_nb_sectors(bs);
|
2014-04-16 09:34:30 +08:00
|
|
|
if (bitmap_size < 0) {
|
|
|
|
error_setg_errno(errp, -bitmap_size, "could not get length of device");
|
|
|
|
errno = -bitmap_size;
|
|
|
|
return NULL;
|
|
|
|
}
|
block: Use g_new() & friends where that makes obvious sense
g_new(T, n) is neater than g_malloc(sizeof(T) * n). It's also safer,
for two reasons. One, it catches multiplication overflowing size_t.
Two, it returns T * rather than void *, which lets the compiler catch
more type errors.
Patch created with Coccinelle, with two manual changes on top:
* Add const to bdrv_iterate_format() to keep the types straight
* Convert the allocation in bdrv_drop_intermediate(), which Coccinelle
inexplicably misses
Coccinelle semantic patch:
@@
type T;
@@
-g_malloc(sizeof(T))
+g_new(T, 1)
@@
type T;
@@
-g_try_malloc(sizeof(T))
+g_try_new(T, 1)
@@
type T;
@@
-g_malloc0(sizeof(T))
+g_new0(T, 1)
@@
type T;
@@
-g_try_malloc0(sizeof(T))
+g_try_new0(T, 1)
@@
type T;
expression n;
@@
-g_malloc(sizeof(T) * (n))
+g_new(T, n)
@@
type T;
expression n;
@@
-g_try_malloc(sizeof(T) * (n))
+g_try_new(T, n)
@@
type T;
expression n;
@@
-g_malloc0(sizeof(T) * (n))
+g_new0(T, n)
@@
type T;
expression n;
@@
-g_try_malloc0(sizeof(T) * (n))
+g_try_new0(T, n)
@@
type T;
expression p, n;
@@
-g_realloc(p, sizeof(T) * (n))
+g_renew(T, p, n)
@@
type T;
expression p, n;
@@
-g_try_realloc(p, sizeof(T) * (n))
+g_try_renew(T, p, n)
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Jeff Cody <jcody@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2014-08-19 16:31:08 +08:00
|
|
|
bitmap = g_new0(BdrvDirtyBitmap, 1);
|
2015-04-18 07:49:51 +08:00
|
|
|
bitmap->bitmap = hbitmap_alloc(bitmap_size, ctz32(sector_granularity));
|
2015-04-18 07:49:59 +08:00
|
|
|
bitmap->size = bitmap_size;
|
2015-04-18 07:49:50 +08:00
|
|
|
bitmap->name = g_strdup(name);
|
2015-04-18 07:49:56 +08:00
|
|
|
bitmap->disabled = false;
|
2013-11-13 18:29:43 +08:00
|
|
|
QLIST_INSERT_HEAD(&bs->dirty_bitmaps, bitmap, list);
|
|
|
|
return bitmap;
|
|
|
|
}
|
|
|
|
|
block: Add bitmap successors
A bitmap successor is an anonymous BdrvDirtyBitmap that is intended to
be created just prior to a sensitive operation (e.g. Incremental Backup)
that can either succeed or fail, but during the course of which we still
want a bitmap tracking writes.
On creating a successor, we "freeze" the parent bitmap which prevents
its deletion, enabling, anonymization, or creating a bitmap with the
same name.
On success, the parent bitmap can "abdicate" responsibility to the
successor, which will inherit its name. The successor will have been
tracking writes during the course of the backup operation. The parent
will be safely deleted.
On failure, we can "reclaim" the successor from the parent, unifying
them such that the resulting bitmap describes all writes occurring since
the last successful backup, for instance. Reclamation will thaw the
parent, but not explicitly re-enable it.
BdrvDirtyBitmap operations that target a single bitmap are protected
by assertions that the bitmap is not frozen and/or disabled.
BdrvDirtyBitmap operations that target a group of bitmaps, such as
bdrv_{set,reset}_dirty will ignore frozen/disabled drives with a
conditional instead.
Internal functions that enable/disable dirty bitmaps have assertions
added to them to prevent modifying frozen bitmaps.
Signed-off-by: John Snow <jsnow@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Message-id: 1429314609-29776-10-git-send-email-jsnow@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-04-18 07:49:57 +08:00
|
|
|
/**
 * Tell whether @bitmap is frozen.
 *
 * A bitmap counts as frozen exactly while it has a successor installed.
 */
bool bdrv_dirty_bitmap_frozen(BdrvDirtyBitmap *bitmap)
{
    return bitmap->successor != NULL;
}
|
|
|
|
|
2015-04-18 07:49:56 +08:00
|
|
|
/**
 * Tell whether @bitmap is enabled.
 *
 * A bitmap is enabled only when it is neither explicitly disabled nor
 * frozen (i.e. it has no successor).
 */
bool bdrv_dirty_bitmap_enabled(BdrvDirtyBitmap *bitmap)
{
    return !bitmap->disabled && !bitmap->successor;
}
|
|
|
|
|
2015-05-13 03:53:01 +08:00
|
|
|
/**
 * Map the state of @bitmap onto a DirtyBitmapStatus value.
 *
 * Frozen takes precedence over disabled; a bitmap that is neither is
 * reported as active.
 */
DirtyBitmapStatus bdrv_dirty_bitmap_status(BdrvDirtyBitmap *bitmap)
{
    if (bdrv_dirty_bitmap_frozen(bitmap)) {
        return DIRTY_BITMAP_STATUS_FROZEN;
    }
    if (!bdrv_dirty_bitmap_enabled(bitmap)) {
        return DIRTY_BITMAP_STATUS_DISABLED;
    }
    return DIRTY_BITMAP_STATUS_ACTIVE;
}
|
|
|
|
|
block: Add bitmap successors
A bitmap successor is an anonymous BdrvDirtyBitmap that is intended to
be created just prior to a sensitive operation (e.g. Incremental Backup)
that can either succeed or fail, but during the course of which we still
want a bitmap tracking writes.
On creating a successor, we "freeze" the parent bitmap which prevents
its deletion, enabling, anonymization, or creating a bitmap with the
same name.
On success, the parent bitmap can "abdicate" responsibility to the
successor, which will inherit its name. The successor will have been
tracking writes during the course of the backup operation. The parent
will be safely deleted.
On failure, we can "reclaim" the successor from the parent, unifying
them such that the resulting bitmap describes all writes occurring since
the last successful backup, for instance. Reclamation will thaw the
parent, but not explicitly re-enable it.
BdrvDirtyBitmap operations that target a single bitmap are protected
by assertions that the bitmap is not frozen and/or disabled.
BdrvDirtyBitmap operations that target a group of bitmaps, such as
bdrv_{set,reset}_dirty will ignore frozen/disabled drives with a
conditional instead.
Internal functions that enable/disable dirty bitmaps have assertions
added to them to prevent modifying frozen bitmaps.
Signed-off-by: John Snow <jsnow@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Message-id: 1429314609-29776-10-git-send-email-jsnow@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-04-18 07:49:57 +08:00
|
|
|
/**
|
|
|
|
* Create a successor bitmap destined to replace this bitmap after an operation.
|
|
|
|
* Requires that the bitmap is not frozen and has no successor.
|
|
|
|
*/
|
|
|
|
int bdrv_dirty_bitmap_create_successor(BlockDriverState *bs,
|
|
|
|
BdrvDirtyBitmap *bitmap, Error **errp)
|
|
|
|
{
|
|
|
|
uint64_t granularity;
|
|
|
|
BdrvDirtyBitmap *child;
|
|
|
|
|
|
|
|
if (bdrv_dirty_bitmap_frozen(bitmap)) {
|
|
|
|
error_setg(errp, "Cannot create a successor for a bitmap that is "
|
|
|
|
"currently frozen");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
assert(!bitmap->successor);
|
|
|
|
|
|
|
|
/* Create an anonymous successor */
|
|
|
|
granularity = bdrv_dirty_bitmap_granularity(bitmap);
|
|
|
|
child = bdrv_create_dirty_bitmap(bs, granularity, NULL, errp);
|
|
|
|
if (!child) {
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Successor will be on or off based on our current state. */
|
|
|
|
child->disabled = bitmap->disabled;
|
|
|
|
|
|
|
|
/* Install the successor and freeze the parent */
|
|
|
|
bitmap->successor = child;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* For a bitmap with a successor, yield our name to the successor,
|
|
|
|
* delete the old bitmap, and return a handle to the new bitmap.
|
|
|
|
*/
|
|
|
|
BdrvDirtyBitmap *bdrv_dirty_bitmap_abdicate(BlockDriverState *bs,
|
|
|
|
BdrvDirtyBitmap *bitmap,
|
|
|
|
Error **errp)
|
|
|
|
{
|
|
|
|
char *name;
|
|
|
|
BdrvDirtyBitmap *successor = bitmap->successor;
|
|
|
|
|
|
|
|
if (successor == NULL) {
|
|
|
|
error_setg(errp, "Cannot relinquish control if "
|
|
|
|
"there's no successor present");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
name = bitmap->name;
|
|
|
|
bitmap->name = NULL;
|
|
|
|
successor->name = name;
|
|
|
|
bitmap->successor = NULL;
|
|
|
|
bdrv_release_dirty_bitmap(bs, bitmap);
|
|
|
|
|
|
|
|
return successor;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* In cases of failure where we can no longer safely delete the parent,
|
|
|
|
* we may wish to re-join the parent and child/successor.
|
|
|
|
* The merged parent will be un-frozen, but not explicitly re-enabled.
|
|
|
|
*/
|
|
|
|
BdrvDirtyBitmap *bdrv_reclaim_dirty_bitmap(BlockDriverState *bs,
|
|
|
|
BdrvDirtyBitmap *parent,
|
|
|
|
Error **errp)
|
|
|
|
{
|
|
|
|
BdrvDirtyBitmap *successor = parent->successor;
|
|
|
|
|
|
|
|
if (!successor) {
|
|
|
|
error_setg(errp, "Cannot reclaim a successor when none is present");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!hbitmap_merge(parent->bitmap, successor->bitmap)) {
|
|
|
|
error_setg(errp, "Merging of parent and successor bitmap failed");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
bdrv_release_dirty_bitmap(bs, successor);
|
|
|
|
parent->successor = NULL;
|
|
|
|
|
|
|
|
return parent;
|
2015-04-18 07:49:56 +08:00
|
|
|
}
|
|
|
|
|
2015-04-18 07:50:03 +08:00
|
|
|
/**
|
|
|
|
* Truncates _all_ bitmaps attached to a BDS.
|
|
|
|
*/
|
|
|
|
static void bdrv_dirty_bitmap_truncate(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
BdrvDirtyBitmap *bitmap;
|
|
|
|
uint64_t size = bdrv_nb_sectors(bs);
|
|
|
|
|
|
|
|
QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
|
2015-06-11 01:24:54 +08:00
|
|
|
assert(!bdrv_dirty_bitmap_frozen(bitmap));
|
2015-04-18 07:50:03 +08:00
|
|
|
hbitmap_truncate(bitmap->bitmap, size);
|
2015-06-09 04:49:15 +08:00
|
|
|
bitmap->size = size;
|
2015-04-18 07:50:03 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-01-29 23:36:01 +08:00
|
|
|
static void bdrv_do_release_matching_dirty_bitmap(BlockDriverState *bs,
|
|
|
|
BdrvDirtyBitmap *bitmap,
|
|
|
|
bool only_named)
|
2013-11-13 18:29:43 +08:00
|
|
|
{
|
|
|
|
BdrvDirtyBitmap *bm, *next;
|
|
|
|
QLIST_FOREACH_SAFE(bm, &bs->dirty_bitmaps, list, next) {
|
2016-01-29 23:36:01 +08:00
|
|
|
if ((!bitmap || bm == bitmap) && (!only_named || bm->name)) {
|
block: Add bitmap successors
A bitmap successor is an anonymous BdrvDirtyBitmap that is intended to
be created just prior to a sensitive operation (e.g. Incremental Backup)
that can either succeed or fail, but during the course of which we still
want a bitmap tracking writes.
On creating a successor, we "freeze" the parent bitmap which prevents
its deletion, enabling, anonymization, or creating a bitmap with the
same name.
On success, the parent bitmap can "abdicate" responsibility to the
successor, which will inherit its name. The successor will have been
tracking writes during the course of the backup operation. The parent
will be safely deleted.
On failure, we can "reclaim" the successor from the parent, unifying
them such that the resulting bitmap describes all writes occurring since
the last successful backup, for instance. Reclamation will thaw the
parent, but not explicitly re-enable it.
BdrvDirtyBitmap operations that target a single bitmap are protected
by assertions that the bitmap is not frozen and/or disabled.
BdrvDirtyBitmap operations that target a group of bitmaps, such as
bdrv_{set,reset}_dirty will ignore frozen/disabled drives with a
conditional instead.
Internal functions that enable/disable dirty bitmaps have assertions
added to them to prevent modifying frozen bitmaps.
Signed-off-by: John Snow <jsnow@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Reviewed-by: Stefan Hajnoczi <stefanha@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Message-id: 1429314609-29776-10-git-send-email-jsnow@redhat.com
Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
2015-04-18 07:49:57 +08:00
|
|
|
assert(!bdrv_dirty_bitmap_frozen(bm));
|
2016-01-29 23:36:01 +08:00
|
|
|
QLIST_REMOVE(bm, list);
|
|
|
|
hbitmap_free(bm->bitmap);
|
|
|
|
g_free(bm->name);
|
|
|
|
g_free(bm);
|
|
|
|
|
|
|
|
if (bitmap) {
|
|
|
|
return;
|
|
|
|
}
|
2009-12-01 01:21:19 +08:00
|
|
|
}
|
2009-11-02 21:40:41 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-01-29 23:36:01 +08:00
|
|
|
/**
 * Release @bitmap from @bs, regardless of whether it has a name.
 */
void bdrv_release_dirty_bitmap(BlockDriverState *bs, BdrvDirtyBitmap *bitmap)
{
    const bool only_named = false;

    bdrv_do_release_matching_dirty_bitmap(bs, bitmap, only_named);
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Release all named dirty bitmaps attached to a BDS (for use in bdrv_close()).
|
|
|
|
* There must not be any frozen bitmaps attached.
|
|
|
|
*/
|
|
|
|
static void bdrv_release_named_dirty_bitmaps(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
bdrv_do_release_matching_dirty_bitmap(bs, NULL, true);
|
|
|
|
}
|
|
|
|
|
2015-04-18 07:49:56 +08:00
|
|
|
/**
 * Mark @bitmap as disabled. The bitmap must not be frozen.
 */
void bdrv_disable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
{
    bool frozen = bdrv_dirty_bitmap_frozen(bitmap);

    assert(!frozen);
    bitmap->disabled = true;
}
|
|
|
|
|
|
|
|
/**
 * Clear the disabled flag of @bitmap. The bitmap must not be frozen.
 */
void bdrv_enable_dirty_bitmap(BdrvDirtyBitmap *bitmap)
{
    bool frozen = bdrv_dirty_bitmap_frozen(bitmap);

    assert(!frozen);
    bitmap->disabled = false;
}
|
|
|
|
|
2013-11-13 18:29:44 +08:00
|
|
|
/**
 * Build a BlockDirtyInfoList describing every dirty bitmap attached to @bs.
 *
 * Entries appear in the same order as the bitmaps are visited in
 * bs->dirty_bitmaps. Each entry carries the dirty count, granularity, name
 * (a fresh copy, if any) and status of one bitmap.
 *
 * Returns the head of the newly allocated list, or NULL if @bs has no
 * dirty bitmaps.
 */
BlockDirtyInfoList *bdrv_query_dirty_bitmaps(BlockDriverState *bs)
{
    BlockDirtyInfoList *head = NULL;
    BlockDirtyInfoList **tail = &head;
    BdrvDirtyBitmap *bitmap;

    QLIST_FOREACH(bitmap, &bs->dirty_bitmaps, list) {
        BlockDirtyInfo *desc = g_new0(BlockDirtyInfo, 1);
        BlockDirtyInfoList *node = g_new0(BlockDirtyInfoList, 1);

        desc->count = bdrv_get_dirty_count(bitmap);
        desc->granularity = bdrv_dirty_bitmap_granularity(bitmap);
        desc->has_name = !!bitmap->name;
        desc->name = g_strdup(bitmap->name);
        desc->status = bdrv_dirty_bitmap_status(bitmap);

        /* Append at the tail so the output keeps the iteration order. */
        node->value = desc;
        *tail = node;
        tail = &node->next;
    }

    return head;
}
|
|
|
|
|
2013-11-13 18:29:43 +08:00
|
|
|
/**
 * Query @bitmap for @sector via hbitmap_get().
 *
 * Returns 0 when @bitmap is NULL. @bs is not used by this function.
 */
int bdrv_get_dirty(BlockDriverState *bs, BdrvDirtyBitmap *bitmap, int64_t sector)
{
    if (!bitmap) {
        return 0;
    }
    return hbitmap_get(bitmap->bitmap, sector);
}
|
|
|
|
|
2015-04-18 07:49:52 +08:00
|
|
|
/**
|
|
|
|
* Chooses a default granularity based on the existing cluster size,
|
|
|
|
* but clamped between [4K, 64K]. Defaults to 64K in the case that there
|
|
|
|
* is no cluster size information available.
|
|
|
|
*/
|
|
|
|
uint32_t bdrv_get_default_bitmap_granularity(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
BlockDriverInfo bdi;
|
|
|
|
uint32_t granularity;
|
|
|
|
|
|
|
|
if (bdrv_get_info(bs, &bdi) >= 0 && bdi.cluster_size > 0) {
|
|
|
|
granularity = MAX(4096, bdi.cluster_size);
|
|
|
|
granularity = MIN(65536, granularity);
|
|
|
|
} else {
|
|
|
|
granularity = 65536;
|
|
|
|
}
|
|
|
|
|
|
|
|
return granularity;
|
|
|
|
}
|
|
|
|
|
2015-04-18 07:49:53 +08:00
|
|
|
/**
 * Return the granularity of @bitmap: BDRV_SECTOR_SIZE shifted left by the
 * granularity value of the underlying HBitmap.
 */
uint32_t bdrv_dirty_bitmap_granularity(BdrvDirtyBitmap *bitmap)
{
    uint32_t bytes = BDRV_SECTOR_SIZE << hbitmap_granularity(bitmap->bitmap);

    return bytes;
}
|
|
|
|
|
2015-04-18 07:50:02 +08:00
|
|
|
/**
 * Initialise @hbi to iterate over the HBitmap of @bitmap, starting at
 * position 0.
 */
void bdrv_dirty_iter_init(BdrvDirtyBitmap *bitmap, HBitmapIter *hbi)
{
    HBitmap *hb = bitmap->bitmap;

    hbitmap_iter_init(hbi, hb, 0);
}
|
|
|
|
|
2015-04-18 07:50:02 +08:00
|
|
|
/**
 * Set @nr_sectors sectors starting at @cur_sector in @bitmap.
 *
 * @bitmap must be enabled (neither disabled nor frozen).
 */
void bdrv_set_dirty_bitmap(BdrvDirtyBitmap *bitmap,
                           int64_t cur_sector, int nr_sectors)
{
    bool enabled = bdrv_dirty_bitmap_enabled(bitmap);

    assert(enabled);
    hbitmap_set(bitmap->bitmap, cur_sector, nr_sectors);
}
|
|
|
|
|
2015-04-18 07:50:02 +08:00
|
|
|
/**
 * Reset @nr_sectors sectors starting at @cur_sector in @bitmap.
 *
 * @bitmap must be enabled (neither disabled nor frozen).
 */
void bdrv_reset_dirty_bitmap(BdrvDirtyBitmap *bitmap,
                             int64_t cur_sector, int nr_sectors)
{
    bool enabled = bdrv_dirty_bitmap_enabled(bitmap);

    assert(enabled);
    hbitmap_reset(bitmap->bitmap, cur_sector, nr_sectors);
}
|
|
|
|
|
2015-11-09 18:16:54 +08:00
|
|
|
/**
 * Clear @bitmap, optionally keeping the old contents for a later undo.
 *
 * @out: if NULL, the existing HBitmap is reset in place. Otherwise a new
 *       HBitmap with the same size and granularity is installed and the
 *       previous one is handed to the caller through *@out.
 *
 * @bitmap must be enabled.
 */
void bdrv_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap, HBitmap **out)
{
    assert(bdrv_dirty_bitmap_enabled(bitmap));

    if (out) {
        HBitmap *previous = bitmap->bitmap;

        bitmap->bitmap = hbitmap_alloc(bitmap->size,
                                       hbitmap_granularity(previous));
        *out = previous;
        return;
    }

    hbitmap_reset_all(bitmap->bitmap);
}
|
|
|
|
|
|
|
|
/**
 * Install @in as the HBitmap of @bitmap and free the HBitmap that was in
 * place before the call.
 *
 * @bitmap must be enabled.
 */
void bdrv_undo_clear_dirty_bitmap(BdrvDirtyBitmap *bitmap, HBitmap *in)
{
    HBitmap *discarded;

    assert(bdrv_dirty_bitmap_enabled(bitmap));

    discarded = bitmap->bitmap;
    bitmap->bitmap = in;
    hbitmap_free(discarded);
}
|
|
|
|
|
2015-04-28 21:27:50 +08:00
|
|
|
/**
 * Set @nr_sectors sectors starting at @cur_sector in every enabled dirty
 * bitmap attached to @bs. Bitmaps that are not enabled are skipped.
 */
void bdrv_set_dirty(BlockDriverState *bs, int64_t cur_sector,
                    int nr_sectors)
{
    BdrvDirtyBitmap *bm;

    QLIST_FOREACH(bm, &bs->dirty_bitmaps, list) {
        if (bdrv_dirty_bitmap_enabled(bm)) {
            hbitmap_set(bm->bitmap, cur_sector, nr_sectors);
        }
    }
}
|
|
|
|
|
2015-04-18 07:49:58 +08:00
|
|
|
/**
|
|
|
|
* Advance an HBitmapIter to an arbitrary offset.
|
|
|
|
*/
|
|
|
|
void bdrv_set_dirty_iter(HBitmapIter *hbi, int64_t offset)
|
|
|
|
{
|
|
|
|
assert(hbi->hb);
|
|
|
|
hbitmap_iter_init(hbi, hbi->hb, offset);
|
|
|
|
}
|
|
|
|
|
2015-04-18 07:50:02 +08:00
|
|
|
/**
 * Return the value of hbitmap_count() for the HBitmap backing @bitmap.
 */
int64_t bdrv_get_dirty_count(BdrvDirtyBitmap *bitmap)
{
    int64_t count = hbitmap_count(bitmap->bitmap);

    return count;
}
|
2010-12-16 20:52:15 +08:00
|
|
|
|
2013-08-23 09:14:46 +08:00
|
|
|
/* Get a reference to bs */
|
|
|
|
void bdrv_ref(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
bs->refcnt++;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Release a previously grabbed reference to bs.
|
|
|
|
* If after releasing, reference count is zero, the BlockDriverState is
|
|
|
|
* deleted. */
|
|
|
|
void bdrv_unref(BlockDriverState *bs)
|
|
|
|
{
|
2014-07-24 05:22:57 +08:00
|
|
|
if (!bs) {
|
|
|
|
return;
|
|
|
|
}
|
2013-08-23 09:14:46 +08:00
|
|
|
assert(bs->refcnt > 0);
|
|
|
|
if (--bs->refcnt == 0) {
|
|
|
|
bdrv_delete(bs);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-05-23 21:29:42 +08:00
|
|
|
struct BdrvOpBlocker {
|
|
|
|
Error *reason;
|
|
|
|
QLIST_ENTRY(BdrvOpBlocker) list;
|
|
|
|
};
|
|
|
|
|
|
|
|
/**
 * Check whether operation @op is currently blocked on @bs.
 *
 * Returns true if at least one blocker is registered for @op. In that
 * case, a copy of the first blocker's reason, prefixed with
 * "Node '<name>' is busy: ", is reported through @errp.
 * Returns false (leaving @errp untouched) if nothing blocks @op.
 */
bool bdrv_op_is_blocked(BlockDriverState *bs, BlockOpType op, Error **errp)
{
    BdrvOpBlocker *blocker;

    assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);

    if (QLIST_EMPTY(&bs->op_blockers[op])) {
        return false;
    }

    blocker = QLIST_FIRST(&bs->op_blockers[op]);
    if (errp) {
        /*
         * Hand the copy over through error_propagate() rather than storing
         * into *errp directly, so that the usual Error API rules apply
         * (an already-set error is not overwritten, and special
         * destinations such as &error_abort are honoured).
         */
        error_propagate(errp, error_copy(blocker->reason));
        error_prepend(errp, "Node '%s' is busy: ",
                      bdrv_get_device_or_node_name(bs));
    }
    return true;
}
|
|
|
|
|
|
|
|
/**
 * Register @reason as a blocker for operation @op on @bs.
 *
 * The new blocker is inserted at the head of the list for @op. Only the
 * @reason pointer is stored; the Error is not copied.
 */
void bdrv_op_block(BlockDriverState *bs, BlockOpType op, Error *reason)
{
    BdrvOpBlocker *entry;

    assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);

    entry = g_new0(BdrvOpBlocker, 1);
    entry->reason = reason;
    QLIST_INSERT_HEAD(&bs->op_blockers[op], entry, list);
}
|
|
|
|
|
|
|
|
/**
 * Remove every blocker for operation @op on @bs whose reason pointer is
 * @reason. Blockers registered with a different reason are kept.
 */
void bdrv_op_unblock(BlockDriverState *bs, BlockOpType op, Error *reason)
{
    BdrvOpBlocker *entry, *following;

    assert((int) op >= 0 && op < BLOCK_OP_TYPE_MAX);

    QLIST_FOREACH_SAFE(entry, &bs->op_blockers[op], list, following) {
        if (entry->reason != reason) {
            continue;
        }
        QLIST_REMOVE(entry, list);
        g_free(entry);
    }
}
|
|
|
|
|
|
|
|
/**
 * Register @reason as a blocker for every operation type on @bs.
 */
void bdrv_op_block_all(BlockDriverState *bs, Error *reason)
{
    int op;

    for (op = 0; op < BLOCK_OP_TYPE_MAX; op++) {
        bdrv_op_block(bs, op, reason);
    }
}
|
|
|
|
|
|
|
|
/**
 * Remove the blockers identified by @reason from every operation type
 * on @bs.
 */
void bdrv_op_unblock_all(BlockDriverState *bs, Error *reason)
{
    int op;

    for (op = 0; op < BLOCK_OP_TYPE_MAX; op++) {
        bdrv_op_unblock(bs, op, reason);
    }
}
|
|
|
|
|
|
|
|
/**
 * Return true if no operation type on @bs has any blocker registered,
 * false as soon as one non-empty blocker list is found.
 */
bool bdrv_op_blocker_is_empty(BlockDriverState *bs)
{
    int op = 0;

    while (op < BLOCK_OP_TYPE_MAX) {
        if (!QLIST_EMPTY(&bs->op_blockers[op])) {
            return false;
        }
        op++;
    }
    return true;
}
|
|
|
|
|
2012-11-30 20:52:09 +08:00
|
|
|
void bdrv_img_create(const char *filename, const char *fmt,
|
|
|
|
const char *base_filename, const char *base_fmt,
|
2013-02-13 16:09:40 +08:00
|
|
|
char *options, uint64_t img_size, int flags,
|
|
|
|
Error **errp, bool quiet)
|
2010-12-16 20:52:15 +08:00
|
|
|
{
|
2014-06-05 17:20:51 +08:00
|
|
|
QemuOptsList *create_opts = NULL;
|
|
|
|
QemuOpts *opts = NULL;
|
|
|
|
const char *backing_fmt, *backing_file;
|
|
|
|
int64_t size;
|
2010-12-16 20:52:15 +08:00
|
|
|
BlockDriver *drv, *proto_drv;
|
2013-09-06 23:14:26 +08:00
|
|
|
Error *local_err = NULL;
|
2010-12-16 20:52:15 +08:00
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
/* Find driver and parse its options */
|
|
|
|
drv = bdrv_find_format(fmt);
|
|
|
|
if (!drv) {
|
2012-11-30 20:52:04 +08:00
|
|
|
error_setg(errp, "Unknown file format '%s'", fmt);
|
2012-11-30 20:52:09 +08:00
|
|
|
return;
|
2010-12-16 20:52:15 +08:00
|
|
|
}
|
|
|
|
|
2015-02-06 02:58:12 +08:00
|
|
|
proto_drv = bdrv_find_protocol(filename, true, errp);
|
2010-12-16 20:52:15 +08:00
|
|
|
if (!proto_drv) {
|
2012-11-30 20:52:09 +08:00
|
|
|
return;
|
2010-12-16 20:52:15 +08:00
|
|
|
}
|
|
|
|
|
2014-12-03 01:32:45 +08:00
|
|
|
if (!drv->create_opts) {
|
|
|
|
error_setg(errp, "Format driver '%s' does not support image creation",
|
|
|
|
drv->format_name);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!proto_drv->create_opts) {
|
|
|
|
error_setg(errp, "Protocol driver '%s' does not support image creation",
|
|
|
|
proto_drv->format_name);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-06-05 17:21:11 +08:00
|
|
|
create_opts = qemu_opts_append(create_opts, drv->create_opts);
|
|
|
|
create_opts = qemu_opts_append(create_opts, proto_drv->create_opts);
|
2010-12-16 20:52:15 +08:00
|
|
|
|
|
|
|
/* Create parameter list with default values */
|
2014-06-05 17:20:51 +08:00
|
|
|
opts = qemu_opts_create(create_opts, NULL, 0, &error_abort);
|
2015-02-12 23:46:36 +08:00
|
|
|
qemu_opt_set_number(opts, BLOCK_OPT_SIZE, img_size, &error_abort);
|
2010-12-16 20:52:15 +08:00
|
|
|
|
|
|
|
/* Parse -o options */
|
|
|
|
if (options) {
|
2015-02-13 01:37:11 +08:00
|
|
|
qemu_opts_do_parse(opts, options, NULL, &local_err);
|
|
|
|
if (local_err) {
|
|
|
|
error_report_err(local_err);
|
|
|
|
local_err = NULL;
|
2014-06-05 17:20:51 +08:00
|
|
|
error_setg(errp, "Invalid options for file format '%s'", fmt);
|
2010-12-16 20:52:15 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (base_filename) {
|
2015-02-13 00:52:20 +08:00
|
|
|
qemu_opt_set(opts, BLOCK_OPT_BACKING_FILE, base_filename, &local_err);
|
2015-02-13 00:49:02 +08:00
|
|
|
if (local_err) {
|
2012-11-30 20:52:04 +08:00
|
|
|
error_setg(errp, "Backing file not supported for file format '%s'",
|
|
|
|
fmt);
|
2010-12-16 20:52:15 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (base_fmt) {
|
2015-02-13 00:52:20 +08:00
|
|
|
qemu_opt_set(opts, BLOCK_OPT_BACKING_FMT, base_fmt, &local_err);
|
2015-02-13 00:49:02 +08:00
|
|
|
if (local_err) {
|
2012-11-30 20:52:04 +08:00
|
|
|
error_setg(errp, "Backing file format not supported for file "
|
|
|
|
"format '%s'", fmt);
|
2010-12-16 20:52:15 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-06-05 17:20:51 +08:00
|
|
|
backing_file = qemu_opt_get(opts, BLOCK_OPT_BACKING_FILE);
|
|
|
|
if (backing_file) {
|
|
|
|
if (!strcmp(filename, backing_file)) {
|
2012-11-30 20:52:04 +08:00
|
|
|
error_setg(errp, "Error: Trying to create an image with the "
|
|
|
|
"same filename as the backing file");
|
2010-12-16 20:52:17 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-06-05 17:20:51 +08:00
|
|
|
backing_fmt = qemu_opt_get(opts, BLOCK_OPT_BACKING_FMT);
|
2010-12-16 20:52:15 +08:00
|
|
|
|
|
|
|
// The size for the image must always be specified, with one exception:
|
|
|
|
// If we are using a backing file, we can obtain the size from there
|
2014-06-05 17:20:51 +08:00
|
|
|
size = qemu_opt_get_size(opts, BLOCK_OPT_SIZE, 0);
|
|
|
|
if (size == -1) {
|
|
|
|
if (backing_file) {
|
2013-12-03 21:57:52 +08:00
|
|
|
BlockDriverState *bs;
|
2014-11-27 00:20:27 +08:00
|
|
|
char *full_backing = g_new0(char, PATH_MAX);
|
2014-06-26 19:23:25 +08:00
|
|
|
int64_t size;
|
2012-04-12 20:01:03 +08:00
|
|
|
int back_flags;
|
2015-08-27 01:47:48 +08:00
|
|
|
QDict *backing_options = NULL;
|
2012-04-12 20:01:03 +08:00
|
|
|
|
2014-11-27 00:20:27 +08:00
|
|
|
bdrv_get_full_backing_filename_from_filename(filename, backing_file,
|
|
|
|
full_backing, PATH_MAX,
|
|
|
|
&local_err);
|
|
|
|
if (local_err) {
|
|
|
|
g_free(full_backing);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2012-04-12 20:01:03 +08:00
|
|
|
/* backing files always opened read-only */
|
|
|
|
back_flags =
|
|
|
|
flags & ~(BDRV_O_RDWR | BDRV_O_SNAPSHOT | BDRV_O_NO_BACKING);
|
2010-12-16 20:52:15 +08:00
|
|
|
|
2015-08-27 01:47:48 +08:00
|
|
|
if (backing_fmt) {
|
|
|
|
backing_options = qdict_new();
|
|
|
|
qdict_put(backing_options, "driver",
|
|
|
|
qstring_from_str(backing_fmt));
|
|
|
|
}
|
|
|
|
|
2014-02-19 01:33:05 +08:00
|
|
|
bs = NULL;
|
2015-08-27 01:47:48 +08:00
|
|
|
ret = bdrv_open(&bs, full_backing, NULL, backing_options,
|
2015-08-27 01:47:49 +08:00
|
|
|
back_flags, &local_err);
|
2014-11-27 00:20:27 +08:00
|
|
|
g_free(full_backing);
|
2010-12-16 20:52:15 +08:00
|
|
|
if (ret < 0) {
|
|
|
|
goto out;
|
|
|
|
}
|
2014-06-26 19:23:25 +08:00
|
|
|
size = bdrv_getlength(bs);
|
|
|
|
if (size < 0) {
|
|
|
|
error_setg_errno(errp, -size, "Could not get size of '%s'",
|
|
|
|
backing_file);
|
|
|
|
bdrv_unref(bs);
|
|
|
|
goto out;
|
|
|
|
}
|
2010-12-16 20:52:15 +08:00
|
|
|
|
2015-02-12 23:46:36 +08:00
|
|
|
qemu_opt_set_number(opts, BLOCK_OPT_SIZE, size, &error_abort);
|
2013-12-03 21:57:52 +08:00
|
|
|
|
|
|
|
bdrv_unref(bs);
|
2010-12-16 20:52:15 +08:00
|
|
|
} else {
|
2012-11-30 20:52:04 +08:00
|
|
|
error_setg(errp, "Image creation needs a size parameter");
|
2010-12-16 20:52:15 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-02-13 16:09:40 +08:00
|
|
|
if (!quiet) {
|
2015-07-07 22:42:10 +08:00
|
|
|
printf("Formatting '%s', fmt=%s ", filename, fmt);
|
2014-12-09 15:38:04 +08:00
|
|
|
qemu_opts_print(opts, " ");
|
2013-02-13 16:09:40 +08:00
|
|
|
puts("");
|
|
|
|
}
|
2014-06-05 17:20:51 +08:00
|
|
|
|
2014-06-05 17:21:11 +08:00
|
|
|
ret = bdrv_create(drv, filename, opts, &local_err);
|
2014-06-05 17:20:51 +08:00
|
|
|
|
2013-09-06 23:14:26 +08:00
|
|
|
if (ret == -EFBIG) {
|
|
|
|
/* This is generally a better message than whatever the driver would
|
|
|
|
* deliver (especially because of the cluster_size_hint), since that
|
|
|
|
* is most probably not much different from "image too large". */
|
|
|
|
const char *cluster_size_hint = "";
|
2014-06-05 17:20:51 +08:00
|
|
|
if (qemu_opt_get_size(opts, BLOCK_OPT_CLUSTER_SIZE, 0)) {
|
2013-09-06 23:14:26 +08:00
|
|
|
cluster_size_hint = " (try using a larger cluster size)";
|
2010-12-16 20:52:15 +08:00
|
|
|
}
|
2013-09-06 23:14:26 +08:00
|
|
|
error_setg(errp, "The image size is too large for file format '%s'"
|
|
|
|
"%s", fmt, cluster_size_hint);
|
|
|
|
error_free(local_err);
|
|
|
|
local_err = NULL;
|
2010-12-16 20:52:15 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
out:
|
2014-06-05 17:20:51 +08:00
|
|
|
qemu_opts_del(opts);
|
|
|
|
qemu_opts_free(create_opts);
|
2014-01-30 22:07:28 +08:00
|
|
|
if (local_err) {
|
2013-09-06 23:14:26 +08:00
|
|
|
error_propagate(errp, local_err);
|
|
|
|
}
|
2010-12-16 20:52:15 +08:00
|
|
|
}
|
2013-03-07 20:41:48 +08:00
|
|
|
|
|
|
|
/* Return the AioContext currently recorded in @bs->aio_context. */
AioContext *bdrv_get_aio_context(BlockDriverState *bs)
{
    AioContext *ctx = bs->aio_context;

    return ctx;
}
|
|
|
|
|
|
|
|
/*
 * Detach @bs, and recursively its file and backing children, from the
 * AioContext it is currently attached to.
 *
 * Does nothing when @bs has no driver.  Otherwise, in this order: the
 * registered detach notifiers are invoked, the throttle timers are detached
 * (if throttling is configured), the driver's own detach hook is run (if it
 * has one), the children are detached, and finally bs->aio_context is
 * cleared.
 */
void bdrv_detach_aio_context(BlockDriverState *bs)
{
    BdrvAioNotifier *baf, *baf_next;

    if (!bs->drv) {
        return;
    }

    /* Use the _SAFE iterator: a callback that unregisters its own notifier
     * through bdrv_remove_aio_context_notifier() unlinks and frees the entry
     * we are standing on, so the successor must be fetched beforehand. */
    QLIST_FOREACH_SAFE(baf, &bs->aio_notifiers, list, baf_next) {
        baf->detach_aio_context(baf->opaque);
    }

    if (bs->throttle_state) {
        throttle_timers_detach_aio_context(&bs->throttle_timers);
    }
    if (bs->drv->bdrv_detach_aio_context) {
        bs->drv->bdrv_detach_aio_context(bs);
    }
    if (bs->file) {
        bdrv_detach_aio_context(bs->file->bs);
    }
    if (bs->backing) {
        bdrv_detach_aio_context(bs->backing->bs);
    }

    bs->aio_context = NULL;
}
|
|
|
|
|
|
|
|
void bdrv_attach_aio_context(BlockDriverState *bs,
|
|
|
|
AioContext *new_context)
|
|
|
|
{
|
2014-06-21 03:57:33 +08:00
|
|
|
BdrvAioNotifier *ban;
|
|
|
|
|
2014-05-08 22:34:37 +08:00
|
|
|
if (!bs->drv) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
bs->aio_context = new_context;
|
|
|
|
|
2015-06-17 20:55:21 +08:00
|
|
|
if (bs->backing) {
|
|
|
|
bdrv_attach_aio_context(bs->backing->bs, new_context);
|
2014-05-08 22:34:37 +08:00
|
|
|
}
|
|
|
|
if (bs->file) {
|
2015-06-16 20:19:22 +08:00
|
|
|
bdrv_attach_aio_context(bs->file->bs, new_context);
|
2014-05-08 22:34:37 +08:00
|
|
|
}
|
|
|
|
if (bs->drv->bdrv_attach_aio_context) {
|
|
|
|
bs->drv->bdrv_attach_aio_context(bs, new_context);
|
|
|
|
}
|
2015-11-04 21:15:36 +08:00
|
|
|
if (bs->throttle_state) {
|
2015-06-09 00:17:41 +08:00
|
|
|
throttle_timers_attach_aio_context(&bs->throttle_timers, new_context);
|
2014-05-14 22:22:45 +08:00
|
|
|
}
|
2014-06-21 03:57:33 +08:00
|
|
|
|
|
|
|
QLIST_FOREACH(ban, &bs->aio_notifiers, list) {
|
|
|
|
ban->attached_aio_context(new_context, ban->opaque);
|
|
|
|
}
|
2014-05-08 22:34:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Switch @bs over to @new_context: drain it, detach it from its current
 * AioContext, then attach it to @new_context while holding that context.
 */
void bdrv_set_aio_context(BlockDriverState *bs, AioContext *new_context)
{
    /* No request may still be in flight while the context is switched */
    bdrv_drain(bs);

    bdrv_detach_aio_context(bs);

    /* We are still executing in the old AioContext at this point.  The new
     * one may be running in a different thread, so hold it for the duration
     * of the attach. */
    aio_context_acquire(new_context);
    bdrv_attach_aio_context(bs, new_context);
    aio_context_release(new_context);
}
|
2013-06-24 23:13:10 +08:00
|
|
|
|
2014-06-21 03:57:33 +08:00
|
|
|
void bdrv_add_aio_context_notifier(BlockDriverState *bs,
|
|
|
|
void (*attached_aio_context)(AioContext *new_context, void *opaque),
|
|
|
|
void (*detach_aio_context)(void *opaque), void *opaque)
|
|
|
|
{
|
|
|
|
BdrvAioNotifier *ban = g_new(BdrvAioNotifier, 1);
|
|
|
|
*ban = (BdrvAioNotifier){
|
|
|
|
.attached_aio_context = attached_aio_context,
|
|
|
|
.detach_aio_context = detach_aio_context,
|
|
|
|
.opaque = opaque
|
|
|
|
};
|
|
|
|
|
|
|
|
QLIST_INSERT_HEAD(&bs->aio_notifiers, ban, list);
|
|
|
|
}
|
|
|
|
|
|
|
|
void bdrv_remove_aio_context_notifier(BlockDriverState *bs,
|
|
|
|
void (*attached_aio_context)(AioContext *,
|
|
|
|
void *),
|
|
|
|
void (*detach_aio_context)(void *),
|
|
|
|
void *opaque)
|
|
|
|
{
|
|
|
|
BdrvAioNotifier *ban, *ban_next;
|
|
|
|
|
|
|
|
QLIST_FOREACH_SAFE(ban, &bs->aio_notifiers, list, ban_next) {
|
|
|
|
if (ban->attached_aio_context == attached_aio_context &&
|
|
|
|
ban->detach_aio_context == detach_aio_context &&
|
|
|
|
ban->opaque == opaque)
|
|
|
|
{
|
|
|
|
QLIST_REMOVE(ban, list);
|
|
|
|
g_free(ban);
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
|
2014-10-27 18:12:50 +08:00
|
|
|
int bdrv_amend_options(BlockDriverState *bs, QemuOpts *opts,
|
2015-07-27 23:51:32 +08:00
|
|
|
BlockDriverAmendStatusCB *status_cb, void *cb_opaque)
|
2013-09-03 16:09:50 +08:00
|
|
|
{
|
2014-06-05 17:21:11 +08:00
|
|
|
if (!bs->drv->bdrv_amend_options) {
|
2013-09-03 16:09:50 +08:00
|
|
|
return -ENOTSUP;
|
|
|
|
}
|
2015-07-27 23:51:32 +08:00
|
|
|
return bs->drv->bdrv_amend_options(bs, opts, status_cb, cb_opaque);
|
2013-09-03 16:09:50 +08:00
|
|
|
}
|
2013-10-02 20:33:48 +08:00
|
|
|
|
2014-03-04 02:11:34 +08:00
|
|
|
/* This function will be called by the bdrv_recurse_is_first_non_filter method
|
|
|
|
* of block filter and by bdrv_is_first_non_filter.
|
|
|
|
* It is used to test if the given bs is the candidate or recurse more in the
|
|
|
|
* node graph.
|
2014-01-24 04:31:36 +08:00
|
|
|
*/
|
2014-03-04 02:11:34 +08:00
|
|
|
bool bdrv_recurse_is_first_non_filter(BlockDriverState *bs,
|
2014-01-24 04:31:36 +08:00
|
|
|
BlockDriverState *candidate)
|
2013-10-02 20:33:48 +08:00
|
|
|
{
|
2014-03-04 02:11:34 +08:00
|
|
|
/* return false if basic checks fails */
|
|
|
|
if (!bs || !bs->drv) {
|
2014-01-24 04:31:36 +08:00
|
|
|
return false;
|
2013-10-02 20:33:48 +08:00
|
|
|
}
|
|
|
|
|
2014-03-04 02:11:34 +08:00
|
|
|
/* the code reached a non block filter driver -> check if the bs is
|
|
|
|
* the same as the candidate. It's the recursion termination condition.
|
|
|
|
*/
|
|
|
|
if (!bs->drv->is_filter) {
|
|
|
|
return bs == candidate;
|
2014-01-24 04:31:36 +08:00
|
|
|
}
|
2014-03-04 02:11:34 +08:00
|
|
|
/* Down this path the driver is a block filter driver */
|
2014-01-24 04:31:36 +08:00
|
|
|
|
2014-03-04 02:11:34 +08:00
|
|
|
/* If the block filter recursion method is defined use it to recurse down
|
|
|
|
* the node graph.
|
|
|
|
*/
|
|
|
|
if (bs->drv->bdrv_recurse_is_first_non_filter) {
|
2014-01-24 04:31:36 +08:00
|
|
|
return bs->drv->bdrv_recurse_is_first_non_filter(bs, candidate);
|
2013-10-02 20:33:48 +08:00
|
|
|
}
|
|
|
|
|
2014-03-04 02:11:34 +08:00
|
|
|
/* the driver is a block filter but don't allow to recurse -> return false
|
|
|
|
*/
|
|
|
|
return false;
|
2013-10-02 20:33:48 +08:00
|
|
|
}
|
|
|
|
|
2014-01-24 04:31:36 +08:00
|
|
|
/* This function checks if the candidate is the first non filter bs down it's
|
|
|
|
* bs chain. Since we don't have pointers to parents it explore all bs chains
|
|
|
|
* from the top. Some filters can choose not to pass down the recursion.
|
|
|
|
*/
|
|
|
|
bool bdrv_is_first_non_filter(BlockDriverState *candidate)
|
2013-10-02 20:33:48 +08:00
|
|
|
{
|
2014-01-24 04:31:36 +08:00
|
|
|
BlockDriverState *bs;
|
|
|
|
|
|
|
|
/* walk down the bs forest recursively */
|
|
|
|
QTAILQ_FOREACH(bs, &bdrv_states, device_list) {
|
|
|
|
bool perm;
|
|
|
|
|
2014-03-04 02:11:34 +08:00
|
|
|
/* try to recurse in this top level bs */
|
2014-02-04 18:45:31 +08:00
|
|
|
perm = bdrv_recurse_is_first_non_filter(bs, candidate);
|
2014-01-24 04:31:36 +08:00
|
|
|
|
|
|
|
/* candidate is the first non filter */
|
|
|
|
if (perm) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
2013-10-02 20:33:48 +08:00
|
|
|
}
|
2014-06-28 00:25:25 +08:00
|
|
|
|
2015-07-17 10:12:22 +08:00
|
|
|
/*
 * Look up the node called @node_name and verify that it may be replaced
 * below @parent_bs.
 *
 * Returns the node on success.  Returns NULL with @errp set when the node
 * does not exist, when BLOCK_OP_TYPE_REPLACE is blocked on it, or when it is
 * not the first non-filter node reachable from @parent_bs.
 *
 * The node's AioContext is held while the checks run and released before
 * returning.
 */
BlockDriverState *check_to_replace_node(BlockDriverState *parent_bs,
                                        const char *node_name, Error **errp)
{
    BlockDriverState *target = bdrv_find_node(node_name);
    AioContext *ctx;

    if (target == NULL) {
        error_setg(errp, "Node name '%s' not found", node_name);
        return NULL;
    }

    ctx = bdrv_get_aio_context(target);
    aio_context_acquire(ctx);

    if (bdrv_op_is_blocked(target, BLOCK_OP_TYPE_REPLACE, errp)) {
        target = NULL;
    } else if (!bdrv_recurse_is_first_non_filter(parent_bs, target)) {
        /* Only the topmost non-filter node may be replaced, never an
         * arbitrary node of the BDS chain; this prevents data corruption.
         * As a side benefit this test also excludes backing files, which
         * are blocked by the backing blockers. */
        error_setg(errp, "Only top most non filter can be replaced");
        target = NULL;
    }

    aio_context_release(ctx);
    return target;
}
|
2014-07-04 18:04:33 +08:00
|
|
|
|
2014-07-19 02:24:56 +08:00
|
|
|
/*
 * Copy into @d every entry of bs->options that is neither addressed to a
 * child of @bs nor listed in bdrv_runtime_opts.  Each copied value gets an
 * extra reference before it is stored in @d.
 *
 * Returns true if at least one entry was copied.
 */
static bool append_open_options(QDict *d, BlockDriverState *bs)
{
    const QDictEntry *entry;
    bool found_any = false;

    for (entry = qdict_first(bs->options); entry;
         entry = qdict_next(bs->options, entry))
    {
        const char *key = qdict_entry_key(entry);
        QObject *value;
        QemuOptDesc *desc;
        BdrvChild *child;
        const char *rest;
        bool skip = false;

        /* Keys of the form "<child>" or "<child>.<...>" belong to a child */
        QLIST_FOREACH(child, &bs->children, next) {
            if (strstart(key, child->name, &rest)
                && (*rest == '\0' || *rest == '.'))
            {
                skip = true;
                break;
            }
        }
        if (skip) {
            continue;
        }

        /* Options listed in bdrv_runtime_opts are not driver-specific */
        for (desc = bdrv_runtime_opts.desc; desc->name; desc++) {
            if (strcmp(key, desc->name) == 0) {
                skip = true;
                break;
            }
        }
        if (skip) {
            continue;
        }

        value = qdict_entry_value(entry);
        qobject_incref(value);
        qdict_put_obj(d, key, value);
        found_any = true;
    }

    return found_any;
}
|
|
|
|
|
|
|
|
/* Updates the following BDS fields:
|
|
|
|
* - exact_filename: A filename which may be used for opening a block device
|
|
|
|
* which (mostly) equals the given BDS (even without any
|
|
|
|
* other options; so reading and writing must return the same
|
|
|
|
* results, but caching etc. may be different)
|
|
|
|
* - full_open_options: Options which, when given when opening a block device
|
|
|
|
* (without a filename), result in a BDS (mostly)
|
|
|
|
* equalling the given one
|
|
|
|
* - filename: If exact_filename is set, it is copied here. Otherwise,
|
|
|
|
* full_open_options is converted to a JSON object, prefixed with
|
|
|
|
* "json:" (for use through the JSON pseudo protocol) and put here.
|
|
|
|
*/
|
|
|
|
void bdrv_refresh_filename(BlockDriverState *bs)
|
|
|
|
{
|
|
|
|
BlockDriver *drv = bs->drv;
|
|
|
|
QDict *opts;
|
|
|
|
|
|
|
|
if (!drv) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This BDS's file name will most probably depend on its file's name, so
|
|
|
|
* refresh that first */
|
|
|
|
if (bs->file) {
|
2015-06-16 20:19:22 +08:00
|
|
|
bdrv_refresh_filename(bs->file->bs);
|
2014-07-19 02:24:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (drv->bdrv_refresh_filename) {
|
|
|
|
/* Obsolete information is of no use here, so drop the old file name
|
|
|
|
* information before refreshing it */
|
|
|
|
bs->exact_filename[0] = '\0';
|
|
|
|
if (bs->full_open_options) {
|
|
|
|
QDECREF(bs->full_open_options);
|
|
|
|
bs->full_open_options = NULL;
|
|
|
|
}
|
|
|
|
|
2015-04-27 19:50:54 +08:00
|
|
|
opts = qdict_new();
|
|
|
|
append_open_options(opts, bs);
|
|
|
|
drv->bdrv_refresh_filename(bs, opts);
|
|
|
|
QDECREF(opts);
|
2014-07-19 02:24:56 +08:00
|
|
|
} else if (bs->file) {
|
|
|
|
/* Try to reconstruct valid information from the underlying file */
|
|
|
|
bool has_open_options;
|
|
|
|
|
|
|
|
bs->exact_filename[0] = '\0';
|
|
|
|
if (bs->full_open_options) {
|
|
|
|
QDECREF(bs->full_open_options);
|
|
|
|
bs->full_open_options = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
opts = qdict_new();
|
|
|
|
has_open_options = append_open_options(opts, bs);
|
|
|
|
|
|
|
|
/* If no specific options have been given for this BDS, the filename of
|
|
|
|
* the underlying file should suffice for this one as well */
|
2015-06-16 20:19:22 +08:00
|
|
|
if (bs->file->bs->exact_filename[0] && !has_open_options) {
|
|
|
|
strcpy(bs->exact_filename, bs->file->bs->exact_filename);
|
2014-07-19 02:24:56 +08:00
|
|
|
}
|
|
|
|
/* Reconstructing the full options QDict is simple for most format block
|
|
|
|
* drivers, as long as the full options are known for the underlying
|
|
|
|
* file BDS. The full options QDict of that file BDS should somehow
|
|
|
|
* contain a representation of the filename, therefore the following
|
|
|
|
* suffices without querying the (exact_)filename of this BDS. */
|
2015-06-16 20:19:22 +08:00
|
|
|
if (bs->file->bs->full_open_options) {
|
2014-07-19 02:24:56 +08:00
|
|
|
qdict_put_obj(opts, "driver",
|
|
|
|
QOBJECT(qstring_from_str(drv->format_name)));
|
2015-06-16 20:19:22 +08:00
|
|
|
QINCREF(bs->file->bs->full_open_options);
|
|
|
|
qdict_put_obj(opts, "file",
|
|
|
|
QOBJECT(bs->file->bs->full_open_options));
|
2014-07-19 02:24:56 +08:00
|
|
|
|
|
|
|
bs->full_open_options = opts;
|
|
|
|
} else {
|
|
|
|
QDECREF(opts);
|
|
|
|
}
|
|
|
|
} else if (!bs->full_open_options && qdict_size(bs->options)) {
|
|
|
|
/* There is no underlying file BDS (at least referenced by BDS.file),
|
|
|
|
* so the full options QDict should be equal to the options given
|
|
|
|
* specifically for this block device when it was opened (plus the
|
|
|
|
* driver specification).
|
|
|
|
* Because those options don't change, there is no need to update
|
|
|
|
* full_open_options when it's already set. */
|
|
|
|
|
|
|
|
opts = qdict_new();
|
|
|
|
append_open_options(opts, bs);
|
|
|
|
qdict_put_obj(opts, "driver",
|
|
|
|
QOBJECT(qstring_from_str(drv->format_name)));
|
|
|
|
|
|
|
|
if (bs->exact_filename[0]) {
|
|
|
|
/* This may not work for all block protocol drivers (some may
|
|
|
|
* require this filename to be parsed), but we have to find some
|
|
|
|
* default solution here, so just include it. If some block driver
|
|
|
|
* does not support pure options without any filename at all or
|
|
|
|
* needs some special format of the options QDict, it needs to
|
|
|
|
* implement the driver-specific bdrv_refresh_filename() function.
|
|
|
|
*/
|
|
|
|
qdict_put_obj(opts, "filename",
|
|
|
|
QOBJECT(qstring_from_str(bs->exact_filename)));
|
|
|
|
}
|
|
|
|
|
|
|
|
bs->full_open_options = opts;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (bs->exact_filename[0]) {
|
|
|
|
pstrcpy(bs->filename, sizeof(bs->filename), bs->exact_filename);
|
|
|
|
} else if (bs->full_open_options) {
|
|
|
|
QString *json = qobject_to_json(QOBJECT(bs->full_open_options));
|
|
|
|
snprintf(bs->filename, sizeof(bs->filename), "json:%s",
|
|
|
|
qstring_get_str(json));
|
|
|
|
QDECREF(json);
|
|
|
|
}
|
|
|
|
}
|