/*
 * QEMU System Emulator block driver
 *
 * Copyright (c) 2003 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24#ifndef BLOCK_INT_H
25#define BLOCK_INT_H
26
pbrookfaf07962007-11-11 02:51:17 +000027#include "block.h"
Kevin Wolf0e7e1982009-05-18 16:42:10 +020028#include "qemu-option.h"
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +010029#include "qemu-queue.h"
Kevin Wolfda1fa912011-07-14 17:27:13 +020030#include "qemu-coroutine.h"
Christoph Hellwigc488c7f2011-08-25 08:26:10 +020031#include "qemu-timer.h"
Luiz Capitulinob2023812011-09-21 17:16:47 -030032#include "qapi-types.h"
pbrookfaf07962007-11-11 02:51:17 +000033
/*
 * Block flag values. The two values occupy distinct bits, so they can be
 * OR-ed together; where they are consumed is not visible in this header.
 */
#define BLOCK_FLAG_ENCRYPT 1
#define BLOCK_FLAG_COMPAT6 4

/*
 * I/O limit slots. BlockIOLimit in this header holds three-entry bps[] and
 * iops[] arrays; presumably these constants are the indices into them
 * (TODO confirm against the throttling code).
 */
#define BLOCK_IO_LIMIT_READ 0
#define BLOCK_IO_LIMIT_WRITE 1
#define BLOCK_IO_LIMIT_TOTAL 2

/*
 * NOTE(review): the unit is not stated here; given NANOSECONDS_PER_SECOND
 * below this looks like nanoseconds (i.e. 100 ms) -- confirm.
 */
#define BLOCK_IO_SLICE_TIME 100000000
/* Floating-point constant: expressions using it are evaluated as double. */
#define NANOSECONDS_PER_SECOND 1000000000.0

/*
 * Option name strings. BlockDriver.create_options in this header is a list
 * of image-creation options keyed by name; presumably these are the names
 * used there (TODO confirm in the individual drivers).
 */
#define BLOCK_OPT_SIZE "size"
#define BLOCK_OPT_ENCRYPT "encryption"
#define BLOCK_OPT_COMPAT6 "compat6"
#define BLOCK_OPT_BACKING_FILE "backing_file"
#define BLOCK_OPT_BACKING_FMT "backing_fmt"
#define BLOCK_OPT_CLUSTER_SIZE "cluster_size"
#define BLOCK_OPT_TABLE_SIZE "table_size"
#define BLOCK_OPT_PREALLOC "preallocation"
#define BLOCK_OPT_SUBFMT "subformat"

/*
 * Forward declaration only: the structure body is not defined in this
 * header. It is the element type of BlockDriverState.tracked_requests.
 */
typedef struct BdrvTrackedRequest BdrvTrackedRequest;

aliguori6bbff9a2009-03-20 18:25:59 +000056typedef struct AIOPool {
57 void (*cancel)(BlockDriverAIOCB *acb);
58 int aiocb_size;
59 BlockDriverAIOCB *free_aiocb;
60} AIOPool;
61
/*
 * I/O limits, three slots per metric. The slot count matches the
 * BLOCK_IO_LIMIT_READ/WRITE/TOTAL constants (0..2); presumably those are
 * the indices (TODO confirm).
 */
typedef struct BlockIOLimit {
    int64_t bps[3];     /* NOTE(review): presumably bytes per second */
    int64_t iops[3];    /* NOTE(review): presumably I/O operations per second */
} BlockIOLimit;

/*
 * Byte and operation counters, two slots each.
 * NOTE(review): presumably indexed by BLOCK_IO_LIMIT_READ/WRITE and used as
 * the baseline for I/O throttling accounting -- confirm against the users.
 */
typedef struct BlockIOBaseValue {
    uint64_t bytes[2];
    uint64_t ios[2];
} BlockIOBaseValue;

/* Function type taking a single opaque pointer and returning nothing. */
typedef void BlockJobCancelFunc(void *opaque);
typedef struct BlockJob BlockJob;

/**
 * Static description of one kind of block job; referenced from
 * BlockJob.job_type and passed to block_job_create().
 */
typedef struct BlockJobType {
    /** Derived BlockJob struct size */
    size_t instance_size;

    /** String describing the operation, part of query-block-jobs QMP API */
    const char *job_type;

    /** Optional callback for job types that support setting a speed limit */
    int (*set_speed)(BlockJob *job, int64_t value);
} BlockJobType;

85/**
86 * Long-running operation on a BlockDriverState
87 */
88struct BlockJob {
89 const BlockJobType *job_type;
90 BlockDriverState *bs;
91 bool cancelled;
92
93 /* These fields are published by the query-block-jobs QMP API */
94 int64_t offset;
95 int64_t len;
96 int64_t speed;
97
98 BlockDriverCompletionFunc *cb;
99 void *opaque;
100};
101
bellardea2384d2004-08-01 21:59:26 +0000102struct BlockDriver {
103 const char *format_name;
104 int instance_size;
105 int (*bdrv_probe)(const uint8_t *buf, int buf_size, const char *filename);
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200106 int (*bdrv_probe_device)(const char *filename);
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200107 int (*bdrv_open)(BlockDriverState *bs, int flags);
108 int (*bdrv_file_open)(BlockDriverState *bs, const char *filename, int flags);
ths5fafdf22007-09-16 21:08:06 +0000109 int (*bdrv_read)(BlockDriverState *bs, int64_t sector_num,
bellardea2384d2004-08-01 21:59:26 +0000110 uint8_t *buf, int nb_sectors);
ths5fafdf22007-09-16 21:08:06 +0000111 int (*bdrv_write)(BlockDriverState *bs, int64_t sector_num,
bellardea2384d2004-08-01 21:59:26 +0000112 const uint8_t *buf, int nb_sectors);
bellarde2731ad2004-09-18 19:32:11 +0000113 void (*bdrv_close)(BlockDriverState *bs);
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200114 int (*bdrv_create)(const char *filename, QEMUOptionParameter *options);
bellardea2384d2004-08-01 21:59:26 +0000115 int (*bdrv_set_key)(BlockDriverState *bs, const char *key);
bellard95389c82005-12-18 18:28:15 +0000116 int (*bdrv_make_empty)(BlockDriverState *bs);
bellard83f64092006-08-01 16:21:11 +0000117 /* aio */
aliguorif141eaf2009-04-07 18:43:24 +0000118 BlockDriverAIOCB *(*bdrv_aio_readv)(BlockDriverState *bs,
119 int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
pbrookce1a14d2006-08-07 02:38:06 +0000120 BlockDriverCompletionFunc *cb, void *opaque);
aliguorif141eaf2009-04-07 18:43:24 +0000121 BlockDriverAIOCB *(*bdrv_aio_writev)(BlockDriverState *bs,
122 int64_t sector_num, QEMUIOVector *qiov, int nb_sectors,
pbrookce1a14d2006-08-07 02:38:06 +0000123 BlockDriverCompletionFunc *cb, void *opaque);
Christoph Hellwigb2e12bc2009-09-04 19:01:49 +0200124 BlockDriverAIOCB *(*bdrv_aio_flush)(BlockDriverState *bs,
125 BlockDriverCompletionFunc *cb, void *opaque);
Paolo Bonzini4265d622011-10-17 12:32:14 +0200126 BlockDriverAIOCB *(*bdrv_aio_discard)(BlockDriverState *bs,
127 int64_t sector_num, int nb_sectors,
128 BlockDriverCompletionFunc *cb, void *opaque);
bellard83f64092006-08-01 16:21:11 +0000129
Kevin Wolfda1fa912011-07-14 17:27:13 +0200130 int coroutine_fn (*bdrv_co_readv)(BlockDriverState *bs,
131 int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
132 int coroutine_fn (*bdrv_co_writev)(BlockDriverState *bs,
133 int64_t sector_num, int nb_sectors, QEMUIOVector *qiov);
Stefan Hajnoczif08f2dd2012-02-07 13:27:25 +0000134 /*
135 * Efficiently zero a region of the disk image. Typically an image format
136 * would use a compact metadata representation to implement this. This
137 * function pointer may be NULL and .bdrv_co_writev() will be called
138 * instead.
139 */
140 int coroutine_fn (*bdrv_co_write_zeroes)(BlockDriverState *bs,
141 int64_t sector_num, int nb_sectors);
Paolo Bonzini4265d622011-10-17 12:32:14 +0200142 int coroutine_fn (*bdrv_co_discard)(BlockDriverState *bs,
143 int64_t sector_num, int nb_sectors);
Stefan Hajnoczi376ae3f2011-11-14 12:44:19 +0000144 int coroutine_fn (*bdrv_co_is_allocated)(BlockDriverState *bs,
145 int64_t sector_num, int nb_sectors, int *pnum);
Kevin Wolfda1fa912011-07-14 17:27:13 +0200146
Kevin Wolfc68b89a2011-11-10 17:25:44 +0100147 /*
Anthony Liguori0f154232011-11-14 15:09:45 -0600148 * Invalidate any cached meta-data.
149 */
150 void (*bdrv_invalidate_cache)(BlockDriverState *bs);
151
152 /*
Kevin Wolfc68b89a2011-11-10 17:25:44 +0100153 * Flushes all data that was already written to the OS all the way down to
154 * the disk (for example raw-posix calls fsync()).
155 */
156 int coroutine_fn (*bdrv_co_flush_to_disk)(BlockDriverState *bs);
157
Kevin Wolfeb489bb2011-11-10 18:10:11 +0100158 /*
159 * Flushes all internal caches to the OS. The data may still sit in a
160 * writeback cache of the host OS, but it will survive a crash of the qemu
161 * process.
162 */
163 int coroutine_fn (*bdrv_co_flush_to_os)(BlockDriverState *bs);
164
bellard83f64092006-08-01 16:21:11 +0000165 const char *protocol_name;
bellard83f64092006-08-01 16:21:11 +0000166 int (*bdrv_truncate)(BlockDriverState *bs, int64_t offset);
167 int64_t (*bdrv_getlength)(BlockDriverState *bs);
Fam Zheng4a1d5e12011-07-12 19:56:39 +0800168 int64_t (*bdrv_get_allocated_file_size)(BlockDriverState *bs);
ths5fafdf22007-09-16 21:08:06 +0000169 int (*bdrv_write_compressed)(BlockDriverState *bs, int64_t sector_num,
bellardfaea38e2006-08-05 21:31:00 +0000170 const uint8_t *buf, int nb_sectors);
171
ths5fafdf22007-09-16 21:08:06 +0000172 int (*bdrv_snapshot_create)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000173 QEMUSnapshotInfo *sn_info);
ths5fafdf22007-09-16 21:08:06 +0000174 int (*bdrv_snapshot_goto)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000175 const char *snapshot_id);
176 int (*bdrv_snapshot_delete)(BlockDriverState *bs, const char *snapshot_id);
ths5fafdf22007-09-16 21:08:06 +0000177 int (*bdrv_snapshot_list)(BlockDriverState *bs,
bellardfaea38e2006-08-05 21:31:00 +0000178 QEMUSnapshotInfo **psn_info);
edison51ef6722010-09-21 19:58:41 -0700179 int (*bdrv_snapshot_load_tmp)(BlockDriverState *bs,
180 const char *snapshot_name);
bellardfaea38e2006-08-05 21:31:00 +0000181 int (*bdrv_get_info)(BlockDriverState *bs, BlockDriverInfo *bdi);
bellard83f64092006-08-01 16:21:11 +0000182
Christoph Hellwig45566e92009-07-10 23:11:57 +0200183 int (*bdrv_save_vmstate)(BlockDriverState *bs, const uint8_t *buf,
184 int64_t pos, int size);
185 int (*bdrv_load_vmstate)(BlockDriverState *bs, uint8_t *buf,
186 int64_t pos, int size);
aliguori178e08a2009-04-05 19:10:55 +0000187
Kevin Wolf756e6732010-01-12 12:55:17 +0100188 int (*bdrv_change_backing_file)(BlockDriverState *bs,
189 const char *backing_file, const char *backing_fmt);
190
bellard19cb3732006-08-19 11:45:59 +0000191 /* removable device specific */
192 int (*bdrv_is_inserted)(BlockDriverState *bs);
193 int (*bdrv_media_changed)(BlockDriverState *bs);
Luiz Capitulinof36f3942012-02-03 16:24:53 -0200194 void (*bdrv_eject)(BlockDriverState *bs, bool eject_flag);
Markus Armbruster025e8492011-09-06 18:58:47 +0200195 void (*bdrv_lock_medium)(BlockDriverState *bs, bool locked);
ths3b46e622007-09-17 08:09:54 +0000196
ths985a03b2007-12-24 16:10:43 +0000197 /* to control generic scsi devices */
198 int (*bdrv_ioctl)(BlockDriverState *bs, unsigned long int req, void *buf);
aliguori221f7152009-03-28 17:28:41 +0000199 BlockDriverAIOCB *(*bdrv_aio_ioctl)(BlockDriverState *bs,
200 unsigned long int req, void *buf,
201 BlockDriverCompletionFunc *cb, void *opaque);
ths985a03b2007-12-24 16:10:43 +0000202
Kevin Wolf0e7e1982009-05-18 16:42:10 +0200203 /* List of options for creating images, terminated by name == NULL */
204 QEMUOptionParameter *create_options;
205
aliguori5eb45632009-03-28 17:55:10 +0000206
Kevin Wolf9ac228e2010-06-29 12:37:54 +0200207 /*
208 * Returns 0 for completed check, -errno for internal errors.
209 * The check results are stored in result.
210 */
211 int (*bdrv_check)(BlockDriverState* bs, BdrvCheckResult *result);
aliguorie97fc192009-04-21 23:11:50 +0000212
Kevin Wolf8b9b0cc2010-03-15 17:27:00 +0100213 void (*bdrv_debug_event)(BlockDriverState *bs, BlkDebugEvent event);
214
Kevin Wolf336c1c12010-07-28 11:26:29 +0200215 /*
216 * Returns 1 if newly created images are guaranteed to contain only
217 * zeros, 0 otherwise.
218 */
219 int (*bdrv_has_zero_init)(BlockDriverState *bs);
Kevin Wolf12c09b82009-11-30 16:54:15 +0100220
Stefan Hajnoczi8a22f022010-04-13 10:29:33 +0100221 QLIST_ENTRY(BlockDriver) list;
bellardea2384d2004-08-01 21:59:26 +0000222};
223
Jeff Cody8802d1f2012-02-28 15:54:06 -0500224/*
225 * Note: the function bdrv_append() copies and swaps contents of
226 * BlockDriverStates, so if you add new fields to this struct, please
227 * inspect bdrv_append() to determine if the new fields need to be
228 * copied as well.
229 */
bellardea2384d2004-08-01 21:59:26 +0000230struct BlockDriverState {
bellardd15a7712006-08-06 13:35:09 +0000231 int64_t total_sectors; /* if we are reading a disk image, give its
232 size in sectors */
bellardea2384d2004-08-01 21:59:26 +0000233 int read_only; /* if true, the media is read only */
Naphtali Sprei4dca4b62010-02-14 13:39:18 +0200234 int keep_read_only; /* if true, the media was requested to stay read only */
235 int open_flags; /* flags used to open the file, re-used for re-open */
bellardea2384d2004-08-01 21:59:26 +0000236 int encrypted; /* if true, the media is encrypted */
aliguoric0f4ce72009-03-05 23:01:01 +0000237 int valid_key; /* if true, a valid encryption key has been set */
ths985a03b2007-12-24 16:10:43 +0000238 int sg; /* if true, the device is a /dev/sg* */
Stefan Hajnoczi53fec9d2011-11-28 16:08:47 +0000239 int copy_on_read; /* if true, copy read backing sectors into image
240 note this is a reference count */
bellardea2384d2004-08-01 21:59:26 +0000241
bellard19cb3732006-08-19 11:45:59 +0000242 BlockDriver *drv; /* NULL means no media */
bellardea2384d2004-08-01 21:59:26 +0000243 void *opaque;
244
Markus Armbrusterfa879d62011-08-03 15:07:40 +0200245 void *dev; /* attached device model, if any */
246 /* TODO change to DeviceState when all users are qdevified */
Markus Armbruster0e49de52011-08-03 15:07:41 +0200247 const BlockDevOps *dev_ops;
248 void *dev_opaque;
Markus Armbruster18846de2010-06-29 16:58:30 +0200249
bellardea2384d2004-08-01 21:59:26 +0000250 char filename[1024];
251 char backing_file[1024]; /* if non zero, the image is a diff of
252 this file image */
aliguori5eb45632009-03-28 17:55:10 +0000253 char backing_format[16]; /* if non-zero and backing_file exists */
bellardea2384d2004-08-01 21:59:26 +0000254 int is_temporary;
bellard19cb3732006-08-19 11:45:59 +0000255
bellardea2384d2004-08-01 21:59:26 +0000256 BlockDriverState *backing_hd;
Kevin Wolf66f82ce2010-04-14 14:17:38 +0200257 BlockDriverState *file;
258
Stefan Hajnoczi470c0502012-01-18 14:40:42 +0000259 /* number of in-flight copy-on-read requests */
260 unsigned int copy_on_read_in_flight;
261
Zhi Yong Wu0563e192011-11-03 16:57:25 +0800262 /* the time for latest disk I/O */
263 int64_t slice_time;
264 int64_t slice_start;
265 int64_t slice_end;
266 BlockIOLimit io_limits;
267 BlockIOBaseValue io_base;
268 CoQueue throttled_reqs;
269 QEMUTimer *block_timer;
270 bool io_limits_enabled;
271
thsa36e69d2007-12-02 05:18:19 +0000272 /* I/O stats (display with "info blockstats"). */
Christoph Hellwiga597e792011-08-25 08:26:01 +0200273 uint64_t nr_bytes[BDRV_MAX_IOTYPE];
274 uint64_t nr_ops[BDRV_MAX_IOTYPE];
Christoph Hellwigc488c7f2011-08-25 08:26:10 +0200275 uint64_t total_time_ns[BDRV_MAX_IOTYPE];
Kevin Wolf294cc352010-04-28 14:34:01 +0200276 uint64_t wr_highest_sector;
thsa36e69d2007-12-02 05:18:19 +0000277
aliguori71d07702009-03-03 17:37:16 +0000278 /* Whether the disk can expand beyond total_sectors */
279 int growable;
280
aliguorie268ca52009-04-22 20:20:00 +0000281 /* the memory alignment required for the buffers handled by this driver */
282 int buffer_alignment;
283
Christoph Hellwige900a7b2009-09-04 19:01:15 +0200284 /* do we need to tell the quest if we have a volatile write cache? */
285 int enable_write_cache;
286
bellardea2384d2004-08-01 21:59:26 +0000287 /* NOTE: the following infos are only hints for real hardware
288 drivers. They are not used by the block driver */
bellard46d47672004-11-16 01:45:27 +0000289 int cyls, heads, secs, translation;
Markus Armbrusterabd7f682010-06-02 18:55:17 +0200290 BlockErrorAction on_read_error, on_write_error;
Luiz Capitulinod6bf2792011-10-14 17:11:23 -0300291 bool iostatus_enabled;
Luiz Capitulinob2023812011-09-21 17:16:47 -0300292 BlockDeviceIoStatus iostatus;
bellardea2384d2004-08-01 21:59:26 +0000293 char device_name[32];
Jan Kiszkac6d22832009-11-30 18:21:20 +0100294 unsigned long *dirty_bitmap;
Liran Schouraaa0eb72010-01-26 10:31:48 +0200295 int64_t dirty_count;
Marcelo Tosattidb593f22011-01-26 12:12:34 -0200296 int in_use; /* users other than guest access, eg. block migration */
Stefan Hajnoczi1b7bdbc2010-04-10 07:02:42 +0100297 QTAILQ_ENTRY(BlockDriverState) list;
Stefan Hajnoczidbffbdc2011-11-17 13:40:27 +0000298
299 QLIST_HEAD(, BdrvTrackedRequest) tracked_requests;
Stefan Hajnoczieeec61f2012-01-18 14:40:43 +0000300
301 /* long-running background operation */
302 BlockJob *job;
bellardea2384d2004-08-01 21:59:26 +0000303};
304
bellard83f64092006-08-01 16:21:11 +0000305struct BlockDriverAIOCB {
aliguori6bbff9a2009-03-20 18:25:59 +0000306 AIOPool *pool;
bellard83f64092006-08-01 16:21:11 +0000307 BlockDriverState *bs;
308 BlockDriverCompletionFunc *cb;
pbrookce1a14d2006-08-07 02:38:06 +0000309 void *opaque;
310 BlockDriverAIOCB *next;
bellard83f64092006-08-01 16:21:11 +0000311};
312
bellard95389c82005-12-18 18:28:15 +0000313void get_tmp_filename(char *filename, int size);
314
Christoph Hellwigc16b5a22009-05-25 12:37:32 +0200315void *qemu_aio_get(AIOPool *pool, BlockDriverState *bs,
316 BlockDriverCompletionFunc *cb, void *opaque);
pbrookce1a14d2006-08-07 02:38:06 +0000317void qemu_aio_release(void *p);
318
Zhi Yong Wu0563e192011-11-03 16:57:25 +0800319void bdrv_set_io_limits(BlockDriverState *bs,
320 BlockIOLimit *io_limits);
321
Christoph Hellwig508c7cb2009-06-15 14:04:22 +0200322#ifdef _WIN32
323int is_windows_drive(const char *filename);
324#endif
325
Stefan Hajnoczieeec61f2012-01-18 14:40:43 +0000326void *block_job_create(const BlockJobType *job_type, BlockDriverState *bs,
327 BlockDriverCompletionFunc *cb, void *opaque);
328void block_job_complete(BlockJob *job, int ret);
329int block_job_set_speed(BlockJob *job, int64_t value);
330void block_job_cancel(BlockJob *job);
331bool block_job_is_cancelled(BlockJob *job);
332
Stefan Hajnoczi4f1043b2012-01-18 14:40:44 +0000333int stream_start(BlockDriverState *bs, BlockDriverState *base,
Marcelo Tosattic8c30802012-01-18 14:40:53 +0000334 const char *base_id, BlockDriverCompletionFunc *cb,
335 void *opaque);
Stefan Hajnoczi4f1043b2012-01-18 14:40:44 +0000336
bellardea2384d2004-08-01 21:59:26 +0000337#endif /* BLOCK_INT_H */