Blame view

block.c 44.6 KB
bellard authored
1
2
/*
 * QEMU System Emulator block driver
3
 *
bellard authored
4
 * Copyright (c) 2003 Fabrice Bellard
5
 *
bellard authored
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
25
26
27
28
29
#include "config-host.h"
#ifdef _BSD
/* include native header before sys-queue.h */
#include <sys/queue.h>
#endif
pbrook authored
30
#include "qemu-common.h"
31
#include "monitor.h"
bellard authored
32
#include "block_int.h"
bellard authored
33
bellard authored
34
35
36
37
#ifdef _BSD
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/ioctl.h>
38
#ifndef __DragonFly__
bellard authored
39
40
#include <sys/disk.h>
#endif
41
#endif
bellard authored
42
bellard authored
43
44
45
#define SECTOR_BITS 9
#define SECTOR_SIZE (1 << SECTOR_BITS)
bellard authored
46
47
48
49
50
51
typedef struct BlockDriverAIOCBSync {
    BlockDriverAIOCB common;
    QEMUBH *bh;
    int ret;
} BlockDriverAIOCBSync;
52
53
54
55
56
57
static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
        int64_t sector_num, uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque);
static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
        int64_t sector_num, const uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque);
bellard authored
58
static void bdrv_aio_cancel_em(BlockDriverAIOCB *acb);
59
static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
bellard authored
60
61
62
                        uint8_t *buf, int nb_sectors);
static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
                         const uint8_t *buf, int nb_sectors);
bellard authored
63
64
65
BlockDriverState *bdrv_first;
bellard authored
66
67
static BlockDriver *first_drv;
bellard authored
68
int path_is_absolute(const char *path)
69
{
bellard authored
70
    const char *p;
71
72
73
74
75
#ifdef _WIN32
    /* specific case for names like: "\\.\d:" */
    if (*path == '/' || *path == '\\')
        return 1;
#endif
bellard authored
76
77
78
79
80
    p = strchr(path, ':');
    if (p)
        p++;
    else
        p = path;
81
82
83
84
85
#ifdef _WIN32
    return (*p == '/' || *p == '\\');
#else
    return (*p == '/');
#endif
86
87
}
bellard authored
88
89
90
91
92
93
/* if filename is absolute, just copy it to dest. Otherwise, build a
   path to it by considering it is relative to base_path. URL are
   supported. */
void path_combine(char *dest, int dest_size,
                  const char *base_path,
                  const char *filename)
94
{
bellard authored
95
96
97
98
99
100
101
102
103
104
105
106
107
    const char *p, *p1;
    int len;

    if (dest_size <= 0)
        return;
    if (path_is_absolute(filename)) {
        pstrcpy(dest, dest_size, filename);
    } else {
        p = strchr(base_path, ':');
        if (p)
            p++;
        else
            p = base_path;
108
109
110
111
112
113
114
115
116
        p1 = strrchr(base_path, '/');
#ifdef _WIN32
        {
            const char *p2;
            p2 = strrchr(base_path, '\\');
            if (!p1 || p2 > p1)
                p1 = p2;
        }
#endif
bellard authored
117
118
119
120
121
122
123
124
125
126
127
128
        if (p1)
            p1++;
        else
            p1 = base_path;
        if (p1 > p)
            p = p1;
        len = p - base_path;
        if (len > dest_size - 1)
            len = dest_size - 1;
        memcpy(dest, base_path, len);
        dest[len] = '\0';
        pstrcat(dest, dest_size, filename);
129
130
131
132
    }
}
133
static void bdrv_register(BlockDriver *bdrv)
bellard authored
134
{
135
    if (!bdrv->bdrv_aio_read) {
bellard authored
136
137
138
139
        /* add AIO emulation layer */
        bdrv->bdrv_aio_read = bdrv_aio_read_em;
        bdrv->bdrv_aio_write = bdrv_aio_write_em;
        bdrv->bdrv_aio_cancel = bdrv_aio_cancel_em;
bellard authored
140
        bdrv->aiocb_size = sizeof(BlockDriverAIOCBSync);
bellard authored
141
142
143
144
145
    } else if (!bdrv->bdrv_read && !bdrv->bdrv_pread) {
        /* add synchronous IO emulation layer */
        bdrv->bdrv_read = bdrv_read_em;
        bdrv->bdrv_write = bdrv_write_em;
    }
bellard authored
146
147
148
    bdrv->next = first_drv;
    first_drv = bdrv;
}
bellard authored
149
150
151
152
153
154
155
156

/* create a new block device (by default it is empty) */
BlockDriverState *bdrv_new(const char *device_name)
{
    BlockDriverState **pbs, *bs;

    bs = qemu_mallocz(sizeof(BlockDriverState));
    pstrcpy(bs->device_name, sizeof(bs->device_name), device_name);
bellard authored
157
158
159
160
161
162
163
    if (device_name[0] != '\0') {
        /* insert at the end */
        pbs = &bdrv_first;
        while (*pbs != NULL)
            pbs = &(*pbs)->next;
        *pbs = bs;
    }
bellard authored
164
165
166
    return bs;
}
bellard authored
167
168
169
170
171
172
173
174
175
176
BlockDriver *bdrv_find_format(const char *format_name)
{
    BlockDriver *drv1;
    for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
        if (!strcmp(drv1->format_name, format_name))
            return drv1;
    }
    return NULL;
}
177
int bdrv_create(BlockDriver *drv,
bellard authored
178
179
180
181
182
183
184
185
                const char *filename, int64_t size_in_sectors,
                const char *backing_file, int flags)
{
    if (!drv->bdrv_create)
        return -ENOTSUP;
    return drv->bdrv_create(filename, size_in_sectors, backing_file, flags);
}
bellard authored
186
#ifdef _WIN32
187
void get_tmp_filename(char *filename, int size)
bellard authored
188
{
189
    char temp_dir[MAX_PATH];
190
191
192
    GetTempPath(MAX_PATH, temp_dir);
    GetTempFileName(temp_dir, "qem", 0, filename);
bellard authored
193
194
}
#else
195
void get_tmp_filename(char *filename, int size)
bellard authored
196
{
197
    int fd;
198
    const char *tmpdir;
bellard authored
199
    /* XXX: race condition possible */
200
201
202
203
    tmpdir = getenv("TMPDIR");
    if (!tmpdir)
        tmpdir = "/tmp";
    snprintf(filename, size, "%s/vl.XXXXXX", tmpdir);
bellard authored
204
205
206
    fd = mkstemp(filename);
    close(fd);
}
bellard authored
207
#endif
bellard authored
208
209
#ifdef _WIN32
bellard authored
210
211
212
213
214
215
static int is_windows_drive_prefix(const char *filename)
{
    return (((filename[0] >= 'a' && filename[0] <= 'z') ||
             (filename[0] >= 'A' && filename[0] <= 'Z')) &&
            filename[1] == ':');
}
216
217
218
static int is_windows_drive(const char *filename)
{
219
    if (is_windows_drive_prefix(filename) &&
bellard authored
220
        filename[2] == '\0')
221
222
223
224
225
226
227
228
        return 1;
    if (strstart(filename, "\\\\.\\", NULL) ||
        strstart(filename, "//./", NULL))
        return 1;
    return 0;
}
#endif
bellard authored
229
230
231
232
233
234
static BlockDriver *find_protocol(const char *filename)
{
    BlockDriver *drv1;
    char protocol[128];
    int len;
    const char *p;
235
236

#ifdef _WIN32
bellard authored
237
238
    if (is_windows_drive(filename) ||
        is_windows_drive_prefix(filename))
239
240
        return &bdrv_raw;
#endif
bellard authored
241
242
243
244
245
246
247
248
249
    p = strchr(filename, ':');
    if (!p)
        return &bdrv_raw;
    len = p - filename;
    if (len > sizeof(protocol) - 1)
        len = sizeof(protocol) - 1;
    memcpy(protocol, filename, len);
    protocol[len] = '\0';
    for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
250
        if (drv1->protocol_name &&
bellard authored
251
252
253
254
255
256
            !strcmp(drv1->protocol_name, protocol))
            return drv1;
    }
    return NULL;
}
bellard authored
257
258
/* XXX: force raw format if block or character device ? It would
   simplify the BSD case */
bellard authored
259
260
static BlockDriver *find_image_format(const char *filename)
{
bellard authored
261
    int ret, score, score_max;
bellard authored
262
    BlockDriver *drv1, *drv;
bellard authored
263
264
    uint8_t buf[2048];
    BlockDriverState *bs;
265
266
267
268
269
270
271
272
273
274
275
    /* detect host devices. By convention, /dev/cdrom[N] is always
       recognized as a host CDROM */
    if (strstart(filename, "/dev/cdrom", NULL))
        return &bdrv_host_device;
#ifdef _WIN32
    if (is_windows_drive(filename))
        return &bdrv_host_device;
#else
    {
        struct stat st;
276
        if (stat(filename, &st) >= 0 &&
277
278
279
280
281
            (S_ISCHR(st.st_mode) || S_ISBLK(st.st_mode))) {
            return &bdrv_host_device;
        }
    }
#endif
282
bellard authored
283
    drv = find_protocol(filename);
284
    /* no need to test disk image formats for vvfat */
bellard authored
285
286
    if (drv == &bdrv_vvfat)
        return drv;
287
bellard authored
288
289
290
291
292
293
294
295
296
    ret = bdrv_file_open(&bs, filename, BDRV_O_RDONLY);
    if (ret < 0)
        return NULL;
    ret = bdrv_pread(bs, 0, buf, sizeof(buf));
    bdrv_delete(bs);
    if (ret < 0) {
        return NULL;
    }
bellard authored
297
298
    score_max = 0;
    for(drv1 = first_drv; drv1 != NULL; drv1 = drv1->next) {
bellard authored
299
300
301
302
303
304
        if (drv1->bdrv_probe) {
            score = drv1->bdrv_probe(buf, ret, filename);
            if (score > score_max) {
                score_max = score;
                drv = drv1;
            }
bellard authored
305
        }
bellard authored
306
    }
bellard authored
307
308
309
    return drv;
}
bellard authored
310
int bdrv_file_open(BlockDriverState **pbs, const char *filename, int flags)
bellard authored
311
{
bellard authored
312
313
314
315
316
317
318
319
    BlockDriverState *bs;
    int ret;

    bs = bdrv_new("");
    ret = bdrv_open2(bs, filename, flags | BDRV_O_FILE, NULL);
    if (ret < 0) {
        bdrv_delete(bs);
        return ret;
320
    }
321
    bs->growable = 1;
bellard authored
322
323
324
325
326
327
328
    *pbs = bs;
    return 0;
}

int bdrv_open(BlockDriverState *bs, const char *filename, int flags)
{
    return bdrv_open2(bs, filename, flags, NULL);
bellard authored
329
330
}
bellard authored
331
int bdrv_open2(BlockDriverState *bs, const char *filename, int flags,
bellard authored
332
333
               BlockDriver *drv)
{
bellard authored
334
    int ret, open_flags;
335
336
    char tmp_filename[PATH_MAX];
    char backing_filename[PATH_MAX];
337
bellard authored
338
339
340
    bs->read_only = 0;
    bs->is_temporary = 0;
    bs->encrypted = 0;
341
    bs->valid_key = 0;
bellard authored
342
bellard authored
343
    if (flags & BDRV_O_SNAPSHOT) {
bellard authored
344
345
        BlockDriverState *bs1;
        int64_t total_size;
346
        int is_protocol = 0;
347
bellard authored
348
349
        /* if snapshot, we create a temporary backing file and open it
           instead of opening 'filename' directly */
350
bellard authored
351
352
        /* if there is a backing file, use it */
        bs1 = bdrv_new("");
353
354
        ret = bdrv_open(bs1, filename, 0);
        if (ret < 0) {
bellard authored
355
            bdrv_delete(bs1);
356
            return ret;
bellard authored
357
        }
bellard authored
358
        total_size = bdrv_getlength(bs1) >> SECTOR_BITS;
359
360
361
362

        if (bs1->drv && bs1->drv->protocol_name)
            is_protocol = 1;
bellard authored
363
        bdrv_delete(bs1);
364
bellard authored
365
        get_tmp_filename(tmp_filename, sizeof(tmp_filename));
366
367
368
369
370
371
372
373

        /* Real path is meaningless for protocols */
        if (is_protocol)
            snprintf(backing_filename, sizeof(backing_filename),
                     "%s", filename);
        else
            realpath(filename, backing_filename);
374
375
376
377
        ret = bdrv_create(&bdrv_qcow2, tmp_filename,
                          total_size, backing_filename, 0);
        if (ret < 0) {
            return ret;
bellard authored
378
379
380
381
        }
        filename = tmp_filename;
        bs->is_temporary = 1;
    }
bellard authored
382
bellard authored
383
    pstrcpy(bs->filename, sizeof(bs->filename), filename);
bellard authored
384
385
    if (flags & BDRV_O_FILE) {
        drv = find_protocol(filename);
386
387
388
389
390
391
    } else if (!drv) {
        drv = find_image_format(filename);
    }
    if (!drv) {
        ret = -ENOENT;
        goto unlink_and_fail;
bellard authored
392
393
394
    }
    bs->drv = drv;
    bs->opaque = qemu_mallocz(drv->instance_size);
bellard authored
395
396
397
    /* Note: for compatibility, we open disk image files as RDWR, and
       RDONLY as fallback */
    if (!(flags & BDRV_O_FILE))
398
        open_flags = BDRV_O_RDWR | (flags & BDRV_O_CACHE_MASK);
bellard authored
399
400
401
    else
        open_flags = flags & ~(BDRV_O_FILE | BDRV_O_SNAPSHOT);
    ret = drv->bdrv_open(bs, filename, open_flags);
402
    if ((ret == -EACCES || ret == -EPERM) && !(flags & BDRV_O_FILE)) {
403
        ret = drv->bdrv_open(bs, filename, open_flags & ~BDRV_O_RDWR);
bellard authored
404
405
        bs->read_only = 1;
    }
bellard authored
406
407
    if (ret < 0) {
        qemu_free(bs->opaque);
bellard authored
408
409
        bs->opaque = NULL;
        bs->drv = NULL;
410
411
412
    unlink_and_fail:
        if (bs->is_temporary)
            unlink(filename);
bellard authored
413
        return ret;
414
    }
415
416
417
    if (drv->bdrv_getlength) {
        bs->total_sectors = bdrv_getlength(bs) >> SECTOR_BITS;
    }
418
#ifndef _WIN32
bellard authored
419
420
421
422
    if (bs->is_temporary) {
        unlink(filename);
    }
#endif
bellard authored
423
    if (bs->backing_file[0] != '\0') {
bellard authored
424
425
        /* if there is a backing file, use it */
        bs->backing_hd = bdrv_new("");
bellard authored
426
427
        path_combine(backing_filename, sizeof(backing_filename),
                     filename, bs->backing_file);
428
429
430
431
432
        ret = bdrv_open(bs->backing_hd, backing_filename, open_flags);
        if (ret < 0) {
            bdrv_close(bs);
            return ret;
        }
433
434
    }
435
436
437
438
439
440
    if (!bdrv_key_required(bs)) {
        /* call the change callback */
        bs->media_changed = 1;
        if (bs->change_cb)
            bs->change_cb(bs->change_opaque);
    }
bellard authored
441
    return 0;
bellard authored
442
443
444
445
}

void bdrv_close(BlockDriverState *bs)
{
446
    if (bs->drv) {
bellard authored
447
448
449
450
451
452
453
454
        if (bs->backing_hd)
            bdrv_delete(bs->backing_hd);
        bs->drv->bdrv_close(bs);
        qemu_free(bs->opaque);
#ifdef _WIN32
        if (bs->is_temporary) {
            unlink(bs->filename);
        }
455
#endif
bellard authored
456
457
        bs->opaque = NULL;
        bs->drv = NULL;
bellard authored
458
459

        /* call the change callback */
460
        bs->media_changed = 1;
bellard authored
461
462
463
464
465
466
467
        if (bs->change_cb)
            bs->change_cb(bs->change_opaque);
    }
}

void bdrv_delete(BlockDriverState *bs)
{
468
469
470
471
472
473
474
475
    BlockDriverState **pbs;

    pbs = &bdrv_first;
    while (*pbs != bs && *pbs != NULL)
        pbs = &(*pbs)->next;
    if (*pbs == bs)
        *pbs = bs->next;
bellard authored
476
477
    bdrv_close(bs);
    qemu_free(bs);
bellard authored
478
479
}
480
481
482
/* commit COW file into the raw image */
int bdrv_commit(BlockDriverState *bs)
{
483
    BlockDriver *drv = bs->drv;
bellard authored
484
    int64_t i, total_sectors;
bellard authored
485
486
    int n, j;
    unsigned char sector[512];
487
488
489
    if (!drv)
        return -ENOMEDIUM;
490
491

    if (bs->read_only) {
bellard authored
492
	return -EACCES;
493
494
    }
bellard authored
495
496
497
    if (!bs->backing_hd) {
	return -ENOTSUP;
    }
498
bellard authored
499
500
    total_sectors = bdrv_getlength(bs) >> SECTOR_BITS;
    for (i = 0; i < total_sectors;) {
501
        if (drv->bdrv_is_allocated(bs, i, 65536, &n)) {
bellard authored
502
503
504
505
506
507
508
509
510
            for(j = 0; j < n; j++) {
                if (bdrv_read(bs, i, sector, 1) != 0) {
                    return -EIO;
                }

                if (bdrv_write(bs->backing_hd, i, sector, 1) != 0) {
                    return -EIO;
                }
                i++;
511
	    }
bellard authored
512
513
514
	} else {
            i += n;
        }
515
    }
516
517
518
    if (drv->bdrv_make_empty)
	return drv->bdrv_make_empty(bs);
519
520
521
522
    return 0;
}
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
static int bdrv_check_byte_request(BlockDriverState *bs, int64_t offset,
                                   size_t size)
{
    int64_t len;

    if (!bdrv_is_inserted(bs))
        return -ENOMEDIUM;

    if (bs->growable)
        return 0;

    len = bdrv_getlength(bs);

    if ((offset + size) > len)
        return -EIO;

    return 0;
}

static int bdrv_check_request(BlockDriverState *bs, int64_t sector_num,
                              int nb_sectors)
{
    int64_t offset;

    /* Deal with byte accesses */
    if (sector_num < 0)
        offset = -sector_num;
    else
        offset = sector_num * 512;

    return bdrv_check_byte_request(bs, offset, nb_sectors * 512);
}
556
/* return < 0 if error. See bdrv_write() for the return codes */
557
int bdrv_read(BlockDriverState *bs, int64_t sector_num,
bellard authored
558
559
              uint8_t *buf, int nb_sectors)
{
bellard authored
560
561
    BlockDriver *drv = bs->drv;
562
563
    if (!drv)
        return -ENOMEDIUM;
564
565
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return -EIO;
bellard authored
566
bellard authored
567
568
569
570
571
572
573
    if (drv->bdrv_pread) {
        int ret, len;
        len = nb_sectors * 512;
        ret = drv->bdrv_pread(bs, sector_num * 512, buf, len);
        if (ret < 0)
            return ret;
        else if (ret != len)
574
            return -EINVAL;
575
576
577
        else {
	    bs->rd_bytes += (unsigned) len;
	    bs->rd_ops ++;
bellard authored
578
            return 0;
579
	}
bellard authored
580
581
    } else {
        return drv->bdrv_read(bs, sector_num, buf, nb_sectors);
582
    }
bellard authored
583
584
}
585
/* Return < 0 if error. Important errors are:
586
587
588
589
590
  -EIO         generic I/O error (may happen for all errors)
  -ENOMEDIUM   No media inserted.
  -EINVAL      Invalid sector number or nb_sectors
  -EACCES      Trying to write a read-only device
*/
591
int bdrv_write(BlockDriverState *bs, int64_t sector_num,
bellard authored
592
593
               const uint8_t *buf, int nb_sectors)
{
bellard authored
594
    BlockDriver *drv = bs->drv;
595
596
    if (!bs->drv)
        return -ENOMEDIUM;
bellard authored
597
    if (bs->read_only)
598
        return -EACCES;
599
600
601
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return -EIO;
bellard authored
602
    if (drv->bdrv_pwrite) {
603
        int ret, len, count = 0;
bellard authored
604
        len = nb_sectors * 512;
605
606
607
608
609
610
611
612
613
614
615
616
        do {
            ret = drv->bdrv_pwrite(bs, sector_num * 512, buf, len - count);
            if (ret < 0) {
                printf("bdrv_write ret=%d\n", ret);
                return ret;
            }
            count += ret;
            buf += ret;
        } while (count != len);
        bs->wr_bytes += (unsigned) len;
        bs->wr_ops ++;
        return 0;
bellard authored
617
    }
618
    return drv->bdrv_write(bs, sector_num, buf, nb_sectors);
bellard authored
619
620
}
621
static int bdrv_pread_em(BlockDriverState *bs, int64_t offset,
bellard authored
622
                         uint8_t *buf, int count1)
bellard authored
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
{
    uint8_t tmp_buf[SECTOR_SIZE];
    int len, nb_sectors, count;
    int64_t sector_num;

    count = count1;
    /* first read to align to sector start */
    len = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
    if (len > count)
        len = count;
    sector_num = offset >> SECTOR_BITS;
    if (len > 0) {
        if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
        memcpy(buf, tmp_buf + (offset & (SECTOR_SIZE - 1)), len);
        count -= len;
        if (count == 0)
            return count1;
        sector_num++;
        buf += len;
    }

    /* read the sectors "in place" */
    nb_sectors = count >> SECTOR_BITS;
    if (nb_sectors > 0) {
        if (bdrv_read(bs, sector_num, buf, nb_sectors) < 0)
            return -EIO;
        sector_num += nb_sectors;
        len = nb_sectors << SECTOR_BITS;
        buf += len;
        count -= len;
    }

    /* add data from the last sector */
    if (count > 0) {
        if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
        memcpy(buf, tmp_buf, count);
    }
    return count1;
}
665
static int bdrv_pwrite_em(BlockDriverState *bs, int64_t offset,
bellard authored
666
                          const uint8_t *buf, int count1)
bellard authored
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
{
    uint8_t tmp_buf[SECTOR_SIZE];
    int len, nb_sectors, count;
    int64_t sector_num;

    count = count1;
    /* first write to align to sector start */
    len = (SECTOR_SIZE - offset) & (SECTOR_SIZE - 1);
    if (len > count)
        len = count;
    sector_num = offset >> SECTOR_BITS;
    if (len > 0) {
        if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
        memcpy(tmp_buf + (offset & (SECTOR_SIZE - 1)), buf, len);
        if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
        count -= len;
        if (count == 0)
            return count1;
        sector_num++;
        buf += len;
    }

    /* write the sectors "in place" */
    nb_sectors = count >> SECTOR_BITS;
    if (nb_sectors > 0) {
        if (bdrv_write(bs, sector_num, buf, nb_sectors) < 0)
            return -EIO;
        sector_num += nb_sectors;
        len = nb_sectors << SECTOR_BITS;
        buf += len;
        count -= len;
    }

    /* add data from the last sector */
    if (count > 0) {
        if (bdrv_read(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
        memcpy(tmp_buf, buf, count);
        if (bdrv_write(bs, sector_num, tmp_buf, 1) < 0)
            return -EIO;
    }
    return count1;
}

/**
714
 * Read with byte offsets (needed only for file protocols)
bellard authored
715
 */
716
int bdrv_pread(BlockDriverState *bs, int64_t offset,
bellard authored
717
718
719
720
721
               void *buf1, int count1)
{
    BlockDriver *drv = bs->drv;

    if (!drv)
722
        return -ENOMEDIUM;
723
724
725
    if (bdrv_check_byte_request(bs, offset, count1))
        return -EIO;
bellard authored
726
    if (!drv->bdrv_pread)
bellard authored
727
        return bdrv_pread_em(bs, offset, buf1, count1);
bellard authored
728
729
730
    return drv->bdrv_pread(bs, offset, buf1, count1);
}
731
732
/**
 * Write with byte offsets (needed only for file protocols)
bellard authored
733
 */
734
int bdrv_pwrite(BlockDriverState *bs, int64_t offset,
bellard authored
735
736
737
738
739
                const void *buf1, int count1)
{
    BlockDriver *drv = bs->drv;

    if (!drv)
740
        return -ENOMEDIUM;
741
742
743
    if (bdrv_check_byte_request(bs, offset, count1))
        return -EIO;
bellard authored
744
    if (!drv->bdrv_pwrite)
bellard authored
745
        return bdrv_pwrite_em(bs, offset, buf1, count1);
bellard authored
746
747
748
749
750
751
752
753
754
755
    return drv->bdrv_pwrite(bs, offset, buf1, count1);
}

/**
 * Truncate file to 'offset' bytes (needed only for file protocols)
 */
int bdrv_truncate(BlockDriverState *bs, int64_t offset)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
756
        return -ENOMEDIUM;
bellard authored
757
758
759
760
761
762
763
764
765
766
767
768
    if (!drv->bdrv_truncate)
        return -ENOTSUP;
    return drv->bdrv_truncate(bs, offset);
}

/**
 * Length of a file in bytes. Return < 0 if error or unknown.
 */
int64_t bdrv_getlength(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
769
        return -ENOMEDIUM;
bellard authored
770
771
772
773
774
    if (!drv->bdrv_getlength) {
        /* legacy mode */
        return bs->total_sectors * SECTOR_SIZE;
    }
    return drv->bdrv_getlength(bs);
bellard authored
775
776
}
777
/* return 0 as number of sectors if no device present or error */
778
void bdrv_get_geometry(BlockDriverState *bs, uint64_t *nb_sectors_ptr)
bellard authored
779
{
780
781
782
783
784
785
786
    int64_t length;
    length = bdrv_getlength(bs);
    if (length < 0)
        length = 0;
    else
        length = length >> SECTOR_BITS;
    *nb_sectors_ptr = length;
bellard authored
787
}
bellard authored
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
struct partition {
        uint8_t boot_ind;           /* 0x80 - active */
        uint8_t head;               /* starting head */
        uint8_t sector;             /* starting sector */
        uint8_t cyl;                /* starting cylinder */
        uint8_t sys_ind;            /* What partition type */
        uint8_t end_head;           /* end head */
        uint8_t end_sector;         /* end sector */
        uint8_t end_cyl;            /* end cylinder */
        uint32_t start_sect;        /* starting sector counting from 0 */
        uint32_t nr_sects;          /* nr of sectors in partition */
} __attribute__((packed));

/* try to guess the disk logical geometry from the MSDOS partition table. Return 0 if OK, -1 if could not guess */
static int guess_disk_lchs(BlockDriverState *bs,
                           int *pcylinders, int *pheads, int *psectors)
{
    uint8_t buf[512];
    int ret, i, heads, sectors, cylinders;
    struct partition *p;
    uint32_t nr_sects;
810
    uint64_t nb_sectors;
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849

    bdrv_get_geometry(bs, &nb_sectors);

    ret = bdrv_read(bs, 0, buf, 1);
    if (ret < 0)
        return -1;
    /* test msdos magic */
    if (buf[510] != 0x55 || buf[511] != 0xaa)
        return -1;
    for(i = 0; i < 4; i++) {
        p = ((struct partition *)(buf + 0x1be)) + i;
        nr_sects = le32_to_cpu(p->nr_sects);
        if (nr_sects && p->end_head) {
            /* We make the assumption that the partition terminates on
               a cylinder boundary */
            heads = p->end_head + 1;
            sectors = p->end_sector & 63;
            if (sectors == 0)
                continue;
            cylinders = nb_sectors / (heads * sectors);
            if (cylinders < 1 || cylinders > 16383)
                continue;
            *pheads = heads;
            *psectors = sectors;
            *pcylinders = cylinders;
#if 0
            printf("guessed geometry: LCHS=%d %d %d\n",
                   cylinders, heads, sectors);
#endif
            return 0;
        }
    }
    return -1;
}

void bdrv_guess_geometry(BlockDriverState *bs, int *pcyls, int *pheads, int *psecs)
{
    int translation, lba_detected = 0;
    int cylinders, heads, secs;
850
    uint64_t nb_sectors;
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904

    /* if a geometry hint is available, use it */
    bdrv_get_geometry(bs, &nb_sectors);
    bdrv_get_geometry_hint(bs, &cylinders, &heads, &secs);
    translation = bdrv_get_translation_hint(bs);
    if (cylinders != 0) {
        *pcyls = cylinders;
        *pheads = heads;
        *psecs = secs;
    } else {
        if (guess_disk_lchs(bs, &cylinders, &heads, &secs) == 0) {
            if (heads > 16) {
                /* if heads > 16, it means that a BIOS LBA
                   translation was active, so the default
                   hardware geometry is OK */
                lba_detected = 1;
                goto default_geometry;
            } else {
                *pcyls = cylinders;
                *pheads = heads;
                *psecs = secs;
                /* disable any translation to be in sync with
                   the logical geometry */
                if (translation == BIOS_ATA_TRANSLATION_AUTO) {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_NONE);
                }
            }
        } else {
        default_geometry:
            /* if no geometry, use a standard physical disk geometry */
            cylinders = nb_sectors / (16 * 63);

            if (cylinders > 16383)
                cylinders = 16383;
            else if (cylinders < 2)
                cylinders = 2;
            *pcyls = cylinders;
            *pheads = 16;
            *psecs = 63;
            if ((lba_detected == 1) && (translation == BIOS_ATA_TRANSLATION_AUTO)) {
                if ((*pcyls * *pheads) <= 131072) {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_LARGE);
                } else {
                    bdrv_set_translation_hint(bs,
                                              BIOS_ATA_TRANSLATION_LBA);
                }
            }
        }
        bdrv_set_geometry_hint(bs, *pcyls, *pheads, *psecs);
    }
}
905
void bdrv_set_geometry_hint(BlockDriverState *bs,
bellard authored
906
907
908
909
910
911
912
913
914
915
916
917
918
919
                            int cyls, int heads, int secs)
{
    bs->cyls = cyls;
    bs->heads = heads;
    bs->secs = secs;
}

void bdrv_set_type_hint(BlockDriverState *bs, int type)
{
    bs->type = type;
    bs->removable = ((type == BDRV_TYPE_CDROM ||
                      type == BDRV_TYPE_FLOPPY));
}
920
921
922
923
924
void bdrv_set_translation_hint(BlockDriverState *bs, int translation)
{
    bs->translation = translation;
}
925
void bdrv_get_geometry_hint(BlockDriverState *bs,
bellard authored
926
927
928
929
930
931
932
933
934
935
936
937
                            int *pcyls, int *pheads, int *psecs)
{
    *pcyls = bs->cyls;
    *pheads = bs->heads;
    *psecs = bs->secs;
}

int bdrv_get_type_hint(BlockDriverState *bs)
{
    return bs->type;
}
938
939
940
941
942
int bdrv_get_translation_hint(BlockDriverState *bs)
{
    return bs->translation;
}
bellard authored
943
944
945
946
947
948
949
950
951
952
int bdrv_is_removable(BlockDriverState *bs)
{
    return bs->removable;
}

int bdrv_is_read_only(BlockDriverState *bs)
{
    return bs->read_only;
}
953
954
955
956
957
int bdrv_is_sg(BlockDriverState *bs)
{
    return bs->sg;
}
958
/* XXX: no longer used */
959
void bdrv_set_change_cb(BlockDriverState *bs,
bellard authored
960
961
962
963
964
965
                        void (*change_cb)(void *opaque), void *opaque)
{
    bs->change_cb = change_cb;
    bs->change_opaque = opaque;
}
bellard authored
966
967
968
969
970
971
972
int bdrv_is_encrypted(BlockDriverState *bs)
{
    if (bs->backing_hd && bs->backing_hd->encrypted)
        return 1;
    return bs->encrypted;
}
973
974
975
976
977
978
979
980
981
int bdrv_key_required(BlockDriverState *bs)
{
    BlockDriverState *backing_hd = bs->backing_hd;

    if (backing_hd && backing_hd->encrypted && !backing_hd->valid_key)
        return 1;
    return (bs->encrypted && !bs->valid_key);
}
bellard authored
982
983
984
985
986
987
988
989
990
991
992
993
int bdrv_set_key(BlockDriverState *bs, const char *key)
{
    int ret;
    if (bs->backing_hd && bs->backing_hd->encrypted) {
        ret = bdrv_set_key(bs->backing_hd, key);
        if (ret < 0)
            return ret;
        if (!bs->encrypted)
            return 0;
    }
    if (!bs->encrypted || !bs->drv || !bs->drv->bdrv_set_key)
        return -1;
994
    ret = bs->drv->bdrv_set_key(bs, key);
995
996
997
998
999
1000
1001
1002
1003
    if (ret < 0) {
        bs->valid_key = 0;
    } else if (!bs->valid_key) {
        bs->valid_key = 1;
        /* call the change callback now, we skipped it on open */
        bs->media_changed = 1;
        if (bs->change_cb)
            bs->change_cb(bs->change_opaque);
    }
1004
    return ret;
bellard authored
1005
1006
1007
1008
}

void bdrv_get_format(BlockDriverState *bs, char *buf, int buf_size)
{
1009
    if (!bs->drv) {
bellard authored
1010
1011
1012
1013
1014
1015
        buf[0] = '\0';
    } else {
        pstrcpy(buf, buf_size, bs->drv->format_name);
    }
}
1016
void bdrv_iterate_format(void (*it)(void *opaque, const char *name),
bellard authored
1017
1018
1019
1020
1021
1022
1023
1024
1025
                         void *opaque)
{
    BlockDriver *drv;

    for (drv = first_drv; drv != NULL; drv = drv->next) {
        it(opaque, drv->format_name);
    }
}
bellard authored
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
BlockDriverState *bdrv_find(const char *name)
{
    BlockDriverState *bs;

    for (bs = bdrv_first; bs != NULL; bs = bs->next) {
        if (!strcmp(name, bs->device_name))
            return bs;
    }
    return NULL;
}
1037
void bdrv_iterate(void (*it)(void *opaque, BlockDriverState *bs), void *opaque)
bellard authored
1038
1039
1040
1041
{
    BlockDriverState *bs;

    for (bs = bdrv_first; bs != NULL; bs = bs->next) {
1042
        it(opaque, bs);
bellard authored
1043
1044
1045
    }
}
bellard authored
1046
1047
1048
1049
1050
const char *bdrv_get_device_name(BlockDriverState *bs)
{
    return bs->device_name;
}
pbrook authored
1051
1052
1053
1054
1055
1056
1057
1058
void bdrv_flush(BlockDriverState *bs)
{
    if (bs->drv->bdrv_flush)
        bs->drv->bdrv_flush(bs);
    if (bs->backing_hd)
        bdrv_flush(bs->backing_hd);
}
aliguori authored
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
void bdrv_flush_all(void)
{
    BlockDriverState *bs;

    for (bs = bdrv_first; bs != NULL; bs = bs->next)
        if (bs->drv && !bdrv_is_read_only(bs) && 
            (!bdrv_is_removable(bs) || bdrv_is_inserted(bs)))
            bdrv_flush(bs);
}
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
/*
 * Returns true iff the specified sector is present in the disk image. Drivers
 * not implementing the functionality are assumed to not support backing files,
 * hence all their sectors are reported as allocated.
 *
 * 'pnum' is set to the number of sectors (including and immediately following
 * the specified sector) that are known to be in the same
 * allocated/unallocated state.
 *
 * 'nb_sectors' is the max value 'pnum' should be set to.
 */
int bdrv_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors,
	int *pnum)
{
    int64_t n;
    if (!bs->drv->bdrv_is_allocated) {
        if (sector_num >= bs->total_sectors) {
            *pnum = 0;
            return 0;
        }
        n = bs->total_sectors - sector_num;
        *pnum = (n < nb_sectors) ? (n) : (nb_sectors);
        return 1;
    }
    return bs->drv->bdrv_is_allocated(bs, sector_num, nb_sectors, pnum);
}
1096
void bdrv_info(Monitor *mon)
bellard authored
1097
1098
1099
1100
{
    BlockDriverState *bs;

    for (bs = bdrv_first; bs != NULL; bs = bs->next) {
1101
1102
        monitor_printf(mon, "%s:", bs->device_name);
        monitor_printf(mon, " type=");
bellard authored
1103
1104
        switch(bs->type) {
        case BDRV_TYPE_HD:
1105
            monitor_printf(mon, "hd");
bellard authored
1106
1107
            break;
        case BDRV_TYPE_CDROM:
1108
            monitor_printf(mon, "cdrom");
bellard authored
1109
1110
            break;
        case BDRV_TYPE_FLOPPY:
1111
            monitor_printf(mon, "floppy");
bellard authored
1112
1113
            break;
        }
1114
        monitor_printf(mon, " removable=%d", bs->removable);
bellard authored
1115
        if (bs->removable) {
1116
            monitor_printf(mon, " locked=%d", bs->locked);
bellard authored
1117
        }
1118
        if (bs->drv) {
1119
1120
            monitor_printf(mon, " file=");
            monitor_print_filename(mon, bs->filename);
1121
            if (bs->backing_file[0] != '\0') {
1122
1123
1124
1125
1126
1127
                monitor_printf(mon, " backing_file=");
                monitor_print_filename(mon, bs->backing_file);
            }
            monitor_printf(mon, " ro=%d", bs->read_only);
            monitor_printf(mon, " drv=%s", bs->drv->format_name);
            monitor_printf(mon, " encrypted=%d", bdrv_is_encrypted(bs));
bellard authored
1128
        } else {
1129
            monitor_printf(mon, " [not inserted]");
bellard authored
1130
        }
1131
        monitor_printf(mon, "\n");
bellard authored
1132
1133
    }
}
1134
1135

/* The "info blockstats" command. */
1136
void bdrv_info_stats(Monitor *mon)
1137
1138
{
    BlockDriverState *bs;
1139
    BlockDriverInfo bdi;
1140
1141

    for (bs = bdrv_first; bs != NULL; bs = bs->next) {
1142
1143
1144
1145
1146
1147
1148
1149
1150
        monitor_printf(mon, "%s:"
                       " rd_bytes=%" PRIu64
                       " wr_bytes=%" PRIu64
                       " rd_operations=%" PRIu64
                       " wr_operations=%" PRIu64
                       ,
                       bs->device_name,
                       bs->rd_bytes, bs->wr_bytes,
                       bs->rd_ops, bs->wr_ops);
1151
        if (bdrv_get_info(bs, &bdi) == 0)
1152
1153
1154
1155
            monitor_printf(mon, " high=%" PRId64
                           " bytes_free=%" PRId64,
                           bdi.highest_alloc, bdi.num_free_bytes);
        monitor_printf(mon, "\n");
1156
1157
    }
}
bellard authored
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
const char *bdrv_get_encrypted_filename(BlockDriverState *bs)
{
    if (bs->backing_hd && bs->backing_hd->encrypted)
        return bs->backing_file;
    else if (bs->encrypted)
        return bs->filename;
    else
        return NULL;
}
1169
void bdrv_get_backing_filename(BlockDriverState *bs,
bellard authored
1170
1171
1172
1173
1174
1175
1176
1177
1178
                               char *filename, int filename_size)
{
    if (!bs->backing_hd) {
        pstrcpy(filename, filename_size, "");
    } else {
        pstrcpy(filename, filename_size, bs->backing_file);
    }
}
1179
int bdrv_write_compressed(BlockDriverState *bs, int64_t sector_num,
bellard authored
1180
1181
1182
1183
                          const uint8_t *buf, int nb_sectors)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1184
        return -ENOMEDIUM;
bellard authored
1185
1186
1187
1188
    if (!drv->bdrv_write_compressed)
        return -ENOTSUP;
    return drv->bdrv_write_compressed(bs, sector_num, buf, nb_sectors);
}
1189
bellard authored
1190
1191
1192
1193
int bdrv_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1194
        return -ENOMEDIUM;
bellard authored
1195
1196
1197
1198
1199
1200
1201
1202
1203
    if (!drv->bdrv_get_info)
        return -ENOTSUP;
    memset(bdi, 0, sizeof(*bdi));
    return drv->bdrv_get_info(bs, bdi);
}

/**************************************************************/
/* handling of snapshots */
1204
int bdrv_snapshot_create(BlockDriverState *bs,
bellard authored
1205
1206
1207
1208
                         QEMUSnapshotInfo *sn_info)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1209
        return -ENOMEDIUM;
bellard authored
1210
1211
1212
1213
1214
    if (!drv->bdrv_snapshot_create)
        return -ENOTSUP;
    return drv->bdrv_snapshot_create(bs, sn_info);
}
1215
int bdrv_snapshot_goto(BlockDriverState *bs,
bellard authored
1216
1217
1218
1219
                       const char *snapshot_id)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1220
        return -ENOMEDIUM;
bellard authored
1221
1222
1223
1224
1225
1226
1227
1228
1229
    if (!drv->bdrv_snapshot_goto)
        return -ENOTSUP;
    return drv->bdrv_snapshot_goto(bs, snapshot_id);
}

int bdrv_snapshot_delete(BlockDriverState *bs, const char *snapshot_id)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1230
        return -ENOMEDIUM;
bellard authored
1231
1232
1233
1234
1235
    if (!drv->bdrv_snapshot_delete)
        return -ENOTSUP;
    return drv->bdrv_snapshot_delete(bs, snapshot_id);
}
1236
int bdrv_snapshot_list(BlockDriverState *bs,
bellard authored
1237
1238
1239
1240
                       QEMUSnapshotInfo **psn_info)
{
    BlockDriver *drv = bs->drv;
    if (!drv)
1241
        return -ENOMEDIUM;
bellard authored
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
    if (!drv->bdrv_snapshot_list)
        return -ENOTSUP;
    return drv->bdrv_snapshot_list(bs, psn_info);
}

#define NB_SUFFIXES 4

char *get_human_readable_size(char *buf, int buf_size, int64_t size)
{
    static const char suffixes[NB_SUFFIXES] = "KMGT";
    int64_t base;
    int i;

    if (size <= 999) {
        snprintf(buf, buf_size, "%" PRId64, size);
    } else {
        base = 1024;
        for(i = 0; i < NB_SUFFIXES; i++) {
            if (size < (10 * base)) {
1261
                snprintf(buf, buf_size, "%0.1f%c",
bellard authored
1262
1263
1264
1265
                         (double)size / base,
                         suffixes[i]);
                break;
            } else if (size < (1000 * base) || i == (NB_SUFFIXES - 1)) {
1266
                snprintf(buf, buf_size, "%" PRId64 "%c",
bellard authored
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
                         ((size + (base >> 1)) / base),
                         suffixes[i]);
                break;
            }
            base = base * 1024;
        }
    }
    return buf;
}

char *bdrv_snapshot_dump(char *buf, int buf_size, QEMUSnapshotInfo *sn)
{
    char buf1[128], date_buf[128], clock_buf[128];
1280
1281
1282
#ifdef _WIN32
    struct tm *ptm;
#else
bellard authored
1283
    struct tm tm;
1284
#endif
bellard authored
1285
1286
1287
1288
    time_t ti;
    int64_t secs;

    if (!sn) {
1289
1290
        snprintf(buf, buf_size,
                 "%-10s%-20s%7s%20s%15s",
bellard authored
1291
1292
1293
                 "ID", "TAG", "VM SIZE", "DATE", "VM CLOCK");
    } else {
        ti = sn->date_sec;
1294
1295
1296
1297
1298
#ifdef _WIN32
        ptm = localtime(&ti);
        strftime(date_buf, sizeof(date_buf),
                 "%Y-%m-%d %H:%M:%S", ptm);
#else
bellard authored
1299
1300
1301
        localtime_r(&ti, &tm);
        strftime(date_buf, sizeof(date_buf),
                 "%Y-%m-%d %H:%M:%S", &tm);
1302
#endif
bellard authored
1303
1304
1305
1306
1307
        secs = sn->vm_clock_nsec / 1000000000;
        snprintf(clock_buf, sizeof(clock_buf),
                 "%02d:%02d:%02d.%03d",
                 (int)(secs / 3600),
                 (int)((secs / 60) % 60),
1308
                 (int)(secs % 60),
bellard authored
1309
1310
                 (int)((sn->vm_clock_nsec / 1000000) % 1000));
        snprintf(buf, buf_size,
1311
                 "%-10s%-20s%7s%20s%15s",
bellard authored
1312
1313
1314
1315
1316
1317
1318
1319
                 sn->id_str, sn->name,
                 get_human_readable_size(buf1, sizeof(buf1), sn->vm_state_size),
                 date_buf,
                 clock_buf);
    }
    return buf;
}
bellard authored
1320
bellard authored
1321
/**************************************************************/
bellard authored
1322
/* async I/Os */
bellard authored
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
typedef struct VectorTranslationState {
    QEMUIOVector *iov;
    uint8_t *bounce;
    int is_write;
    BlockDriverAIOCB *aiocb;
    BlockDriverAIOCB *this_aiocb;
} VectorTranslationState;

static void bdrv_aio_rw_vector_cb(void *opaque, int ret)
{
    VectorTranslationState *s = opaque;

    if (!s->is_write) {
1337
        qemu_iovec_from_buffer(s->iov, s->bounce, s->iov->size);
1338
    }
1339
    qemu_vfree(s->bounce);
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
1372
1373
1374
    s->this_aiocb->cb(s->this_aiocb->opaque, ret);
    qemu_aio_release(s->this_aiocb);
}

static BlockDriverAIOCB *bdrv_aio_rw_vector(BlockDriverState *bs,
                                            int64_t sector_num,
                                            QEMUIOVector *iov,
                                            int nb_sectors,
                                            BlockDriverCompletionFunc *cb,
                                            void *opaque,
                                            int is_write)

{
    VectorTranslationState *s = qemu_mallocz(sizeof(*s));
    BlockDriverAIOCB *aiocb = qemu_aio_get(bs, cb, opaque);

    s->this_aiocb = aiocb;
    s->iov = iov;
    s->bounce = qemu_memalign(512, nb_sectors * 512);
    s->is_write = is_write;
    if (is_write) {
        qemu_iovec_to_buffer(s->iov, s->bounce);
        s->aiocb = bdrv_aio_write(bs, sector_num, s->bounce, nb_sectors,
                                  bdrv_aio_rw_vector_cb, s);
    } else {
        s->aiocb = bdrv_aio_read(bs, sector_num, s->bounce, nb_sectors,
                                 bdrv_aio_rw_vector_cb, s);
    }
    return aiocb;
}

BlockDriverAIOCB *bdrv_aio_readv(BlockDriverState *bs, int64_t sector_num,
                                 QEMUIOVector *iov, int nb_sectors,
                                 BlockDriverCompletionFunc *cb, void *opaque)
{
1375
1376
1377
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return NULL;
1378
1379
1380
1381
1382
1383
1384
1385
    return bdrv_aio_rw_vector(bs, sector_num, iov, nb_sectors,
                              cb, opaque, 0);
}

BlockDriverAIOCB *bdrv_aio_writev(BlockDriverState *bs, int64_t sector_num,
                                  QEMUIOVector *iov, int nb_sectors,
                                  BlockDriverCompletionFunc *cb, void *opaque)
{
1386
1387
1388
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return NULL;
1389
1390
1391
1392
    return bdrv_aio_rw_vector(bs, sector_num, iov, nb_sectors,
                              cb, opaque, 1);
}
1393
1394
1395
BlockDriverAIOCB *bdrv_aio_read(BlockDriverState *bs, int64_t sector_num,
                                uint8_t *buf, int nb_sectors,
                                BlockDriverCompletionFunc *cb, void *opaque)
bellard authored
1396
1397
{
    BlockDriver *drv = bs->drv;
1398
    BlockDriverAIOCB *ret;
bellard authored
1399
1400
    if (!drv)
1401
        return NULL;
1402
1403
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return NULL;
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
    ret = drv->bdrv_aio_read(bs, sector_num, buf, nb_sectors, cb, opaque);

    if (ret) {
	/* Update stats even though technically transfer has not happened. */
	bs->rd_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
	bs->rd_ops ++;
    }

    return ret;
bellard authored
1414
1415
}
1416
1417
1418
BlockDriverAIOCB *bdrv_aio_write(BlockDriverState *bs, int64_t sector_num,
                                 const uint8_t *buf, int nb_sectors,
                                 BlockDriverCompletionFunc *cb, void *opaque)
bellard authored
1419
{
bellard authored
1420
    BlockDriver *drv = bs->drv;
1421
    BlockDriverAIOCB *ret;
bellard authored
1422
1423
    if (!drv)
1424
        return NULL;
bellard authored
1425
    if (bs->read_only)
1426
        return NULL;
1427
1428
    if (bdrv_check_request(bs, sector_num, nb_sectors))
        return NULL;
bellard authored
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
    ret = drv->bdrv_aio_write(bs, sector_num, buf, nb_sectors, cb, opaque);

    if (ret) {
	/* Update stats even though technically transfer has not happened. */
	bs->wr_bytes += (unsigned) nb_sectors * SECTOR_SIZE;
	bs->wr_ops ++;
    }

    return ret;
bellard authored
1439
1440
1441
1442
}

void bdrv_aio_cancel(BlockDriverAIOCB *acb)
{
1443
    BlockDriver *drv = acb->bs->drv;
bellard authored
1444
1445
1446
1447
1448
1449
    if (acb->cb == bdrv_aio_rw_vector_cb) {
        VectorTranslationState *s = acb->opaque;
        acb = s->aiocb;
    }
1450
    drv->bdrv_aio_cancel(acb);
bellard authored
1451
1452
}
1453
bellard authored
1454
1455
1456
/**************************************************************/
/* async block device emulation */
1457
static void bdrv_aio_bh_cb(void *opaque)
bellard authored
1458
{
1459
1460
1461
    BlockDriverAIOCBSync *acb = opaque;
    acb->common.cb(acb->common.opaque, acb->ret);
    qemu_aio_release(acb);
bellard authored
1462
}
1463
1464
1465
1466
static BlockDriverAIOCB *bdrv_aio_read_em(BlockDriverState *bs,
        int64_t sector_num, uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque)
bellard authored
1467
{
1468
    BlockDriverAIOCBSync *acb;
bellard authored
1469
    int ret;
1470
1471
1472
1473
1474
1475
1476
1477

    acb = qemu_aio_get(bs, cb, opaque);
    if (!acb->bh)
        acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
    ret = bdrv_read(bs, sector_num, buf, nb_sectors);
    acb->ret = ret;
    qemu_bh_schedule(acb->bh);
    return &acb->common;
1478
1479
}
1480
1481
1482
static BlockDriverAIOCB *bdrv_aio_write_em(BlockDriverState *bs,
        int64_t sector_num, const uint8_t *buf, int nb_sectors,
        BlockDriverCompletionFunc *cb, void *opaque)
1483
{
1484
    BlockDriverAIOCBSync *acb;
bellard authored
1485
1486
    int ret;
1487
1488
1489
1490
1491
1492
1493
    acb = qemu_aio_get(bs, cb, opaque);
    if (!acb->bh)
        acb->bh = qemu_bh_new(bdrv_aio_bh_cb, acb);
    ret = bdrv_write(bs, sector_num, buf, nb_sectors);
    acb->ret = ret;
    qemu_bh_schedule(acb->bh);
    return &acb->common;
1494
1495
}
1496
static void bdrv_aio_cancel_em(BlockDriverAIOCB *blockacb)
bellard authored
1497
{
1498
1499
1500
    BlockDriverAIOCBSync *acb = (BlockDriverAIOCBSync *)blockacb;
    qemu_bh_cancel(acb->bh);
    qemu_aio_release(acb);
bellard authored
1501
}
bellard authored
1502
bellard authored
1503
1504
/**************************************************************/
/* sync block device emulation */
bellard authored
1505
bellard authored
1506
1507
1508
static void bdrv_rw_em_cb(void *opaque, int ret)
{
    *(int *)opaque = ret;
bellard authored
1509
1510
}
bellard authored
1511
1512
#define NOT_DONE 0x7fffffff
1513
static int bdrv_read_em(BlockDriverState *bs, int64_t sector_num,
bellard authored
1514
                        uint8_t *buf, int nb_sectors)
pbrook authored
1515
{
1516
1517
    int async_ret;
    BlockDriverAIOCB *acb;
bellard authored
1518
1519

    async_ret = NOT_DONE;
1520
    acb = bdrv_aio_read(bs, sector_num, buf, nb_sectors,
bellard authored
1521
                        bdrv_rw_em_cb, &async_ret);
1522
    if (acb == NULL)
1523
        return -1;
1524
bellard authored
1525
1526
1527
    while (async_ret == NOT_DONE) {
        qemu_aio_wait();
    }
1528
bellard authored
1529
    return async_ret;
pbrook authored
1530
1531
}
bellard authored
1532
1533
1534
static int bdrv_write_em(BlockDriverState *bs, int64_t sector_num,
                         const uint8_t *buf, int nb_sectors)
{
1535
1536
    int async_ret;
    BlockDriverAIOCB *acb;
bellard authored
1537
1538

    async_ret = NOT_DONE;
1539
    acb = bdrv_aio_write(bs, sector_num, buf, nb_sectors,
bellard authored
1540
                         bdrv_rw_em_cb, &async_ret);
1541
    if (acb == NULL)
1542
        return -1;
bellard authored
1543
1544
1545
1546
1547
    while (async_ret == NOT_DONE) {
        qemu_aio_wait();
    }
    return async_ret;
}
bellard authored
1548
1549
1550
1551

void bdrv_init(void)
{
    bdrv_register(&bdrv_raw);
1552
    bdrv_register(&bdrv_host_device);
bellard authored
1553
1554
1555
1556
1557
#ifndef _WIN32
    bdrv_register(&bdrv_cow);
#endif
    bdrv_register(&bdrv_qcow);
    bdrv_register(&bdrv_vmdk);
1558
    bdrv_register(&bdrv_cloop);
1559
    bdrv_register(&bdrv_dmg);
1560
    bdrv_register(&bdrv_bochs);
1561
    bdrv_register(&bdrv_vpc);
bellard authored
1562
    bdrv_register(&bdrv_vvfat);
bellard authored
1563
    bdrv_register(&bdrv_qcow2);
1564
    bdrv_register(&bdrv_parallels);
1565
    bdrv_register(&bdrv_nbd);
bellard authored
1566
}
1567
1568
1569
1570
1571
1572
1573
1574
1575
1576
1577
1578
1579
1580
1581
1582
1583
1584
1585
1586
1587
1588
1589
1590
1591
1592
1593

void *qemu_aio_get(BlockDriverState *bs, BlockDriverCompletionFunc *cb,
                   void *opaque)
{
    BlockDriver *drv;
    BlockDriverAIOCB *acb;

    drv = bs->drv;
    if (drv->free_aiocb) {
        acb = drv->free_aiocb;
        drv->free_aiocb = acb->next;
    } else {
        acb = qemu_mallocz(drv->aiocb_size);
    }
    acb->bs = bs;
    acb->cb = cb;
    acb->opaque = opaque;
    return acb;
}

void qemu_aio_release(void *p)
{
    BlockDriverAIOCB *acb = p;
    BlockDriver *drv = acb->bs->drv;
    acb->next = drv->free_aiocb;
    drv->free_aiocb = acb;
}
1594
1595
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614

/**************************************************************/
/* removable device support */

/**
 * Return TRUE if the media is present
 */
int bdrv_is_inserted(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    int ret;
    if (!drv)
        return 0;
    if (!drv->bdrv_is_inserted)
        return 1;
    ret = drv->bdrv_is_inserted(bs);
    return ret;
}

/**
 * Return TRUE if the media changed since the last call to this
1615
 * function. It is currently only used for floppy disks
1616
1617
1618
1619
1620
1621
1622
1623
1624
1625
1626
1627
1628
1629
1630
1631
1632
1633
1634
1635
1636
1637
1638
1639
1640
1641
1642
1643
1644
1645
1646
1647
1648
1649
1650
1651
1652
1653
1654
1655
1656
1657
1658
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
 */
int bdrv_media_changed(BlockDriverState *bs)
{
    BlockDriver *drv = bs->drv;
    int ret;

    if (!drv || !drv->bdrv_media_changed)
        ret = -ENOTSUP;
    else
        ret = drv->bdrv_media_changed(bs);
    if (ret == -ENOTSUP)
        ret = bs->media_changed;
    bs->media_changed = 0;
    return ret;
}

/**
 * If eject_flag is TRUE, eject the media. Otherwise, close the tray
 */
void bdrv_eject(BlockDriverState *bs, int eject_flag)
{
    BlockDriver *drv = bs->drv;
    int ret;

    if (!drv || !drv->bdrv_eject) {
        ret = -ENOTSUP;
    } else {
        ret = drv->bdrv_eject(bs, eject_flag);
    }
    if (ret == -ENOTSUP) {
        if (eject_flag)
            bdrv_close(bs);
    }
}

int bdrv_is_locked(BlockDriverState *bs)
{
    return bs->locked;
}

/**
 * Lock or unlock the media (if it is locked, the user won't be able
 * to eject it manually).
 */
void bdrv_set_locked(BlockDriverState *bs, int locked)
{
    BlockDriver *drv = bs->drv;

    bs->locked = locked;
    if (drv && drv->bdrv_set_locked) {
        drv->bdrv_set_locked(bs, locked);
    }
}
1669
1670
1671
1672
1673
1674
1675
1676
1677
1678
1679

/* needed for generic scsi interface */

int bdrv_ioctl(BlockDriverState *bs, unsigned long int req, void *buf)
{
    BlockDriver *drv = bs->drv;

    if (drv && drv->bdrv_ioctl)
        return drv->bdrv_ioctl(bs, req, buf);
    return -ENOTSUP;
}