mmu-hash*: Don't keep looking for PTEs after we find a match
[qemu/agraf.git] / savevm.c
blob35c8d1e4453e84e74e3112b4575780a2a2230abd
1 /*
2 * QEMU System Emulator
4 * Copyright (c) 2003-2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
25 #include "config-host.h"
26 #include "qemu-common.h"
27 #include "hw/hw.h"
28 #include "hw/qdev.h"
29 #include "net/net.h"
30 #include "monitor/monitor.h"
31 #include "sysemu/sysemu.h"
32 #include "qemu/timer.h"
33 #include "audio/audio.h"
34 #include "migration/migration.h"
35 #include "qemu/sockets.h"
36 #include "qemu/queue.h"
37 #include "sysemu/cpus.h"
38 #include "exec/memory.h"
39 #include "qmp-commands.h"
40 #include "trace.h"
41 #include "qemu/bitops.h"
43 #define SELF_ANNOUNCE_ROUNDS 5
45 #ifndef ETH_P_RARP
46 #define ETH_P_RARP 0x8035
47 #endif
48 #define ARP_HTYPE_ETH 0x0001
49 #define ARP_PTYPE_IP 0x0800
50 #define ARP_OP_REQUEST_REV 0x3
52 static int announce_self_create(uint8_t *buf,
53 uint8_t *mac_addr)
55 /* Ethernet header. */
56 memset(buf, 0xff, 6); /* destination MAC addr */
57 memcpy(buf + 6, mac_addr, 6); /* source MAC addr */
58 *(uint16_t *)(buf + 12) = htons(ETH_P_RARP); /* ethertype */
60 /* RARP header. */
61 *(uint16_t *)(buf + 14) = htons(ARP_HTYPE_ETH); /* hardware addr space */
62 *(uint16_t *)(buf + 16) = htons(ARP_PTYPE_IP); /* protocol addr space */
63 *(buf + 18) = 6; /* hardware addr length (ethernet) */
64 *(buf + 19) = 4; /* protocol addr length (IPv4) */
65 *(uint16_t *)(buf + 20) = htons(ARP_OP_REQUEST_REV); /* opcode */
66 memcpy(buf + 22, mac_addr, 6); /* source hw addr */
67 memset(buf + 28, 0x00, 4); /* source protocol addr */
68 memcpy(buf + 32, mac_addr, 6); /* target hw addr */
69 memset(buf + 38, 0x00, 4); /* target protocol addr */
71 /* Padding to get up to 60 bytes (ethernet min packet size, minus FCS). */
72 memset(buf + 42, 0x00, 18);
74 return 60; /* len (FCS will be added by hardware) */
77 static void qemu_announce_self_iter(NICState *nic, void *opaque)
79 uint8_t buf[60];
80 int len;
82 len = announce_self_create(buf, nic->conf->macaddr.a);
84 qemu_send_packet_raw(qemu_get_queue(nic), buf, len);
88 static void qemu_announce_self_once(void *opaque)
90 static int count = SELF_ANNOUNCE_ROUNDS;
91 QEMUTimer *timer = *(QEMUTimer **)opaque;
93 qemu_foreach_nic(qemu_announce_self_iter, NULL);
95 if (--count) {
96 /* delay 50ms, 150ms, 250ms, ... */
97 qemu_mod_timer(timer, qemu_get_clock_ms(rt_clock) +
98 50 + (SELF_ANNOUNCE_ROUNDS - count - 1) * 100);
99 } else {
100 qemu_del_timer(timer);
101 qemu_free_timer(timer);
105 void qemu_announce_self(void)
107 static QEMUTimer *timer;
108 timer = qemu_new_timer_ms(rt_clock, qemu_announce_self_once, &timer);
109 qemu_announce_self_once(&timer);
112 /***********************************************************/
113 /* savevm/loadvm support */
115 #define IO_BUF_SIZE 32768
117 struct QEMUFile {
118 const QEMUFileOps *ops;
119 void *opaque;
120 int is_write;
122 int64_t bytes_xfer;
123 int64_t xfer_limit;
125 int64_t pos; /* start of buffer when writing, end of buffer
126 when reading */
127 int buf_index;
128 int buf_size; /* 0 when writing */
129 uint8_t buf[IO_BUF_SIZE];
131 int last_error;
134 typedef struct QEMUFileStdio
136 FILE *stdio_file;
137 QEMUFile *file;
138 } QEMUFileStdio;
140 typedef struct QEMUFileSocket
142 int fd;
143 QEMUFile *file;
144 } QEMUFileSocket;
146 typedef struct {
147 Coroutine *co;
148 int fd;
149 } FDYieldUntilData;
151 static void fd_coroutine_enter(void *opaque)
153 FDYieldUntilData *data = opaque;
154 qemu_set_fd_handler(data->fd, NULL, NULL, NULL);
155 qemu_coroutine_enter(data->co, NULL);
159 * Yield until a file descriptor becomes readable
161 * Note that this function clobbers the handlers for the file descriptor.
163 static void coroutine_fn yield_until_fd_readable(int fd)
165 FDYieldUntilData data;
167 assert(qemu_in_coroutine());
168 data.co = qemu_coroutine_self();
169 data.fd = fd;
170 qemu_set_fd_handler(fd, fd_coroutine_enter, NULL, &data);
171 qemu_coroutine_yield();
174 static int socket_get_fd(void *opaque)
176 QEMUFileSocket *s = opaque;
178 return s->fd;
181 static int socket_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
183 QEMUFileSocket *s = opaque;
184 ssize_t len;
186 for (;;) {
187 len = qemu_recv(s->fd, buf, size, 0);
188 if (len != -1) {
189 break;
191 if (socket_error() == EAGAIN) {
192 yield_until_fd_readable(s->fd);
193 } else if (socket_error() != EINTR) {
194 break;
198 if (len == -1) {
199 len = -socket_error();
201 return len;
204 static int socket_put_buffer(void *opaque, const uint8_t *buf, int64_t pos, int size)
206 QEMUFileSocket *s = opaque;
207 ssize_t len;
209 len = qemu_send_full(s->fd, buf, size, 0);
210 if (len < size) {
211 len = -socket_error();
213 return len;
216 static int socket_close(void *opaque)
218 QEMUFileSocket *s = opaque;
219 closesocket(s->fd);
220 g_free(s);
221 return 0;
224 static int stdio_get_fd(void *opaque)
226 QEMUFileStdio *s = opaque;
228 return fileno(s->stdio_file);
231 static int stdio_put_buffer(void *opaque, const uint8_t *buf, int64_t pos, int size)
233 QEMUFileStdio *s = opaque;
234 return fwrite(buf, 1, size, s->stdio_file);
237 static int stdio_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
239 QEMUFileStdio *s = opaque;
240 FILE *fp = s->stdio_file;
241 int bytes;
243 for (;;) {
244 clearerr(fp);
245 bytes = fread(buf, 1, size, fp);
246 if (bytes != 0 || !ferror(fp)) {
247 break;
249 if (errno == EAGAIN) {
250 yield_until_fd_readable(fileno(fp));
251 } else if (errno != EINTR) {
252 break;
255 return bytes;
258 static int stdio_pclose(void *opaque)
260 QEMUFileStdio *s = opaque;
261 int ret;
262 ret = pclose(s->stdio_file);
263 if (ret == -1) {
264 ret = -errno;
265 } else if (!WIFEXITED(ret) || WEXITSTATUS(ret) != 0) {
266 /* close succeeded, but non-zero exit code: */
267 ret = -EIO; /* fake errno value */
269 g_free(s);
270 return ret;
273 static int stdio_fclose(void *opaque)
275 QEMUFileStdio *s = opaque;
276 int ret = 0;
278 if (s->file->ops->put_buffer) {
279 int fd = fileno(s->stdio_file);
280 struct stat st;
282 ret = fstat(fd, &st);
283 if (ret == 0 && S_ISREG(st.st_mode)) {
285 * If the file handle is a regular file make sure the
286 * data is flushed to disk before signaling success.
288 ret = fsync(fd);
289 if (ret != 0) {
290 ret = -errno;
291 return ret;
295 if (fclose(s->stdio_file) == EOF) {
296 ret = -errno;
298 g_free(s);
299 return ret;
302 static const QEMUFileOps stdio_pipe_read_ops = {
303 .get_fd = stdio_get_fd,
304 .get_buffer = stdio_get_buffer,
305 .close = stdio_pclose
308 static const QEMUFileOps stdio_pipe_write_ops = {
309 .get_fd = stdio_get_fd,
310 .put_buffer = stdio_put_buffer,
311 .close = stdio_pclose
314 QEMUFile *qemu_popen_cmd(const char *command, const char *mode)
316 FILE *stdio_file;
317 QEMUFileStdio *s;
319 stdio_file = popen(command, mode);
320 if (stdio_file == NULL) {
321 return NULL;
324 if (mode == NULL || (mode[0] != 'r' && mode[0] != 'w') || mode[1] != 0) {
325 fprintf(stderr, "qemu_popen: Argument validity check failed\n");
326 return NULL;
329 s = g_malloc0(sizeof(QEMUFileStdio));
331 s->stdio_file = stdio_file;
333 if(mode[0] == 'r') {
334 s->file = qemu_fopen_ops(s, &stdio_pipe_read_ops);
335 } else {
336 s->file = qemu_fopen_ops(s, &stdio_pipe_write_ops);
338 return s->file;
341 static const QEMUFileOps stdio_file_read_ops = {
342 .get_fd = stdio_get_fd,
343 .get_buffer = stdio_get_buffer,
344 .close = stdio_fclose
347 static const QEMUFileOps stdio_file_write_ops = {
348 .get_fd = stdio_get_fd,
349 .put_buffer = stdio_put_buffer,
350 .close = stdio_fclose
353 QEMUFile *qemu_fdopen(int fd, const char *mode)
355 QEMUFileStdio *s;
357 if (mode == NULL ||
358 (mode[0] != 'r' && mode[0] != 'w') ||
359 mode[1] != 'b' || mode[2] != 0) {
360 fprintf(stderr, "qemu_fdopen: Argument validity check failed\n");
361 return NULL;
364 s = g_malloc0(sizeof(QEMUFileStdio));
365 s->stdio_file = fdopen(fd, mode);
366 if (!s->stdio_file)
367 goto fail;
369 if(mode[0] == 'r') {
370 s->file = qemu_fopen_ops(s, &stdio_file_read_ops);
371 } else {
372 s->file = qemu_fopen_ops(s, &stdio_file_write_ops);
374 return s->file;
376 fail:
377 g_free(s);
378 return NULL;
381 static const QEMUFileOps socket_read_ops = {
382 .get_fd = socket_get_fd,
383 .get_buffer = socket_get_buffer,
384 .close = socket_close
387 static const QEMUFileOps socket_write_ops = {
388 .get_fd = socket_get_fd,
389 .put_buffer = socket_put_buffer,
390 .close = socket_close
393 QEMUFile *qemu_fopen_socket(int fd, const char *mode)
395 QEMUFileSocket *s = g_malloc0(sizeof(QEMUFileSocket));
397 if (mode == NULL ||
398 (mode[0] != 'r' && mode[0] != 'w') ||
399 mode[1] != 'b' || mode[2] != 0) {
400 fprintf(stderr, "qemu_fopen: Argument validity check failed\n");
401 return NULL;
404 s->fd = fd;
405 if (mode[0] == 'w') {
406 socket_set_block(s->fd);
407 s->file = qemu_fopen_ops(s, &socket_write_ops);
408 } else {
409 s->file = qemu_fopen_ops(s, &socket_read_ops);
411 return s->file;
414 QEMUFile *qemu_fopen(const char *filename, const char *mode)
416 QEMUFileStdio *s;
418 if (mode == NULL ||
419 (mode[0] != 'r' && mode[0] != 'w') ||
420 mode[1] != 'b' || mode[2] != 0) {
421 fprintf(stderr, "qemu_fopen: Argument validity check failed\n");
422 return NULL;
425 s = g_malloc0(sizeof(QEMUFileStdio));
427 s->stdio_file = fopen(filename, mode);
428 if (!s->stdio_file)
429 goto fail;
431 if(mode[0] == 'w') {
432 s->file = qemu_fopen_ops(s, &stdio_file_write_ops);
433 } else {
434 s->file = qemu_fopen_ops(s, &stdio_file_read_ops);
436 return s->file;
437 fail:
438 g_free(s);
439 return NULL;
442 static int block_put_buffer(void *opaque, const uint8_t *buf,
443 int64_t pos, int size)
445 bdrv_save_vmstate(opaque, buf, pos, size);
446 return size;
449 static int block_get_buffer(void *opaque, uint8_t *buf, int64_t pos, int size)
451 return bdrv_load_vmstate(opaque, buf, pos, size);
454 static int bdrv_fclose(void *opaque)
456 return bdrv_flush(opaque);
459 static const QEMUFileOps bdrv_read_ops = {
460 .get_buffer = block_get_buffer,
461 .close = bdrv_fclose
464 static const QEMUFileOps bdrv_write_ops = {
465 .put_buffer = block_put_buffer,
466 .close = bdrv_fclose
469 static QEMUFile *qemu_fopen_bdrv(BlockDriverState *bs, int is_writable)
471 if (is_writable)
472 return qemu_fopen_ops(bs, &bdrv_write_ops);
473 return qemu_fopen_ops(bs, &bdrv_read_ops);
476 QEMUFile *qemu_fopen_ops(void *opaque, const QEMUFileOps *ops)
478 QEMUFile *f;
480 f = g_malloc0(sizeof(QEMUFile));
482 f->opaque = opaque;
483 f->ops = ops;
484 f->is_write = 0;
485 return f;
488 int qemu_file_get_error(QEMUFile *f)
490 return f->last_error;
493 static void qemu_file_set_error(QEMUFile *f, int ret)
495 if (f->last_error == 0) {
496 f->last_error = ret;
500 /** Flushes QEMUFile buffer
503 static void qemu_fflush(QEMUFile *f)
505 int ret = 0;
507 if (!f->ops->put_buffer) {
508 return;
510 if (f->is_write && f->buf_index > 0) {
511 ret = f->ops->put_buffer(f->opaque, f->buf, f->pos, f->buf_index);
512 if (ret >= 0) {
513 f->pos += f->buf_index;
515 f->buf_index = 0;
517 if (ret < 0) {
518 qemu_file_set_error(f, ret);
522 static void qemu_fill_buffer(QEMUFile *f)
524 int len;
525 int pending;
527 if (!f->ops->get_buffer)
528 return;
530 if (f->is_write)
531 abort();
533 pending = f->buf_size - f->buf_index;
534 if (pending > 0) {
535 memmove(f->buf, f->buf + f->buf_index, pending);
537 f->buf_index = 0;
538 f->buf_size = pending;
540 len = f->ops->get_buffer(f->opaque, f->buf + pending, f->pos,
541 IO_BUF_SIZE - pending);
542 if (len > 0) {
543 f->buf_size += len;
544 f->pos += len;
545 } else if (len == 0) {
546 qemu_file_set_error(f, -EIO);
547 } else if (len != -EAGAIN)
548 qemu_file_set_error(f, len);
551 int qemu_get_fd(QEMUFile *f)
553 if (f->ops->get_fd) {
554 return f->ops->get_fd(f->opaque);
556 return -1;
559 /** Closes the file
561 * Returns negative error value if any error happened on previous operations or
562 * while closing the file. Returns 0 or positive number on success.
564 * The meaning of return value on success depends on the specific backend
565 * being used.
567 int qemu_fclose(QEMUFile *f)
569 int ret;
570 qemu_fflush(f);
571 ret = qemu_file_get_error(f);
573 if (f->ops->close) {
574 int ret2 = f->ops->close(f->opaque);
575 if (ret >= 0) {
576 ret = ret2;
579 /* If any error was spotted before closing, we should report it
580 * instead of the close() return value.
582 if (f->last_error) {
583 ret = f->last_error;
585 g_free(f);
586 return ret;
589 void qemu_put_buffer(QEMUFile *f, const uint8_t *buf, int size)
591 int l;
593 if (f->last_error) {
594 return;
597 if (f->is_write == 0 && f->buf_index > 0) {
598 fprintf(stderr,
599 "Attempted to write to buffer while read buffer is not empty\n");
600 abort();
603 while (size > 0) {
604 l = IO_BUF_SIZE - f->buf_index;
605 if (l > size)
606 l = size;
607 memcpy(f->buf + f->buf_index, buf, l);
608 f->is_write = 1;
609 f->buf_index += l;
610 f->bytes_xfer += l;
611 buf += l;
612 size -= l;
613 if (f->buf_index >= IO_BUF_SIZE) {
614 qemu_fflush(f);
615 if (qemu_file_get_error(f)) {
616 break;
622 void qemu_put_byte(QEMUFile *f, int v)
624 if (f->last_error) {
625 return;
628 if (f->is_write == 0 && f->buf_index > 0) {
629 fprintf(stderr,
630 "Attempted to write to buffer while read buffer is not empty\n");
631 abort();
634 f->buf[f->buf_index++] = v;
635 f->is_write = 1;
636 if (f->buf_index >= IO_BUF_SIZE) {
637 qemu_fflush(f);
641 static void qemu_file_skip(QEMUFile *f, int size)
643 if (f->buf_index + size <= f->buf_size) {
644 f->buf_index += size;
648 static int qemu_peek_buffer(QEMUFile *f, uint8_t *buf, int size, size_t offset)
650 int pending;
651 int index;
653 if (f->is_write) {
654 abort();
657 index = f->buf_index + offset;
658 pending = f->buf_size - index;
659 if (pending < size) {
660 qemu_fill_buffer(f);
661 index = f->buf_index + offset;
662 pending = f->buf_size - index;
665 if (pending <= 0) {
666 return 0;
668 if (size > pending) {
669 size = pending;
672 memcpy(buf, f->buf + index, size);
673 return size;
676 int qemu_get_buffer(QEMUFile *f, uint8_t *buf, int size)
678 int pending = size;
679 int done = 0;
681 while (pending > 0) {
682 int res;
684 res = qemu_peek_buffer(f, buf, pending, 0);
685 if (res == 0) {
686 return done;
688 qemu_file_skip(f, res);
689 buf += res;
690 pending -= res;
691 done += res;
693 return done;
696 static int qemu_peek_byte(QEMUFile *f, int offset)
698 int index = f->buf_index + offset;
700 if (f->is_write) {
701 abort();
704 if (index >= f->buf_size) {
705 qemu_fill_buffer(f);
706 index = f->buf_index + offset;
707 if (index >= f->buf_size) {
708 return 0;
711 return f->buf[index];
714 int qemu_get_byte(QEMUFile *f)
716 int result;
718 result = qemu_peek_byte(f, 0);
719 qemu_file_skip(f, 1);
720 return result;
723 int64_t qemu_ftell(QEMUFile *f)
725 qemu_fflush(f);
726 return f->pos;
729 int qemu_file_rate_limit(QEMUFile *f)
731 if (qemu_file_get_error(f)) {
732 return 1;
734 if (f->xfer_limit > 0 && f->bytes_xfer > f->xfer_limit) {
735 return 1;
737 return 0;
740 int64_t qemu_file_get_rate_limit(QEMUFile *f)
742 return f->xfer_limit;
745 void qemu_file_set_rate_limit(QEMUFile *f, int64_t limit)
747 f->xfer_limit = limit;
750 void qemu_file_reset_rate_limit(QEMUFile *f)
752 f->bytes_xfer = 0;
755 void qemu_put_be16(QEMUFile *f, unsigned int v)
757 qemu_put_byte(f, v >> 8);
758 qemu_put_byte(f, v);
761 void qemu_put_be32(QEMUFile *f, unsigned int v)
763 qemu_put_byte(f, v >> 24);
764 qemu_put_byte(f, v >> 16);
765 qemu_put_byte(f, v >> 8);
766 qemu_put_byte(f, v);
769 void qemu_put_be64(QEMUFile *f, uint64_t v)
771 qemu_put_be32(f, v >> 32);
772 qemu_put_be32(f, v);
775 unsigned int qemu_get_be16(QEMUFile *f)
777 unsigned int v;
778 v = qemu_get_byte(f) << 8;
779 v |= qemu_get_byte(f);
780 return v;
783 unsigned int qemu_get_be32(QEMUFile *f)
785 unsigned int v;
786 v = qemu_get_byte(f) << 24;
787 v |= qemu_get_byte(f) << 16;
788 v |= qemu_get_byte(f) << 8;
789 v |= qemu_get_byte(f);
790 return v;
793 uint64_t qemu_get_be64(QEMUFile *f)
795 uint64_t v;
796 v = (uint64_t)qemu_get_be32(f) << 32;
797 v |= qemu_get_be32(f);
798 return v;
802 /* timer */
804 void qemu_put_timer(QEMUFile *f, QEMUTimer *ts)
806 uint64_t expire_time;
808 expire_time = qemu_timer_expire_time_ns(ts);
809 qemu_put_be64(f, expire_time);
812 void qemu_get_timer(QEMUFile *f, QEMUTimer *ts)
814 uint64_t expire_time;
816 expire_time = qemu_get_be64(f);
817 if (expire_time != -1) {
818 qemu_mod_timer_ns(ts, expire_time);
819 } else {
820 qemu_del_timer(ts);
825 /* bool */
827 static int get_bool(QEMUFile *f, void *pv, size_t size)
829 bool *v = pv;
830 *v = qemu_get_byte(f);
831 return 0;
834 static void put_bool(QEMUFile *f, void *pv, size_t size)
836 bool *v = pv;
837 qemu_put_byte(f, *v);
840 const VMStateInfo vmstate_info_bool = {
841 .name = "bool",
842 .get = get_bool,
843 .put = put_bool,
846 /* 8 bit int */
848 static int get_int8(QEMUFile *f, void *pv, size_t size)
850 int8_t *v = pv;
851 qemu_get_s8s(f, v);
852 return 0;
855 static void put_int8(QEMUFile *f, void *pv, size_t size)
857 int8_t *v = pv;
858 qemu_put_s8s(f, v);
861 const VMStateInfo vmstate_info_int8 = {
862 .name = "int8",
863 .get = get_int8,
864 .put = put_int8,
867 /* 16 bit int */
869 static int get_int16(QEMUFile *f, void *pv, size_t size)
871 int16_t *v = pv;
872 qemu_get_sbe16s(f, v);
873 return 0;
876 static void put_int16(QEMUFile *f, void *pv, size_t size)
878 int16_t *v = pv;
879 qemu_put_sbe16s(f, v);
882 const VMStateInfo vmstate_info_int16 = {
883 .name = "int16",
884 .get = get_int16,
885 .put = put_int16,
888 /* 32 bit int */
890 static int get_int32(QEMUFile *f, void *pv, size_t size)
892 int32_t *v = pv;
893 qemu_get_sbe32s(f, v);
894 return 0;
897 static void put_int32(QEMUFile *f, void *pv, size_t size)
899 int32_t *v = pv;
900 qemu_put_sbe32s(f, v);
903 const VMStateInfo vmstate_info_int32 = {
904 .name = "int32",
905 .get = get_int32,
906 .put = put_int32,
909 /* 32 bit int. See that the received value is the same than the one
910 in the field */
912 static int get_int32_equal(QEMUFile *f, void *pv, size_t size)
914 int32_t *v = pv;
915 int32_t v2;
916 qemu_get_sbe32s(f, &v2);
918 if (*v == v2)
919 return 0;
920 return -EINVAL;
923 const VMStateInfo vmstate_info_int32_equal = {
924 .name = "int32 equal",
925 .get = get_int32_equal,
926 .put = put_int32,
929 /* 32 bit int. See that the received value is the less or the same
930 than the one in the field */
932 static int get_int32_le(QEMUFile *f, void *pv, size_t size)
934 int32_t *old = pv;
935 int32_t new;
936 qemu_get_sbe32s(f, &new);
938 if (*old <= new)
939 return 0;
940 return -EINVAL;
943 const VMStateInfo vmstate_info_int32_le = {
944 .name = "int32 equal",
945 .get = get_int32_le,
946 .put = put_int32,
949 /* 64 bit int */
951 static int get_int64(QEMUFile *f, void *pv, size_t size)
953 int64_t *v = pv;
954 qemu_get_sbe64s(f, v);
955 return 0;
958 static void put_int64(QEMUFile *f, void *pv, size_t size)
960 int64_t *v = pv;
961 qemu_put_sbe64s(f, v);
964 const VMStateInfo vmstate_info_int64 = {
965 .name = "int64",
966 .get = get_int64,
967 .put = put_int64,
970 /* 8 bit unsigned int */
972 static int get_uint8(QEMUFile *f, void *pv, size_t size)
974 uint8_t *v = pv;
975 qemu_get_8s(f, v);
976 return 0;
979 static void put_uint8(QEMUFile *f, void *pv, size_t size)
981 uint8_t *v = pv;
982 qemu_put_8s(f, v);
985 const VMStateInfo vmstate_info_uint8 = {
986 .name = "uint8",
987 .get = get_uint8,
988 .put = put_uint8,
991 /* 16 bit unsigned int */
993 static int get_uint16(QEMUFile *f, void *pv, size_t size)
995 uint16_t *v = pv;
996 qemu_get_be16s(f, v);
997 return 0;
1000 static void put_uint16(QEMUFile *f, void *pv, size_t size)
1002 uint16_t *v = pv;
1003 qemu_put_be16s(f, v);
1006 const VMStateInfo vmstate_info_uint16 = {
1007 .name = "uint16",
1008 .get = get_uint16,
1009 .put = put_uint16,
1012 /* 32 bit unsigned int */
1014 static int get_uint32(QEMUFile *f, void *pv, size_t size)
1016 uint32_t *v = pv;
1017 qemu_get_be32s(f, v);
1018 return 0;
1021 static void put_uint32(QEMUFile *f, void *pv, size_t size)
1023 uint32_t *v = pv;
1024 qemu_put_be32s(f, v);
1027 const VMStateInfo vmstate_info_uint32 = {
1028 .name = "uint32",
1029 .get = get_uint32,
1030 .put = put_uint32,
1033 /* 32 bit uint. See that the received value is the same than the one
1034 in the field */
1036 static int get_uint32_equal(QEMUFile *f, void *pv, size_t size)
1038 uint32_t *v = pv;
1039 uint32_t v2;
1040 qemu_get_be32s(f, &v2);
1042 if (*v == v2) {
1043 return 0;
1045 return -EINVAL;
1048 const VMStateInfo vmstate_info_uint32_equal = {
1049 .name = "uint32 equal",
1050 .get = get_uint32_equal,
1051 .put = put_uint32,
1054 /* 64 bit unsigned int */
1056 static int get_uint64(QEMUFile *f, void *pv, size_t size)
1058 uint64_t *v = pv;
1059 qemu_get_be64s(f, v);
1060 return 0;
1063 static void put_uint64(QEMUFile *f, void *pv, size_t size)
1065 uint64_t *v = pv;
1066 qemu_put_be64s(f, v);
1069 const VMStateInfo vmstate_info_uint64 = {
1070 .name = "uint64",
1071 .get = get_uint64,
1072 .put = put_uint64,
1075 /* 8 bit int. See that the received value is the same than the one
1076 in the field */
1078 static int get_uint8_equal(QEMUFile *f, void *pv, size_t size)
1080 uint8_t *v = pv;
1081 uint8_t v2;
1082 qemu_get_8s(f, &v2);
1084 if (*v == v2)
1085 return 0;
1086 return -EINVAL;
1089 const VMStateInfo vmstate_info_uint8_equal = {
1090 .name = "uint8 equal",
1091 .get = get_uint8_equal,
1092 .put = put_uint8,
1095 /* 16 bit unsigned int int. See that the received value is the same than the one
1096 in the field */
1098 static int get_uint16_equal(QEMUFile *f, void *pv, size_t size)
1100 uint16_t *v = pv;
1101 uint16_t v2;
1102 qemu_get_be16s(f, &v2);
1104 if (*v == v2)
1105 return 0;
1106 return -EINVAL;
1109 const VMStateInfo vmstate_info_uint16_equal = {
1110 .name = "uint16 equal",
1111 .get = get_uint16_equal,
1112 .put = put_uint16,
1115 /* timers */
1117 static int get_timer(QEMUFile *f, void *pv, size_t size)
1119 QEMUTimer *v = pv;
1120 qemu_get_timer(f, v);
1121 return 0;
1124 static void put_timer(QEMUFile *f, void *pv, size_t size)
1126 QEMUTimer *v = pv;
1127 qemu_put_timer(f, v);
1130 const VMStateInfo vmstate_info_timer = {
1131 .name = "timer",
1132 .get = get_timer,
1133 .put = put_timer,
1136 /* uint8_t buffers */
1138 static int get_buffer(QEMUFile *f, void *pv, size_t size)
1140 uint8_t *v = pv;
1141 qemu_get_buffer(f, v, size);
1142 return 0;
1145 static void put_buffer(QEMUFile *f, void *pv, size_t size)
1147 uint8_t *v = pv;
1148 qemu_put_buffer(f, v, size);
1151 const VMStateInfo vmstate_info_buffer = {
1152 .name = "buffer",
1153 .get = get_buffer,
1154 .put = put_buffer,
1157 /* unused buffers: space that was used for some fields that are
1158 not useful anymore */
1160 static int get_unused_buffer(QEMUFile *f, void *pv, size_t size)
1162 uint8_t buf[1024];
1163 int block_len;
1165 while (size > 0) {
1166 block_len = MIN(sizeof(buf), size);
1167 size -= block_len;
1168 qemu_get_buffer(f, buf, block_len);
1170 return 0;
1173 static void put_unused_buffer(QEMUFile *f, void *pv, size_t size)
1175 static const uint8_t buf[1024];
1176 int block_len;
1178 while (size > 0) {
1179 block_len = MIN(sizeof(buf), size);
1180 size -= block_len;
1181 qemu_put_buffer(f, buf, block_len);
1185 const VMStateInfo vmstate_info_unused_buffer = {
1186 .name = "unused_buffer",
1187 .get = get_unused_buffer,
1188 .put = put_unused_buffer,
1191 /* bitmaps (as defined by bitmap.h). Note that size here is the size
1192 * of the bitmap in bits. The on-the-wire format of a bitmap is 64
1193 * bit words with the bits in big endian order. The in-memory format
1194 * is an array of 'unsigned long', which may be either 32 or 64 bits.
1196 /* This is the number of 64 bit words sent over the wire */
1197 #define BITS_TO_U64S(nr) DIV_ROUND_UP(nr, 64)
1198 static int get_bitmap(QEMUFile *f, void *pv, size_t size)
1200 unsigned long *bmp = pv;
1201 int i, idx = 0;
1202 for (i = 0; i < BITS_TO_U64S(size); i++) {
1203 uint64_t w = qemu_get_be64(f);
1204 bmp[idx++] = w;
1205 if (sizeof(unsigned long) == 4 && idx < BITS_TO_LONGS(size)) {
1206 bmp[idx++] = w >> 32;
1209 return 0;
1212 static void put_bitmap(QEMUFile *f, void *pv, size_t size)
1214 unsigned long *bmp = pv;
1215 int i, idx = 0;
1216 for (i = 0; i < BITS_TO_U64S(size); i++) {
1217 uint64_t w = bmp[idx++];
1218 if (sizeof(unsigned long) == 4 && idx < BITS_TO_LONGS(size)) {
1219 w |= ((uint64_t)bmp[idx++]) << 32;
1221 qemu_put_be64(f, w);
1225 const VMStateInfo vmstate_info_bitmap = {
1226 .name = "bitmap",
1227 .get = get_bitmap,
1228 .put = put_bitmap,
1231 typedef struct CompatEntry {
1232 char idstr[256];
1233 int instance_id;
1234 } CompatEntry;
1236 typedef struct SaveStateEntry {
1237 QTAILQ_ENTRY(SaveStateEntry) entry;
1238 char idstr[256];
1239 int instance_id;
1240 int alias_id;
1241 int version_id;
1242 int section_id;
1243 SaveVMHandlers *ops;
1244 const VMStateDescription *vmsd;
1245 void *opaque;
1246 CompatEntry *compat;
1247 int no_migrate;
1248 int is_ram;
1249 } SaveStateEntry;
1252 static QTAILQ_HEAD(savevm_handlers, SaveStateEntry) savevm_handlers =
1253 QTAILQ_HEAD_INITIALIZER(savevm_handlers);
1254 static int global_section_id;
1256 static int calculate_new_instance_id(const char *idstr)
1258 SaveStateEntry *se;
1259 int instance_id = 0;
1261 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1262 if (strcmp(idstr, se->idstr) == 0
1263 && instance_id <= se->instance_id) {
1264 instance_id = se->instance_id + 1;
1267 return instance_id;
1270 static int calculate_compat_instance_id(const char *idstr)
1272 SaveStateEntry *se;
1273 int instance_id = 0;
1275 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1276 if (!se->compat)
1277 continue;
1279 if (strcmp(idstr, se->compat->idstr) == 0
1280 && instance_id <= se->compat->instance_id) {
1281 instance_id = se->compat->instance_id + 1;
1284 return instance_id;
1287 /* TODO: Individual devices generally have very little idea about the rest
1288 of the system, so instance_id should be removed/replaced.
1289 Meanwhile pass -1 as instance_id if you do not already have a clearly
1290 distinguishing id for all instances of your device class. */
1291 int register_savevm_live(DeviceState *dev,
1292 const char *idstr,
1293 int instance_id,
1294 int version_id,
1295 SaveVMHandlers *ops,
1296 void *opaque)
1298 SaveStateEntry *se;
1300 se = g_malloc0(sizeof(SaveStateEntry));
1301 se->version_id = version_id;
1302 se->section_id = global_section_id++;
1303 se->ops = ops;
1304 se->opaque = opaque;
1305 se->vmsd = NULL;
1306 se->no_migrate = 0;
1307 /* if this is a live_savem then set is_ram */
1308 if (ops->save_live_setup != NULL) {
1309 se->is_ram = 1;
1312 if (dev) {
1313 char *id = qdev_get_dev_path(dev);
1314 if (id) {
1315 pstrcpy(se->idstr, sizeof(se->idstr), id);
1316 pstrcat(se->idstr, sizeof(se->idstr), "/");
1317 g_free(id);
1319 se->compat = g_malloc0(sizeof(CompatEntry));
1320 pstrcpy(se->compat->idstr, sizeof(se->compat->idstr), idstr);
1321 se->compat->instance_id = instance_id == -1 ?
1322 calculate_compat_instance_id(idstr) : instance_id;
1323 instance_id = -1;
1326 pstrcat(se->idstr, sizeof(se->idstr), idstr);
1328 if (instance_id == -1) {
1329 se->instance_id = calculate_new_instance_id(se->idstr);
1330 } else {
1331 se->instance_id = instance_id;
1333 assert(!se->compat || se->instance_id == 0);
1334 /* add at the end of list */
1335 QTAILQ_INSERT_TAIL(&savevm_handlers, se, entry);
1336 return 0;
1339 int register_savevm(DeviceState *dev,
1340 const char *idstr,
1341 int instance_id,
1342 int version_id,
1343 SaveStateHandler *save_state,
1344 LoadStateHandler *load_state,
1345 void *opaque)
1347 SaveVMHandlers *ops = g_malloc0(sizeof(SaveVMHandlers));
1348 ops->save_state = save_state;
1349 ops->load_state = load_state;
1350 return register_savevm_live(dev, idstr, instance_id, version_id,
1351 ops, opaque);
1354 void unregister_savevm(DeviceState *dev, const char *idstr, void *opaque)
1356 SaveStateEntry *se, *new_se;
1357 char id[256] = "";
1359 if (dev) {
1360 char *path = qdev_get_dev_path(dev);
1361 if (path) {
1362 pstrcpy(id, sizeof(id), path);
1363 pstrcat(id, sizeof(id), "/");
1364 g_free(path);
1367 pstrcat(id, sizeof(id), idstr);
1369 QTAILQ_FOREACH_SAFE(se, &savevm_handlers, entry, new_se) {
1370 if (strcmp(se->idstr, id) == 0 && se->opaque == opaque) {
1371 QTAILQ_REMOVE(&savevm_handlers, se, entry);
1372 if (se->compat) {
1373 g_free(se->compat);
1375 g_free(se->ops);
1376 g_free(se);
1381 int vmstate_register_with_alias_id(DeviceState *dev, int instance_id,
1382 const VMStateDescription *vmsd,
1383 void *opaque, int alias_id,
1384 int required_for_version)
1386 SaveStateEntry *se;
1388 /* If this triggers, alias support can be dropped for the vmsd. */
1389 assert(alias_id == -1 || required_for_version >= vmsd->minimum_version_id);
1391 se = g_malloc0(sizeof(SaveStateEntry));
1392 se->version_id = vmsd->version_id;
1393 se->section_id = global_section_id++;
1394 se->opaque = opaque;
1395 se->vmsd = vmsd;
1396 se->alias_id = alias_id;
1397 se->no_migrate = vmsd->unmigratable;
1399 if (dev) {
1400 char *id = qdev_get_dev_path(dev);
1401 if (id) {
1402 pstrcpy(se->idstr, sizeof(se->idstr), id);
1403 pstrcat(se->idstr, sizeof(se->idstr), "/");
1404 g_free(id);
1406 se->compat = g_malloc0(sizeof(CompatEntry));
1407 pstrcpy(se->compat->idstr, sizeof(se->compat->idstr), vmsd->name);
1408 se->compat->instance_id = instance_id == -1 ?
1409 calculate_compat_instance_id(vmsd->name) : instance_id;
1410 instance_id = -1;
1413 pstrcat(se->idstr, sizeof(se->idstr), vmsd->name);
1415 if (instance_id == -1) {
1416 se->instance_id = calculate_new_instance_id(se->idstr);
1417 } else {
1418 se->instance_id = instance_id;
1420 assert(!se->compat || se->instance_id == 0);
1421 /* add at the end of list */
1422 QTAILQ_INSERT_TAIL(&savevm_handlers, se, entry);
1423 return 0;
1426 void vmstate_unregister(DeviceState *dev, const VMStateDescription *vmsd,
1427 void *opaque)
1429 SaveStateEntry *se, *new_se;
1431 QTAILQ_FOREACH_SAFE(se, &savevm_handlers, entry, new_se) {
1432 if (se->vmsd == vmsd && se->opaque == opaque) {
1433 QTAILQ_REMOVE(&savevm_handlers, se, entry);
1434 if (se->compat) {
1435 g_free(se->compat);
1437 g_free(se);
1442 static void vmstate_subsection_save(QEMUFile *f, const VMStateDescription *vmsd,
1443 void *opaque);
1444 static int vmstate_subsection_load(QEMUFile *f, const VMStateDescription *vmsd,
1445 void *opaque);
1447 int vmstate_load_state(QEMUFile *f, const VMStateDescription *vmsd,
1448 void *opaque, int version_id)
1450 VMStateField *field = vmsd->fields;
1451 int ret;
1453 if (version_id > vmsd->version_id) {
1454 return -EINVAL;
1456 if (version_id < vmsd->minimum_version_id_old) {
1457 return -EINVAL;
1459 if (version_id < vmsd->minimum_version_id) {
1460 return vmsd->load_state_old(f, opaque, version_id);
1462 if (vmsd->pre_load) {
1463 int ret = vmsd->pre_load(opaque);
1464 if (ret)
1465 return ret;
1467 while(field->name) {
1468 if ((field->field_exists &&
1469 field->field_exists(opaque, version_id)) ||
1470 (!field->field_exists &&
1471 field->version_id <= version_id)) {
1472 void *base_addr = opaque + field->offset;
1473 int i, n_elems = 1;
1474 int size = field->size;
1476 if (field->flags & VMS_VBUFFER) {
1477 size = *(int32_t *)(opaque+field->size_offset);
1478 if (field->flags & VMS_MULTIPLY) {
1479 size *= field->size;
1482 if (field->flags & VMS_ARRAY) {
1483 n_elems = field->num;
1484 } else if (field->flags & VMS_VARRAY_INT32) {
1485 n_elems = *(int32_t *)(opaque+field->num_offset);
1486 } else if (field->flags & VMS_VARRAY_UINT32) {
1487 n_elems = *(uint32_t *)(opaque+field->num_offset);
1488 } else if (field->flags & VMS_VARRAY_UINT16) {
1489 n_elems = *(uint16_t *)(opaque+field->num_offset);
1490 } else if (field->flags & VMS_VARRAY_UINT8) {
1491 n_elems = *(uint8_t *)(opaque+field->num_offset);
1493 if (field->flags & VMS_POINTER) {
1494 base_addr = *(void **)base_addr + field->start;
1496 for (i = 0; i < n_elems; i++) {
1497 void *addr = base_addr + size * i;
1499 if (field->flags & VMS_ARRAY_OF_POINTER) {
1500 addr = *(void **)addr;
1502 if (field->flags & VMS_STRUCT) {
1503 ret = vmstate_load_state(f, field->vmsd, addr, field->vmsd->version_id);
1504 } else {
1505 ret = field->info->get(f, addr, size);
1508 if (ret < 0) {
1509 return ret;
1513 field++;
1515 ret = vmstate_subsection_load(f, vmsd, opaque);
1516 if (ret != 0) {
1517 return ret;
1519 if (vmsd->post_load) {
1520 return vmsd->post_load(opaque, version_id);
1522 return 0;
1525 void vmstate_save_state(QEMUFile *f, const VMStateDescription *vmsd,
1526 void *opaque)
1528 VMStateField *field = vmsd->fields;
1530 if (vmsd->pre_save) {
1531 vmsd->pre_save(opaque);
1533 while(field->name) {
1534 if (!field->field_exists ||
1535 field->field_exists(opaque, vmsd->version_id)) {
1536 void *base_addr = opaque + field->offset;
1537 int i, n_elems = 1;
1538 int size = field->size;
1540 if (field->flags & VMS_VBUFFER) {
1541 size = *(int32_t *)(opaque+field->size_offset);
1542 if (field->flags & VMS_MULTIPLY) {
1543 size *= field->size;
1546 if (field->flags & VMS_ARRAY) {
1547 n_elems = field->num;
1548 } else if (field->flags & VMS_VARRAY_INT32) {
1549 n_elems = *(int32_t *)(opaque+field->num_offset);
1550 } else if (field->flags & VMS_VARRAY_UINT32) {
1551 n_elems = *(uint32_t *)(opaque+field->num_offset);
1552 } else if (field->flags & VMS_VARRAY_UINT16) {
1553 n_elems = *(uint16_t *)(opaque+field->num_offset);
1554 } else if (field->flags & VMS_VARRAY_UINT8) {
1555 n_elems = *(uint8_t *)(opaque+field->num_offset);
1557 if (field->flags & VMS_POINTER) {
1558 base_addr = *(void **)base_addr + field->start;
1560 for (i = 0; i < n_elems; i++) {
1561 void *addr = base_addr + size * i;
1563 if (field->flags & VMS_ARRAY_OF_POINTER) {
1564 addr = *(void **)addr;
1566 if (field->flags & VMS_STRUCT) {
1567 vmstate_save_state(f, field->vmsd, addr);
1568 } else {
1569 field->info->put(f, addr, size);
1573 field++;
1575 vmstate_subsection_save(f, vmsd, opaque);
1578 static int vmstate_load(QEMUFile *f, SaveStateEntry *se, int version_id)
1580 if (!se->vmsd) { /* Old style */
1581 return se->ops->load_state(f, se->opaque, version_id);
1583 return vmstate_load_state(f, se->vmsd, se->opaque, version_id);
1586 static void vmstate_save(QEMUFile *f, SaveStateEntry *se)
1588 if (!se->vmsd) { /* Old style */
1589 se->ops->save_state(f, se->opaque);
1590 return;
1592 vmstate_save_state(f,se->vmsd, se->opaque);
1595 #define QEMU_VM_FILE_MAGIC 0x5145564d
1596 #define QEMU_VM_FILE_VERSION_COMPAT 0x00000002
1597 #define QEMU_VM_FILE_VERSION 0x00000003
1599 #define QEMU_VM_EOF 0x00
1600 #define QEMU_VM_SECTION_START 0x01
1601 #define QEMU_VM_SECTION_PART 0x02
1602 #define QEMU_VM_SECTION_END 0x03
1603 #define QEMU_VM_SECTION_FULL 0x04
1604 #define QEMU_VM_SUBSECTION 0x05
1606 bool qemu_savevm_state_blocked(Error **errp)
1608 SaveStateEntry *se;
1610 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1611 if (se->no_migrate) {
1612 error_set(errp, QERR_MIGRATION_NOT_SUPPORTED, se->idstr);
1613 return true;
1616 return false;
1619 void qemu_savevm_state_begin(QEMUFile *f,
1620 const MigrationParams *params)
1622 SaveStateEntry *se;
1623 int ret;
1625 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1626 if (!se->ops || !se->ops->set_params) {
1627 continue;
1629 se->ops->set_params(params, se->opaque);
1632 qemu_put_be32(f, QEMU_VM_FILE_MAGIC);
1633 qemu_put_be32(f, QEMU_VM_FILE_VERSION);
1635 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1636 int len;
1638 if (!se->ops || !se->ops->save_live_setup) {
1639 continue;
1641 if (se->ops && se->ops->is_active) {
1642 if (!se->ops->is_active(se->opaque)) {
1643 continue;
1646 /* Section type */
1647 qemu_put_byte(f, QEMU_VM_SECTION_START);
1648 qemu_put_be32(f, se->section_id);
1650 /* ID string */
1651 len = strlen(se->idstr);
1652 qemu_put_byte(f, len);
1653 qemu_put_buffer(f, (uint8_t *)se->idstr, len);
1655 qemu_put_be32(f, se->instance_id);
1656 qemu_put_be32(f, se->version_id);
1658 ret = se->ops->save_live_setup(f, se->opaque);
1659 if (ret < 0) {
1660 qemu_file_set_error(f, ret);
1661 break;
1667 * this function has three return values:
1668 * negative: there was one error, and we have -errno.
1669 * 0 : We haven't finished, caller have to go again
1670 * 1 : We have finished, we can go to complete phase
1672 int qemu_savevm_state_iterate(QEMUFile *f)
1674 SaveStateEntry *se;
1675 int ret = 1;
1677 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1678 if (!se->ops || !se->ops->save_live_iterate) {
1679 continue;
1681 if (se->ops && se->ops->is_active) {
1682 if (!se->ops->is_active(se->opaque)) {
1683 continue;
1686 if (qemu_file_rate_limit(f)) {
1687 return 0;
1689 trace_savevm_section_start();
1690 /* Section type */
1691 qemu_put_byte(f, QEMU_VM_SECTION_PART);
1692 qemu_put_be32(f, se->section_id);
1694 ret = se->ops->save_live_iterate(f, se->opaque);
1695 trace_savevm_section_end(se->section_id);
1697 if (ret < 0) {
1698 qemu_file_set_error(f, ret);
1700 if (ret <= 0) {
1701 /* Do not proceed to the next vmstate before this one reported
1702 completion of the current stage. This serializes the migration
1703 and reduces the probability that a faster changing state is
1704 synchronized over and over again. */
1705 break;
1708 return ret;
1711 void qemu_savevm_state_complete(QEMUFile *f)
1713 SaveStateEntry *se;
1714 int ret;
1716 cpu_synchronize_all_states();
1718 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1719 if (!se->ops || !se->ops->save_live_complete) {
1720 continue;
1722 if (se->ops && se->ops->is_active) {
1723 if (!se->ops->is_active(se->opaque)) {
1724 continue;
1727 trace_savevm_section_start();
1728 /* Section type */
1729 qemu_put_byte(f, QEMU_VM_SECTION_END);
1730 qemu_put_be32(f, se->section_id);
1732 ret = se->ops->save_live_complete(f, se->opaque);
1733 trace_savevm_section_end(se->section_id);
1734 if (ret < 0) {
1735 qemu_file_set_error(f, ret);
1736 return;
1740 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1741 int len;
1743 if ((!se->ops || !se->ops->save_state) && !se->vmsd) {
1744 continue;
1746 trace_savevm_section_start();
1747 /* Section type */
1748 qemu_put_byte(f, QEMU_VM_SECTION_FULL);
1749 qemu_put_be32(f, se->section_id);
1751 /* ID string */
1752 len = strlen(se->idstr);
1753 qemu_put_byte(f, len);
1754 qemu_put_buffer(f, (uint8_t *)se->idstr, len);
1756 qemu_put_be32(f, se->instance_id);
1757 qemu_put_be32(f, se->version_id);
1759 vmstate_save(f, se);
1760 trace_savevm_section_end(se->section_id);
1763 qemu_put_byte(f, QEMU_VM_EOF);
1764 qemu_fflush(f);
1767 uint64_t qemu_savevm_state_pending(QEMUFile *f, uint64_t max_size)
1769 SaveStateEntry *se;
1770 uint64_t ret = 0;
1772 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1773 if (!se->ops || !se->ops->save_live_pending) {
1774 continue;
1776 if (se->ops && se->ops->is_active) {
1777 if (!se->ops->is_active(se->opaque)) {
1778 continue;
1781 ret += se->ops->save_live_pending(f, se->opaque, max_size);
1783 return ret;
1786 void qemu_savevm_state_cancel(void)
1788 SaveStateEntry *se;
1790 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1791 if (se->ops && se->ops->cancel) {
1792 se->ops->cancel(se->opaque);
1797 static int qemu_savevm_state(QEMUFile *f)
1799 int ret;
1800 MigrationParams params = {
1801 .blk = 0,
1802 .shared = 0
1805 if (qemu_savevm_state_blocked(NULL)) {
1806 return -EINVAL;
1809 qemu_mutex_unlock_iothread();
1810 qemu_savevm_state_begin(f, &params);
1811 qemu_mutex_lock_iothread();
1813 while (qemu_file_get_error(f) == 0) {
1814 if (qemu_savevm_state_iterate(f) > 0) {
1815 break;
1819 ret = qemu_file_get_error(f);
1820 if (ret == 0) {
1821 qemu_savevm_state_complete(f);
1822 ret = qemu_file_get_error(f);
1824 if (ret != 0) {
1825 qemu_savevm_state_cancel();
1827 return ret;
1830 static int qemu_save_device_state(QEMUFile *f)
1832 SaveStateEntry *se;
1834 qemu_put_be32(f, QEMU_VM_FILE_MAGIC);
1835 qemu_put_be32(f, QEMU_VM_FILE_VERSION);
1837 cpu_synchronize_all_states();
1839 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1840 int len;
1842 if (se->is_ram) {
1843 continue;
1845 if ((!se->ops || !se->ops->save_state) && !se->vmsd) {
1846 continue;
1849 /* Section type */
1850 qemu_put_byte(f, QEMU_VM_SECTION_FULL);
1851 qemu_put_be32(f, se->section_id);
1853 /* ID string */
1854 len = strlen(se->idstr);
1855 qemu_put_byte(f, len);
1856 qemu_put_buffer(f, (uint8_t *)se->idstr, len);
1858 qemu_put_be32(f, se->instance_id);
1859 qemu_put_be32(f, se->version_id);
1861 vmstate_save(f, se);
1864 qemu_put_byte(f, QEMU_VM_EOF);
1866 return qemu_file_get_error(f);
1869 static SaveStateEntry *find_se(const char *idstr, int instance_id)
1871 SaveStateEntry *se;
1873 QTAILQ_FOREACH(se, &savevm_handlers, entry) {
1874 if (!strcmp(se->idstr, idstr) &&
1875 (instance_id == se->instance_id ||
1876 instance_id == se->alias_id))
1877 return se;
1878 /* Migrating from an older version? */
1879 if (strstr(se->idstr, idstr) && se->compat) {
1880 if (!strcmp(se->compat->idstr, idstr) &&
1881 (instance_id == se->compat->instance_id ||
1882 instance_id == se->alias_id))
1883 return se;
1886 return NULL;
1889 static const VMStateDescription *vmstate_get_subsection(const VMStateSubsection *sub, char *idstr)
1891 while(sub && sub->needed) {
1892 if (strcmp(idstr, sub->vmsd->name) == 0) {
1893 return sub->vmsd;
1895 sub++;
1897 return NULL;
1900 static int vmstate_subsection_load(QEMUFile *f, const VMStateDescription *vmsd,
1901 void *opaque)
1903 while (qemu_peek_byte(f, 0) == QEMU_VM_SUBSECTION) {
1904 char idstr[256];
1905 int ret;
1906 uint8_t version_id, len, size;
1907 const VMStateDescription *sub_vmsd;
1909 len = qemu_peek_byte(f, 1);
1910 if (len < strlen(vmsd->name) + 1) {
1911 /* subsection name has be be "section_name/a" */
1912 return 0;
1914 size = qemu_peek_buffer(f, (uint8_t *)idstr, len, 2);
1915 if (size != len) {
1916 return 0;
1918 idstr[size] = 0;
1920 if (strncmp(vmsd->name, idstr, strlen(vmsd->name)) != 0) {
1921 /* it don't have a valid subsection name */
1922 return 0;
1924 sub_vmsd = vmstate_get_subsection(vmsd->subsections, idstr);
1925 if (sub_vmsd == NULL) {
1926 return -ENOENT;
1928 qemu_file_skip(f, 1); /* subsection */
1929 qemu_file_skip(f, 1); /* len */
1930 qemu_file_skip(f, len); /* idstr */
1931 version_id = qemu_get_be32(f);
1933 ret = vmstate_load_state(f, sub_vmsd, opaque, version_id);
1934 if (ret) {
1935 return ret;
1938 return 0;
1941 static void vmstate_subsection_save(QEMUFile *f, const VMStateDescription *vmsd,
1942 void *opaque)
1944 const VMStateSubsection *sub = vmsd->subsections;
1946 while (sub && sub->needed) {
1947 if (sub->needed(opaque)) {
1948 const VMStateDescription *vmsd = sub->vmsd;
1949 uint8_t len;
1951 qemu_put_byte(f, QEMU_VM_SUBSECTION);
1952 len = strlen(vmsd->name);
1953 qemu_put_byte(f, len);
1954 qemu_put_buffer(f, (uint8_t *)vmsd->name, len);
1955 qemu_put_be32(f, vmsd->version_id);
1956 vmstate_save_state(f, vmsd, opaque);
1958 sub++;
1962 typedef struct LoadStateEntry {
1963 QLIST_ENTRY(LoadStateEntry) entry;
1964 SaveStateEntry *se;
1965 int section_id;
1966 int version_id;
1967 } LoadStateEntry;
1969 int qemu_loadvm_state(QEMUFile *f)
1971 QLIST_HEAD(, LoadStateEntry) loadvm_handlers =
1972 QLIST_HEAD_INITIALIZER(loadvm_handlers);
1973 LoadStateEntry *le, *new_le;
1974 uint8_t section_type;
1975 unsigned int v;
1976 int ret;
1978 if (qemu_savevm_state_blocked(NULL)) {
1979 return -EINVAL;
1982 v = qemu_get_be32(f);
1983 if (v != QEMU_VM_FILE_MAGIC)
1984 return -EINVAL;
1986 v = qemu_get_be32(f);
1987 if (v == QEMU_VM_FILE_VERSION_COMPAT) {
1988 fprintf(stderr, "SaveVM v2 format is obsolete and don't work anymore\n");
1989 return -ENOTSUP;
1991 if (v != QEMU_VM_FILE_VERSION)
1992 return -ENOTSUP;
1994 while ((section_type = qemu_get_byte(f)) != QEMU_VM_EOF) {
1995 uint32_t instance_id, version_id, section_id;
1996 SaveStateEntry *se;
1997 char idstr[257];
1998 int len;
2000 switch (section_type) {
2001 case QEMU_VM_SECTION_START:
2002 case QEMU_VM_SECTION_FULL:
2003 /* Read section start */
2004 section_id = qemu_get_be32(f);
2005 len = qemu_get_byte(f);
2006 qemu_get_buffer(f, (uint8_t *)idstr, len);
2007 idstr[len] = 0;
2008 instance_id = qemu_get_be32(f);
2009 version_id = qemu_get_be32(f);
2011 /* Find savevm section */
2012 se = find_se(idstr, instance_id);
2013 if (se == NULL) {
2014 fprintf(stderr, "Unknown savevm section or instance '%s' %d\n", idstr, instance_id);
2015 ret = -EINVAL;
2016 goto out;
2019 /* Validate version */
2020 if (version_id > se->version_id) {
2021 fprintf(stderr, "savevm: unsupported version %d for '%s' v%d\n",
2022 version_id, idstr, se->version_id);
2023 ret = -EINVAL;
2024 goto out;
2027 /* Add entry */
2028 le = g_malloc0(sizeof(*le));
2030 le->se = se;
2031 le->section_id = section_id;
2032 le->version_id = version_id;
2033 QLIST_INSERT_HEAD(&loadvm_handlers, le, entry);
2035 ret = vmstate_load(f, le->se, le->version_id);
2036 if (ret < 0) {
2037 fprintf(stderr, "qemu: warning: error while loading state for instance 0x%x of device '%s'\n",
2038 instance_id, idstr);
2039 goto out;
2041 break;
2042 case QEMU_VM_SECTION_PART:
2043 case QEMU_VM_SECTION_END:
2044 section_id = qemu_get_be32(f);
2046 QLIST_FOREACH(le, &loadvm_handlers, entry) {
2047 if (le->section_id == section_id) {
2048 break;
2051 if (le == NULL) {
2052 fprintf(stderr, "Unknown savevm section %d\n", section_id);
2053 ret = -EINVAL;
2054 goto out;
2057 ret = vmstate_load(f, le->se, le->version_id);
2058 if (ret < 0) {
2059 fprintf(stderr, "qemu: warning: error while loading state section id %d\n",
2060 section_id);
2061 goto out;
2063 break;
2064 default:
2065 fprintf(stderr, "Unknown savevm section type %d\n", section_type);
2066 ret = -EINVAL;
2067 goto out;
2071 cpu_synchronize_all_post_init();
2073 ret = 0;
2075 out:
2076 QLIST_FOREACH_SAFE(le, &loadvm_handlers, entry, new_le) {
2077 QLIST_REMOVE(le, entry);
2078 g_free(le);
2081 if (ret == 0) {
2082 ret = qemu_file_get_error(f);
2085 return ret;
2088 static int bdrv_snapshot_find(BlockDriverState *bs, QEMUSnapshotInfo *sn_info,
2089 const char *name)
2091 QEMUSnapshotInfo *sn_tab, *sn;
2092 int nb_sns, i, ret;
2094 ret = -ENOENT;
2095 nb_sns = bdrv_snapshot_list(bs, &sn_tab);
2096 if (nb_sns < 0)
2097 return ret;
2098 for(i = 0; i < nb_sns; i++) {
2099 sn = &sn_tab[i];
2100 if (!strcmp(sn->id_str, name) || !strcmp(sn->name, name)) {
2101 *sn_info = *sn;
2102 ret = 0;
2103 break;
2106 g_free(sn_tab);
2107 return ret;
2111 * Deletes snapshots of a given name in all opened images.
2113 static int del_existing_snapshots(Monitor *mon, const char *name)
2115 BlockDriverState *bs;
2116 QEMUSnapshotInfo sn1, *snapshot = &sn1;
2117 int ret;
2119 bs = NULL;
2120 while ((bs = bdrv_next(bs))) {
2121 if (bdrv_can_snapshot(bs) &&
2122 bdrv_snapshot_find(bs, snapshot, name) >= 0)
2124 ret = bdrv_snapshot_delete(bs, name);
2125 if (ret < 0) {
2126 monitor_printf(mon,
2127 "Error while deleting snapshot on '%s'\n",
2128 bdrv_get_device_name(bs));
2129 return -1;
2134 return 0;
2137 void do_savevm(Monitor *mon, const QDict *qdict)
2139 BlockDriverState *bs, *bs1;
2140 QEMUSnapshotInfo sn1, *sn = &sn1, old_sn1, *old_sn = &old_sn1;
2141 int ret;
2142 QEMUFile *f;
2143 int saved_vm_running;
2144 uint64_t vm_state_size;
2145 qemu_timeval tv;
2146 struct tm tm;
2147 const char *name = qdict_get_try_str(qdict, "name");
2149 /* Verify if there is a device that doesn't support snapshots and is writable */
2150 bs = NULL;
2151 while ((bs = bdrv_next(bs))) {
2153 if (!bdrv_is_inserted(bs) || bdrv_is_read_only(bs)) {
2154 continue;
2157 if (!bdrv_can_snapshot(bs)) {
2158 monitor_printf(mon, "Device '%s' is writable but does not support snapshots.\n",
2159 bdrv_get_device_name(bs));
2160 return;
2164 bs = bdrv_snapshots();
2165 if (!bs) {
2166 monitor_printf(mon, "No block device can accept snapshots\n");
2167 return;
2170 saved_vm_running = runstate_is_running();
2171 vm_stop(RUN_STATE_SAVE_VM);
2173 memset(sn, 0, sizeof(*sn));
2175 /* fill auxiliary fields */
2176 qemu_gettimeofday(&tv);
2177 sn->date_sec = tv.tv_sec;
2178 sn->date_nsec = tv.tv_usec * 1000;
2179 sn->vm_clock_nsec = qemu_get_clock_ns(vm_clock);
2181 if (name) {
2182 ret = bdrv_snapshot_find(bs, old_sn, name);
2183 if (ret >= 0) {
2184 pstrcpy(sn->name, sizeof(sn->name), old_sn->name);
2185 pstrcpy(sn->id_str, sizeof(sn->id_str), old_sn->id_str);
2186 } else {
2187 pstrcpy(sn->name, sizeof(sn->name), name);
2189 } else {
2190 /* cast below needed for OpenBSD where tv_sec is still 'long' */
2191 localtime_r((const time_t *)&tv.tv_sec, &tm);
2192 strftime(sn->name, sizeof(sn->name), "vm-%Y%m%d%H%M%S", &tm);
2195 /* Delete old snapshots of the same name */
2196 if (name && del_existing_snapshots(mon, name) < 0) {
2197 goto the_end;
2200 /* save the VM state */
2201 f = qemu_fopen_bdrv(bs, 1);
2202 if (!f) {
2203 monitor_printf(mon, "Could not open VM state file\n");
2204 goto the_end;
2206 ret = qemu_savevm_state(f);
2207 vm_state_size = qemu_ftell(f);
2208 qemu_fclose(f);
2209 if (ret < 0) {
2210 monitor_printf(mon, "Error %d while writing VM\n", ret);
2211 goto the_end;
2214 /* create the snapshots */
2216 bs1 = NULL;
2217 while ((bs1 = bdrv_next(bs1))) {
2218 if (bdrv_can_snapshot(bs1)) {
2219 /* Write VM state size only to the image that contains the state */
2220 sn->vm_state_size = (bs == bs1 ? vm_state_size : 0);
2221 ret = bdrv_snapshot_create(bs1, sn);
2222 if (ret < 0) {
2223 monitor_printf(mon, "Error while creating snapshot on '%s'\n",
2224 bdrv_get_device_name(bs1));
2229 the_end:
2230 if (saved_vm_running)
2231 vm_start();
2234 void qmp_xen_save_devices_state(const char *filename, Error **errp)
2236 QEMUFile *f;
2237 int saved_vm_running;
2238 int ret;
2240 saved_vm_running = runstate_is_running();
2241 vm_stop(RUN_STATE_SAVE_VM);
2243 f = qemu_fopen(filename, "wb");
2244 if (!f) {
2245 error_set(errp, QERR_OPEN_FILE_FAILED, filename);
2246 goto the_end;
2248 ret = qemu_save_device_state(f);
2249 qemu_fclose(f);
2250 if (ret < 0) {
2251 error_set(errp, QERR_IO_ERROR);
2254 the_end:
2255 if (saved_vm_running)
2256 vm_start();
2259 int load_vmstate(const char *name)
2261 BlockDriverState *bs, *bs_vm_state;
2262 QEMUSnapshotInfo sn;
2263 QEMUFile *f;
2264 int ret;
2266 bs_vm_state = bdrv_snapshots();
2267 if (!bs_vm_state) {
2268 error_report("No block device supports snapshots");
2269 return -ENOTSUP;
2272 /* Don't even try to load empty VM states */
2273 ret = bdrv_snapshot_find(bs_vm_state, &sn, name);
2274 if (ret < 0) {
2275 return ret;
2276 } else if (sn.vm_state_size == 0) {
2277 error_report("This is a disk-only snapshot. Revert to it offline "
2278 "using qemu-img.");
2279 return -EINVAL;
2282 /* Verify if there is any device that doesn't support snapshots and is
2283 writable and check if the requested snapshot is available too. */
2284 bs = NULL;
2285 while ((bs = bdrv_next(bs))) {
2287 if (!bdrv_is_inserted(bs) || bdrv_is_read_only(bs)) {
2288 continue;
2291 if (!bdrv_can_snapshot(bs)) {
2292 error_report("Device '%s' is writable but does not support snapshots.",
2293 bdrv_get_device_name(bs));
2294 return -ENOTSUP;
2297 ret = bdrv_snapshot_find(bs, &sn, name);
2298 if (ret < 0) {
2299 error_report("Device '%s' does not have the requested snapshot '%s'",
2300 bdrv_get_device_name(bs), name);
2301 return ret;
2305 /* Flush all IO requests so they don't interfere with the new state. */
2306 bdrv_drain_all();
2308 bs = NULL;
2309 while ((bs = bdrv_next(bs))) {
2310 if (bdrv_can_snapshot(bs)) {
2311 ret = bdrv_snapshot_goto(bs, name);
2312 if (ret < 0) {
2313 error_report("Error %d while activating snapshot '%s' on '%s'",
2314 ret, name, bdrv_get_device_name(bs));
2315 return ret;
2320 /* restore the VM state */
2321 f = qemu_fopen_bdrv(bs_vm_state, 0);
2322 if (!f) {
2323 error_report("Could not open VM state file");
2324 return -EINVAL;
2327 qemu_system_reset(VMRESET_SILENT);
2328 ret = qemu_loadvm_state(f);
2330 qemu_fclose(f);
2331 if (ret < 0) {
2332 error_report("Error %d while loading VM state", ret);
2333 return ret;
2336 return 0;
2339 void do_delvm(Monitor *mon, const QDict *qdict)
2341 BlockDriverState *bs, *bs1;
2342 int ret;
2343 const char *name = qdict_get_str(qdict, "name");
2345 bs = bdrv_snapshots();
2346 if (!bs) {
2347 monitor_printf(mon, "No block device supports snapshots\n");
2348 return;
2351 bs1 = NULL;
2352 while ((bs1 = bdrv_next(bs1))) {
2353 if (bdrv_can_snapshot(bs1)) {
2354 ret = bdrv_snapshot_delete(bs1, name);
2355 if (ret < 0) {
2356 if (ret == -ENOTSUP)
2357 monitor_printf(mon,
2358 "Snapshots not supported on device '%s'\n",
2359 bdrv_get_device_name(bs1));
2360 else
2361 monitor_printf(mon, "Error %d while deleting snapshot on "
2362 "'%s'\n", ret, bdrv_get_device_name(bs1));
2368 void do_info_snapshots(Monitor *mon, const QDict *qdict)
2370 BlockDriverState *bs, *bs1;
2371 QEMUSnapshotInfo *sn_tab, *sn, s, *sn_info = &s;
2372 int nb_sns, i, ret, available;
2373 int total;
2374 int *available_snapshots;
2375 char buf[256];
2377 bs = bdrv_snapshots();
2378 if (!bs) {
2379 monitor_printf(mon, "No available block device supports snapshots\n");
2380 return;
2383 nb_sns = bdrv_snapshot_list(bs, &sn_tab);
2384 if (nb_sns < 0) {
2385 monitor_printf(mon, "bdrv_snapshot_list: error %d\n", nb_sns);
2386 return;
2389 if (nb_sns == 0) {
2390 monitor_printf(mon, "There is no snapshot available.\n");
2391 return;
2394 available_snapshots = g_malloc0(sizeof(int) * nb_sns);
2395 total = 0;
2396 for (i = 0; i < nb_sns; i++) {
2397 sn = &sn_tab[i];
2398 available = 1;
2399 bs1 = NULL;
2401 while ((bs1 = bdrv_next(bs1))) {
2402 if (bdrv_can_snapshot(bs1) && bs1 != bs) {
2403 ret = bdrv_snapshot_find(bs1, sn_info, sn->id_str);
2404 if (ret < 0) {
2405 available = 0;
2406 break;
2411 if (available) {
2412 available_snapshots[total] = i;
2413 total++;
2417 if (total > 0) {
2418 monitor_printf(mon, "%s\n", bdrv_snapshot_dump(buf, sizeof(buf), NULL));
2419 for (i = 0; i < total; i++) {
2420 sn = &sn_tab[available_snapshots[i]];
2421 monitor_printf(mon, "%s\n", bdrv_snapshot_dump(buf, sizeof(buf), sn));
2423 } else {
2424 monitor_printf(mon, "There is no suitable snapshot available\n");
2427 g_free(sn_tab);
2428 g_free(available_snapshots);
2432 void vmstate_register_ram(MemoryRegion *mr, DeviceState *dev)
2434 qemu_ram_set_idstr(memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK,
2435 memory_region_name(mr), dev);
2438 void vmstate_unregister_ram(MemoryRegion *mr, DeviceState *dev)
2440 /* Nothing do to while the implementation is in RAMBlock */
2443 void vmstate_register_ram_global(MemoryRegion *mr)
2445 vmstate_register_ram(mr, NULL);