1 // SPDX-License-Identifier: GPL-2.0-only
3 * linux/kernel/power/swap.c
5 * This file provides functions for reading the suspend image from
6 * and writing it to a swap partition.
8 * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@ucw.cz>
9 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
10 * Copyright (C) 2010-2012 Bojan Smojver <bojan@rexursive.com>
13 #define pr_fmt(fmt) "PM: " fmt
15 #include <linux/module.h>
16 #include <linux/file.h>
17 #include <linux/delay.h>
18 #include <linux/bitops.h>
19 #include <linux/genhd.h>
20 #include <linux/device.h>
21 #include <linux/bio.h>
22 #include <linux/blkdev.h>
23 #include <linux/swap.h>
24 #include <linux/swapops.h>
26 #include <linux/slab.h>
27 #include <linux/lzo.h>
28 #include <linux/vmalloc.h>
29 #include <linux/cpumask.h>
30 #include <linux/atomic.h>
31 #include <linux/kthread.h>
32 #include <linux/crc32.h>
33 #include <linux/ktime.h>
37 #define HIBERNATE_SIG "S1SUSPEND"
40 * When reading an {un,}compressed image, we may restore pages in place,
41 * in which case some architectures need these pages cleaning before they
42 * can be executed. We don't know which pages these may be, so clean the lot.
44 static bool clean_pages_on_read
;
45 static bool clean_pages_on_decompress
;
48 * The swap map is a data structure used for keeping track of each page
49 * written to a swap partition. It consists of many swap_map_page
50 * structures that contain each an array of MAP_PAGE_ENTRIES swap entries.
51 * These structures are stored on the swap and linked together with the
52 * help of the .next_swap member.
54 * The swap map is created during suspend. The swap map pages are
55 * allocated and populated one at a time, so we only need one memory
56 * page to set up the entire structure.
58 * During resume we pick up all swap_map_page structures into a list.
61 #define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(sector_t) - 1)
64 * Number of free pages that are not high.
66 static inline unsigned long low_free_pages(void)
68 return nr_free_pages() - nr_free_highpages();
72 * Number of pages required to be kept free while writing the image. Always
73 * half of all available low pages before the writing starts.
75 static inline unsigned long reqd_free_pages(void)
77 return low_free_pages() / 2;
80 struct swap_map_page
{
81 sector_t entries
[MAP_PAGE_ENTRIES
];
85 struct swap_map_page_list
{
86 struct swap_map_page
*map
;
87 struct swap_map_page_list
*next
;
91 * The swap_map_handle structure is used for handling swap in
95 struct swap_map_handle
{
96 struct swap_map_page
*cur
;
97 struct swap_map_page_list
*maps
;
99 sector_t first_sector
;
101 unsigned long reqd_free_pages
;
105 struct swsusp_header
{
106 char reserved
[PAGE_SIZE
- 20 - sizeof(sector_t
) - sizeof(int) -
110 unsigned int flags
; /* Flags to pass to the "boot" kernel */
115 static struct swsusp_header
*swsusp_header
;
118 * The following functions are used for tracing the allocated
119 * swap pages, so that they can be freed in case of an error.
122 struct swsusp_extent
{
128 static struct rb_root swsusp_extents
= RB_ROOT
;
130 static int swsusp_extents_insert(unsigned long swap_offset
)
132 struct rb_node
**new = &(swsusp_extents
.rb_node
);
133 struct rb_node
*parent
= NULL
;
134 struct swsusp_extent
*ext
;
136 /* Figure out where to put the new node */
138 ext
= rb_entry(*new, struct swsusp_extent
, node
);
140 if (swap_offset
< ext
->start
) {
142 if (swap_offset
== ext
->start
- 1) {
146 new = &((*new)->rb_left
);
147 } else if (swap_offset
> ext
->end
) {
149 if (swap_offset
== ext
->end
+ 1) {
153 new = &((*new)->rb_right
);
155 /* It already is in the tree */
159 /* Add the new node and rebalance the tree. */
160 ext
= kzalloc(sizeof(struct swsusp_extent
), GFP_KERNEL
);
164 ext
->start
= swap_offset
;
165 ext
->end
= swap_offset
;
166 rb_link_node(&ext
->node
, parent
, new);
167 rb_insert_color(&ext
->node
, &swsusp_extents
);
172 * alloc_swapdev_block - allocate a swap page and register that it has
173 * been allocated, so that it can be freed in case of an error.
176 sector_t
alloc_swapdev_block(int swap
)
178 unsigned long offset
;
180 offset
= swp_offset(get_swap_page_of_type(swap
));
182 if (swsusp_extents_insert(offset
))
183 swap_free(swp_entry(swap
, offset
));
185 return swapdev_block(swap
, offset
);
191 * free_all_swap_pages - free swap pages allocated for saving image data.
192 * It also frees the extents used to register which swap entries had been
196 void free_all_swap_pages(int swap
)
198 struct rb_node
*node
;
200 while ((node
= swsusp_extents
.rb_node
)) {
201 struct swsusp_extent
*ext
;
202 unsigned long offset
;
204 ext
= rb_entry(node
, struct swsusp_extent
, node
);
205 rb_erase(node
, &swsusp_extents
);
206 for (offset
= ext
->start
; offset
<= ext
->end
; offset
++)
207 swap_free(swp_entry(swap
, offset
));
213 int swsusp_swap_in_use(void)
215 return (swsusp_extents
.rb_node
!= NULL
);
222 static unsigned short root_swap
= 0xffff;
223 static struct block_device
*hib_resume_bdev
;
225 struct hib_bio_batch
{
227 wait_queue_head_t wait
;
229 struct blk_plug plug
;
232 static void hib_init_batch(struct hib_bio_batch
*hb
)
234 atomic_set(&hb
->count
, 0);
235 init_waitqueue_head(&hb
->wait
);
236 hb
->error
= BLK_STS_OK
;
237 blk_start_plug(&hb
->plug
);
240 static void hib_finish_batch(struct hib_bio_batch
*hb
)
242 blk_finish_plug(&hb
->plug
);
245 static void hib_end_io(struct bio
*bio
)
247 struct hib_bio_batch
*hb
= bio
->bi_private
;
248 struct page
*page
= bio_first_page_all(bio
);
250 if (bio
->bi_status
) {
251 pr_alert("Read-error on swap-device (%u:%u:%Lu)\n",
252 MAJOR(bio_dev(bio
)), MINOR(bio_dev(bio
)),
253 (unsigned long long)bio
->bi_iter
.bi_sector
);
256 if (bio_data_dir(bio
) == WRITE
)
258 else if (clean_pages_on_read
)
259 flush_icache_range((unsigned long)page_address(page
),
260 (unsigned long)page_address(page
) + PAGE_SIZE
);
262 if (bio
->bi_status
&& !hb
->error
)
263 hb
->error
= bio
->bi_status
;
264 if (atomic_dec_and_test(&hb
->count
))
270 static int hib_submit_io(int op
, int op_flags
, pgoff_t page_off
, void *addr
,
271 struct hib_bio_batch
*hb
)
273 struct page
*page
= virt_to_page(addr
);
277 bio
= bio_alloc(GFP_NOIO
| __GFP_HIGH
, 1);
278 bio
->bi_iter
.bi_sector
= page_off
* (PAGE_SIZE
>> 9);
279 bio_set_dev(bio
, hib_resume_bdev
);
280 bio_set_op_attrs(bio
, op
, op_flags
);
282 if (bio_add_page(bio
, page
, PAGE_SIZE
, 0) < PAGE_SIZE
) {
283 pr_err("Adding page to bio failed at %llu\n",
284 (unsigned long long)bio
->bi_iter
.bi_sector
);
290 bio
->bi_end_io
= hib_end_io
;
291 bio
->bi_private
= hb
;
292 atomic_inc(&hb
->count
);
295 error
= submit_bio_wait(bio
);
302 static blk_status_t
hib_wait_io(struct hib_bio_batch
*hb
)
305 * We are relying on the behavior of blk_plug that a thread with
306 * a plug will flush the plug list before sleeping.
308 wait_event(hb
->wait
, atomic_read(&hb
->count
) == 0);
309 return blk_status_to_errno(hb
->error
);
316 static int mark_swapfiles(struct swap_map_handle
*handle
, unsigned int flags
)
320 hib_submit_io(REQ_OP_READ
, 0, swsusp_resume_block
,
321 swsusp_header
, NULL
);
322 if (!memcmp("SWAP-SPACE",swsusp_header
->sig
, 10) ||
323 !memcmp("SWAPSPACE2",swsusp_header
->sig
, 10)) {
324 memcpy(swsusp_header
->orig_sig
,swsusp_header
->sig
, 10);
325 memcpy(swsusp_header
->sig
, HIBERNATE_SIG
, 10);
326 swsusp_header
->image
= handle
->first_sector
;
327 swsusp_header
->flags
= flags
;
328 if (flags
& SF_CRC32_MODE
)
329 swsusp_header
->crc32
= handle
->crc32
;
330 error
= hib_submit_io(REQ_OP_WRITE
, REQ_SYNC
,
331 swsusp_resume_block
, swsusp_header
, NULL
);
333 pr_err("Swap header not found!\n");
340 * swsusp_swap_check - check if the resume device is a swap device
341 * and get its index (if so)
343 * This is called before saving image
345 static int swsusp_swap_check(void)
349 if (swsusp_resume_device
)
350 res
= swap_type_of(swsusp_resume_device
, swsusp_resume_block
);
352 res
= find_first_swap(&swsusp_resume_device
);
357 hib_resume_bdev
= blkdev_get_by_dev(swsusp_resume_device
, FMODE_WRITE
,
359 if (IS_ERR(hib_resume_bdev
))
360 return PTR_ERR(hib_resume_bdev
);
362 res
= set_blocksize(hib_resume_bdev
, PAGE_SIZE
);
364 blkdev_put(hib_resume_bdev
, FMODE_WRITE
);
370 * write_page - Write one page to given swap location.
371 * @buf: Address we're writing.
372 * @offset: Offset of the swap page we're writing to.
373 * @hb: bio completion batch
376 static int write_page(void *buf
, sector_t offset
, struct hib_bio_batch
*hb
)
385 src
= (void *)__get_free_page(GFP_NOIO
| __GFP_NOWARN
|
390 ret
= hib_wait_io(hb
); /* Free pages */
393 src
= (void *)__get_free_page(GFP_NOIO
|
400 hb
= NULL
; /* Go synchronous */
407 return hib_submit_io(REQ_OP_WRITE
, REQ_SYNC
, offset
, src
, hb
);
410 static void release_swap_writer(struct swap_map_handle
*handle
)
413 free_page((unsigned long)handle
->cur
);
417 static int get_swap_writer(struct swap_map_handle
*handle
)
421 ret
= swsusp_swap_check();
424 pr_err("Cannot find swap device, try swapon -a\n");
427 handle
->cur
= (struct swap_map_page
*)get_zeroed_page(GFP_KERNEL
);
432 handle
->cur_swap
= alloc_swapdev_block(root_swap
);
433 if (!handle
->cur_swap
) {
438 handle
->reqd_free_pages
= reqd_free_pages();
439 handle
->first_sector
= handle
->cur_swap
;
442 release_swap_writer(handle
);
444 swsusp_close(FMODE_WRITE
);
448 static int swap_write_page(struct swap_map_handle
*handle
, void *buf
,
449 struct hib_bio_batch
*hb
)
456 offset
= alloc_swapdev_block(root_swap
);
457 error
= write_page(buf
, offset
, hb
);
460 handle
->cur
->entries
[handle
->k
++] = offset
;
461 if (handle
->k
>= MAP_PAGE_ENTRIES
) {
462 offset
= alloc_swapdev_block(root_swap
);
465 handle
->cur
->next_swap
= offset
;
466 error
= write_page(handle
->cur
, handle
->cur_swap
, hb
);
469 clear_page(handle
->cur
);
470 handle
->cur_swap
= offset
;
473 if (hb
&& low_free_pages() <= handle
->reqd_free_pages
) {
474 error
= hib_wait_io(hb
);
478 * Recalculate the number of required free pages, to
479 * make sure we never take more than half.
481 handle
->reqd_free_pages
= reqd_free_pages();
488 static int flush_swap_writer(struct swap_map_handle
*handle
)
490 if (handle
->cur
&& handle
->cur_swap
)
491 return write_page(handle
->cur
, handle
->cur_swap
, NULL
);
496 static int swap_writer_finish(struct swap_map_handle
*handle
,
497 unsigned int flags
, int error
)
500 flush_swap_writer(handle
);
502 error
= mark_swapfiles(handle
, flags
);
507 free_all_swap_pages(root_swap
);
508 release_swap_writer(handle
);
509 swsusp_close(FMODE_WRITE
);
514 /* We need to remember how much compressed data we need to read. */
515 #define LZO_HEADER sizeof(size_t)
517 /* Number of pages/bytes we'll compress at one time. */
518 #define LZO_UNC_PAGES 32
519 #define LZO_UNC_SIZE (LZO_UNC_PAGES * PAGE_SIZE)
521 /* Number of pages/bytes we need for compressed data (worst case). */
522 #define LZO_CMP_PAGES DIV_ROUND_UP(lzo1x_worst_compress(LZO_UNC_SIZE) + \
523 LZO_HEADER, PAGE_SIZE)
524 #define LZO_CMP_SIZE (LZO_CMP_PAGES * PAGE_SIZE)
526 /* Maximum number of threads for compression/decompression. */
527 #define LZO_THREADS 3
529 /* Minimum/maximum number of pages for read buffering. */
530 #define LZO_MIN_RD_PAGES 1024
531 #define LZO_MAX_RD_PAGES 8192
535 * save_image - save the suspend image data
538 static int save_image(struct swap_map_handle
*handle
,
539 struct snapshot_handle
*snapshot
,
540 unsigned int nr_to_write
)
546 struct hib_bio_batch hb
;
552 pr_info("Saving image data pages (%u pages)...\n",
554 m
= nr_to_write
/ 10;
560 ret
= snapshot_read_next(snapshot
);
563 ret
= swap_write_page(handle
, data_of(*snapshot
), &hb
);
567 pr_info("Image saving progress: %3d%%\n",
571 err2
= hib_wait_io(&hb
);
572 hib_finish_batch(&hb
);
577 pr_info("Image saving done\n");
578 swsusp_show_speed(start
, stop
, nr_to_write
, "Wrote");
583 * Structure used for CRC32.
586 struct task_struct
*thr
; /* thread */
587 atomic_t ready
; /* ready to start flag */
588 atomic_t stop
; /* ready to stop flag */
589 unsigned run_threads
; /* nr current threads */
590 wait_queue_head_t go
; /* start crc update */
591 wait_queue_head_t done
; /* crc update done */
592 u32
*crc32
; /* points to handle's crc32 */
593 size_t *unc_len
[LZO_THREADS
]; /* uncompressed lengths */
594 unsigned char *unc
[LZO_THREADS
]; /* uncompressed data */
598 * CRC32 update function that runs in its own thread.
600 static int crc32_threadfn(void *data
)
602 struct crc_data
*d
= data
;
606 wait_event(d
->go
, atomic_read(&d
->ready
) ||
607 kthread_should_stop());
608 if (kthread_should_stop()) {
610 atomic_set(&d
->stop
, 1);
614 atomic_set(&d
->ready
, 0);
616 for (i
= 0; i
< d
->run_threads
; i
++)
617 *d
->crc32
= crc32_le(*d
->crc32
,
618 d
->unc
[i
], *d
->unc_len
[i
]);
619 atomic_set(&d
->stop
, 1);
625 * Structure used for LZO data compression.
628 struct task_struct
*thr
; /* thread */
629 atomic_t ready
; /* ready to start flag */
630 atomic_t stop
; /* ready to stop flag */
631 int ret
; /* return code */
632 wait_queue_head_t go
; /* start compression */
633 wait_queue_head_t done
; /* compression done */
634 size_t unc_len
; /* uncompressed length */
635 size_t cmp_len
; /* compressed length */
636 unsigned char unc
[LZO_UNC_SIZE
]; /* uncompressed buffer */
637 unsigned char cmp
[LZO_CMP_SIZE
]; /* compressed buffer */
638 unsigned char wrk
[LZO1X_1_MEM_COMPRESS
]; /* compression workspace */
642 * Compression function that runs in its own thread.
644 static int lzo_compress_threadfn(void *data
)
646 struct cmp_data
*d
= data
;
649 wait_event(d
->go
, atomic_read(&d
->ready
) ||
650 kthread_should_stop());
651 if (kthread_should_stop()) {
654 atomic_set(&d
->stop
, 1);
658 atomic_set(&d
->ready
, 0);
660 d
->ret
= lzo1x_1_compress(d
->unc
, d
->unc_len
,
661 d
->cmp
+ LZO_HEADER
, &d
->cmp_len
,
663 atomic_set(&d
->stop
, 1);
670 * save_image_lzo - Save the suspend image data compressed with LZO.
671 * @handle: Swap map handle to use for saving the image.
672 * @snapshot: Image to read data from.
673 * @nr_to_write: Number of pages to save.
675 static int save_image_lzo(struct swap_map_handle
*handle
,
676 struct snapshot_handle
*snapshot
,
677 unsigned int nr_to_write
)
683 struct hib_bio_batch hb
;
687 unsigned thr
, run_threads
, nr_threads
;
688 unsigned char *page
= NULL
;
689 struct cmp_data
*data
= NULL
;
690 struct crc_data
*crc
= NULL
;
695 * We'll limit the number of threads for compression to limit memory
698 nr_threads
= num_online_cpus() - 1;
699 nr_threads
= clamp_val(nr_threads
, 1, LZO_THREADS
);
701 page
= (void *)__get_free_page(GFP_NOIO
| __GFP_HIGH
);
703 pr_err("Failed to allocate LZO page\n");
708 data
= vmalloc(array_size(nr_threads
, sizeof(*data
)));
710 pr_err("Failed to allocate LZO data\n");
714 for (thr
= 0; thr
< nr_threads
; thr
++)
715 memset(&data
[thr
], 0, offsetof(struct cmp_data
, go
));
717 crc
= kmalloc(sizeof(*crc
), GFP_KERNEL
);
719 pr_err("Failed to allocate crc\n");
723 memset(crc
, 0, offsetof(struct crc_data
, go
));
726 * Start the compression threads.
728 for (thr
= 0; thr
< nr_threads
; thr
++) {
729 init_waitqueue_head(&data
[thr
].go
);
730 init_waitqueue_head(&data
[thr
].done
);
732 data
[thr
].thr
= kthread_run(lzo_compress_threadfn
,
734 "image_compress/%u", thr
);
735 if (IS_ERR(data
[thr
].thr
)) {
736 data
[thr
].thr
= NULL
;
737 pr_err("Cannot start compression threads\n");
744 * Start the CRC32 thread.
746 init_waitqueue_head(&crc
->go
);
747 init_waitqueue_head(&crc
->done
);
750 crc
->crc32
= &handle
->crc32
;
751 for (thr
= 0; thr
< nr_threads
; thr
++) {
752 crc
->unc
[thr
] = data
[thr
].unc
;
753 crc
->unc_len
[thr
] = &data
[thr
].unc_len
;
756 crc
->thr
= kthread_run(crc32_threadfn
, crc
, "image_crc32");
757 if (IS_ERR(crc
->thr
)) {
759 pr_err("Cannot start CRC32 thread\n");
765 * Adjust the number of required free pages after all allocations have
766 * been done. We don't want to run out of pages when writing.
768 handle
->reqd_free_pages
= reqd_free_pages();
770 pr_info("Using %u thread(s) for compression\n", nr_threads
);
771 pr_info("Compressing and saving image data (%u pages)...\n",
773 m
= nr_to_write
/ 10;
779 for (thr
= 0; thr
< nr_threads
; thr
++) {
780 for (off
= 0; off
< LZO_UNC_SIZE
; off
+= PAGE_SIZE
) {
781 ret
= snapshot_read_next(snapshot
);
788 memcpy(data
[thr
].unc
+ off
,
789 data_of(*snapshot
), PAGE_SIZE
);
792 pr_info("Image saving progress: %3d%%\n",
799 data
[thr
].unc_len
= off
;
801 atomic_set(&data
[thr
].ready
, 1);
802 wake_up(&data
[thr
].go
);
808 crc
->run_threads
= thr
;
809 atomic_set(&crc
->ready
, 1);
812 for (run_threads
= thr
, thr
= 0; thr
< run_threads
; thr
++) {
813 wait_event(data
[thr
].done
,
814 atomic_read(&data
[thr
].stop
));
815 atomic_set(&data
[thr
].stop
, 0);
820 pr_err("LZO compression failed\n");
824 if (unlikely(!data
[thr
].cmp_len
||
826 lzo1x_worst_compress(data
[thr
].unc_len
))) {
827 pr_err("Invalid LZO compressed length\n");
832 *(size_t *)data
[thr
].cmp
= data
[thr
].cmp_len
;
835 * Given we are writing one page at a time to disk, we
836 * copy that much from the buffer, although the last
837 * bit will likely be smaller than full page. This is
838 * OK - we saved the length of the compressed data, so
839 * any garbage at the end will be discarded when we
843 off
< LZO_HEADER
+ data
[thr
].cmp_len
;
845 memcpy(page
, data
[thr
].cmp
+ off
, PAGE_SIZE
);
847 ret
= swap_write_page(handle
, page
, &hb
);
853 wait_event(crc
->done
, atomic_read(&crc
->stop
));
854 atomic_set(&crc
->stop
, 0);
858 err2
= hib_wait_io(&hb
);
863 pr_info("Image saving done\n");
864 swsusp_show_speed(start
, stop
, nr_to_write
, "Wrote");
866 hib_finish_batch(&hb
);
869 kthread_stop(crc
->thr
);
873 for (thr
= 0; thr
< nr_threads
; thr
++)
875 kthread_stop(data
[thr
].thr
);
878 if (page
) free_page((unsigned long)page
);
884 * enough_swap - Make sure we have enough swap to save the image.
886 * Returns TRUE or FALSE after checking the total amount of swap
887 * space avaiable from the resume partition.
890 static int enough_swap(unsigned int nr_pages
)
892 unsigned int free_swap
= count_swap_pages(root_swap
, 1);
893 unsigned int required
;
895 pr_debug("Free swap pages: %u\n", free_swap
);
897 required
= PAGES_FOR_IO
+ nr_pages
;
898 return free_swap
> required
;
902 * swsusp_write - Write entire image and metadata.
903 * @flags: flags to pass to the "boot" kernel in the image header
905 * It is important _NOT_ to umount filesystems at this point. We want
906 * them synced (in case something goes wrong) but we DO not want to mark
907 * filesystem clean: it is not. (And it does not matter, if we resume
908 * correctly, we'll mark system clean, anyway.)
911 int swsusp_write(unsigned int flags
)
913 struct swap_map_handle handle
;
914 struct snapshot_handle snapshot
;
915 struct swsusp_info
*header
;
919 pages
= snapshot_get_image_size();
920 error
= get_swap_writer(&handle
);
922 pr_err("Cannot get swap writer\n");
925 if (flags
& SF_NOCOMPRESS_MODE
) {
926 if (!enough_swap(pages
)) {
927 pr_err("Not enough free swap\n");
932 memset(&snapshot
, 0, sizeof(struct snapshot_handle
));
933 error
= snapshot_read_next(&snapshot
);
934 if (error
< (int)PAGE_SIZE
) {
940 header
= (struct swsusp_info
*)data_of(snapshot
);
941 error
= swap_write_page(&handle
, header
, NULL
);
943 error
= (flags
& SF_NOCOMPRESS_MODE
) ?
944 save_image(&handle
, &snapshot
, pages
- 1) :
945 save_image_lzo(&handle
, &snapshot
, pages
- 1);
948 error
= swap_writer_finish(&handle
, flags
, error
);
953 * The following functions allow us to read data using a swap map
954 * in a file-alike way
957 static void release_swap_reader(struct swap_map_handle
*handle
)
959 struct swap_map_page_list
*tmp
;
961 while (handle
->maps
) {
962 if (handle
->maps
->map
)
963 free_page((unsigned long)handle
->maps
->map
);
965 handle
->maps
= handle
->maps
->next
;
971 static int get_swap_reader(struct swap_map_handle
*handle
,
972 unsigned int *flags_p
)
975 struct swap_map_page_list
*tmp
, *last
;
978 *flags_p
= swsusp_header
->flags
;
980 if (!swsusp_header
->image
) /* how can this happen? */
984 last
= handle
->maps
= NULL
;
985 offset
= swsusp_header
->image
;
987 tmp
= kzalloc(sizeof(*handle
->maps
), GFP_KERNEL
);
989 release_swap_reader(handle
);
998 tmp
->map
= (struct swap_map_page
*)
999 __get_free_page(GFP_NOIO
| __GFP_HIGH
);
1001 release_swap_reader(handle
);
1005 error
= hib_submit_io(REQ_OP_READ
, 0, offset
, tmp
->map
, NULL
);
1007 release_swap_reader(handle
);
1010 offset
= tmp
->map
->next_swap
;
1013 handle
->cur
= handle
->maps
->map
;
1017 static int swap_read_page(struct swap_map_handle
*handle
, void *buf
,
1018 struct hib_bio_batch
*hb
)
1022 struct swap_map_page_list
*tmp
;
1026 offset
= handle
->cur
->entries
[handle
->k
];
1029 error
= hib_submit_io(REQ_OP_READ
, 0, offset
, buf
, hb
);
1032 if (++handle
->k
>= MAP_PAGE_ENTRIES
) {
1034 free_page((unsigned long)handle
->maps
->map
);
1036 handle
->maps
= handle
->maps
->next
;
1039 release_swap_reader(handle
);
1041 handle
->cur
= handle
->maps
->map
;
1046 static int swap_reader_finish(struct swap_map_handle
*handle
)
1048 release_swap_reader(handle
);
1054 * load_image - load the image using the swap map handle
1055 * @handle and the snapshot handle @snapshot
1056 * (assume there are @nr_pages pages to load)
1059 static int load_image(struct swap_map_handle
*handle
,
1060 struct snapshot_handle
*snapshot
,
1061 unsigned int nr_to_read
)
1067 struct hib_bio_batch hb
;
1071 hib_init_batch(&hb
);
1073 clean_pages_on_read
= true;
1074 pr_info("Loading image data pages (%u pages)...\n", nr_to_read
);
1075 m
= nr_to_read
/ 10;
1079 start
= ktime_get();
1081 ret
= snapshot_write_next(snapshot
);
1084 ret
= swap_read_page(handle
, data_of(*snapshot
), &hb
);
1087 if (snapshot
->sync_read
)
1088 ret
= hib_wait_io(&hb
);
1091 if (!(nr_pages
% m
))
1092 pr_info("Image loading progress: %3d%%\n",
1096 err2
= hib_wait_io(&hb
);
1097 hib_finish_batch(&hb
);
1102 pr_info("Image loading done\n");
1103 snapshot_write_finalize(snapshot
);
1104 if (!snapshot_image_loaded(snapshot
))
1107 swsusp_show_speed(start
, stop
, nr_to_read
, "Read");
1112 * Structure used for LZO data decompression.
1115 struct task_struct
*thr
; /* thread */
1116 atomic_t ready
; /* ready to start flag */
1117 atomic_t stop
; /* ready to stop flag */
1118 int ret
; /* return code */
1119 wait_queue_head_t go
; /* start decompression */
1120 wait_queue_head_t done
; /* decompression done */
1121 size_t unc_len
; /* uncompressed length */
1122 size_t cmp_len
; /* compressed length */
1123 unsigned char unc
[LZO_UNC_SIZE
]; /* uncompressed buffer */
1124 unsigned char cmp
[LZO_CMP_SIZE
]; /* compressed buffer */
1128 * Deompression function that runs in its own thread.
1130 static int lzo_decompress_threadfn(void *data
)
1132 struct dec_data
*d
= data
;
1135 wait_event(d
->go
, atomic_read(&d
->ready
) ||
1136 kthread_should_stop());
1137 if (kthread_should_stop()) {
1140 atomic_set(&d
->stop
, 1);
1144 atomic_set(&d
->ready
, 0);
1146 d
->unc_len
= LZO_UNC_SIZE
;
1147 d
->ret
= lzo1x_decompress_safe(d
->cmp
+ LZO_HEADER
, d
->cmp_len
,
1148 d
->unc
, &d
->unc_len
);
1149 if (clean_pages_on_decompress
)
1150 flush_icache_range((unsigned long)d
->unc
,
1151 (unsigned long)d
->unc
+ d
->unc_len
);
1153 atomic_set(&d
->stop
, 1);
1160 * load_image_lzo - Load compressed image data and decompress them with LZO.
1161 * @handle: Swap map handle to use for loading data.
1162 * @snapshot: Image to copy uncompressed data into.
1163 * @nr_to_read: Number of pages to load.
1165 static int load_image_lzo(struct swap_map_handle
*handle
,
1166 struct snapshot_handle
*snapshot
,
1167 unsigned int nr_to_read
)
1172 struct hib_bio_batch hb
;
1177 unsigned i
, thr
, run_threads
, nr_threads
;
1178 unsigned ring
= 0, pg
= 0, ring_size
= 0,
1179 have
= 0, want
, need
, asked
= 0;
1180 unsigned long read_pages
= 0;
1181 unsigned char **page
= NULL
;
1182 struct dec_data
*data
= NULL
;
1183 struct crc_data
*crc
= NULL
;
1185 hib_init_batch(&hb
);
1188 * We'll limit the number of threads for decompression to limit memory
1191 nr_threads
= num_online_cpus() - 1;
1192 nr_threads
= clamp_val(nr_threads
, 1, LZO_THREADS
);
1194 page
= vmalloc(array_size(LZO_MAX_RD_PAGES
, sizeof(*page
)));
1196 pr_err("Failed to allocate LZO page\n");
1201 data
= vmalloc(array_size(nr_threads
, sizeof(*data
)));
1203 pr_err("Failed to allocate LZO data\n");
1207 for (thr
= 0; thr
< nr_threads
; thr
++)
1208 memset(&data
[thr
], 0, offsetof(struct dec_data
, go
));
1210 crc
= kmalloc(sizeof(*crc
), GFP_KERNEL
);
1212 pr_err("Failed to allocate crc\n");
1216 memset(crc
, 0, offsetof(struct crc_data
, go
));
1218 clean_pages_on_decompress
= true;
1221 * Start the decompression threads.
1223 for (thr
= 0; thr
< nr_threads
; thr
++) {
1224 init_waitqueue_head(&data
[thr
].go
);
1225 init_waitqueue_head(&data
[thr
].done
);
1227 data
[thr
].thr
= kthread_run(lzo_decompress_threadfn
,
1229 "image_decompress/%u", thr
);
1230 if (IS_ERR(data
[thr
].thr
)) {
1231 data
[thr
].thr
= NULL
;
1232 pr_err("Cannot start decompression threads\n");
1239 * Start the CRC32 thread.
1241 init_waitqueue_head(&crc
->go
);
1242 init_waitqueue_head(&crc
->done
);
1245 crc
->crc32
= &handle
->crc32
;
1246 for (thr
= 0; thr
< nr_threads
; thr
++) {
1247 crc
->unc
[thr
] = data
[thr
].unc
;
1248 crc
->unc_len
[thr
] = &data
[thr
].unc_len
;
1251 crc
->thr
= kthread_run(crc32_threadfn
, crc
, "image_crc32");
1252 if (IS_ERR(crc
->thr
)) {
1254 pr_err("Cannot start CRC32 thread\n");
1260 * Set the number of pages for read buffering.
1261 * This is complete guesswork, because we'll only know the real
1262 * picture once prepare_image() is called, which is much later on
1263 * during the image load phase. We'll assume the worst case and
1264 * say that none of the image pages are from high memory.
1266 if (low_free_pages() > snapshot_get_image_size())
1267 read_pages
= (low_free_pages() - snapshot_get_image_size()) / 2;
1268 read_pages
= clamp_val(read_pages
, LZO_MIN_RD_PAGES
, LZO_MAX_RD_PAGES
);
1270 for (i
= 0; i
< read_pages
; i
++) {
1271 page
[i
] = (void *)__get_free_page(i
< LZO_CMP_PAGES
?
1272 GFP_NOIO
| __GFP_HIGH
:
1273 GFP_NOIO
| __GFP_NOWARN
|
1277 if (i
< LZO_CMP_PAGES
) {
1279 pr_err("Failed to allocate LZO pages\n");
1287 want
= ring_size
= i
;
1289 pr_info("Using %u thread(s) for decompression\n", nr_threads
);
1290 pr_info("Loading and decompressing image data (%u pages)...\n",
1292 m
= nr_to_read
/ 10;
1296 start
= ktime_get();
1298 ret
= snapshot_write_next(snapshot
);
1303 for (i
= 0; !eof
&& i
< want
; i
++) {
1304 ret
= swap_read_page(handle
, page
[ring
], &hb
);
1307 * On real read error, finish. On end of data,
1308 * set EOF flag and just exit the read loop.
1311 handle
->cur
->entries
[handle
->k
]) {
1318 if (++ring
>= ring_size
)
1325 * We are out of data, wait for some more.
1331 ret
= hib_wait_io(&hb
);
1340 if (crc
->run_threads
) {
1341 wait_event(crc
->done
, atomic_read(&crc
->stop
));
1342 atomic_set(&crc
->stop
, 0);
1343 crc
->run_threads
= 0;
1346 for (thr
= 0; have
&& thr
< nr_threads
; thr
++) {
1347 data
[thr
].cmp_len
= *(size_t *)page
[pg
];
1348 if (unlikely(!data
[thr
].cmp_len
||
1350 lzo1x_worst_compress(LZO_UNC_SIZE
))) {
1351 pr_err("Invalid LZO compressed length\n");
1356 need
= DIV_ROUND_UP(data
[thr
].cmp_len
+ LZO_HEADER
,
1367 off
< LZO_HEADER
+ data
[thr
].cmp_len
;
1369 memcpy(data
[thr
].cmp
+ off
,
1370 page
[pg
], PAGE_SIZE
);
1373 if (++pg
>= ring_size
)
1377 atomic_set(&data
[thr
].ready
, 1);
1378 wake_up(&data
[thr
].go
);
1382 * Wait for more data while we are decompressing.
1384 if (have
< LZO_CMP_PAGES
&& asked
) {
1385 ret
= hib_wait_io(&hb
);
1394 for (run_threads
= thr
, thr
= 0; thr
< run_threads
; thr
++) {
1395 wait_event(data
[thr
].done
,
1396 atomic_read(&data
[thr
].stop
));
1397 atomic_set(&data
[thr
].stop
, 0);
1399 ret
= data
[thr
].ret
;
1402 pr_err("LZO decompression failed\n");
1406 if (unlikely(!data
[thr
].unc_len
||
1407 data
[thr
].unc_len
> LZO_UNC_SIZE
||
1408 data
[thr
].unc_len
& (PAGE_SIZE
- 1))) {
1409 pr_err("Invalid LZO uncompressed length\n");
1415 off
< data
[thr
].unc_len
; off
+= PAGE_SIZE
) {
1416 memcpy(data_of(*snapshot
),
1417 data
[thr
].unc
+ off
, PAGE_SIZE
);
1419 if (!(nr_pages
% m
))
1420 pr_info("Image loading progress: %3d%%\n",
1424 ret
= snapshot_write_next(snapshot
);
1426 crc
->run_threads
= thr
+ 1;
1427 atomic_set(&crc
->ready
, 1);
1434 crc
->run_threads
= thr
;
1435 atomic_set(&crc
->ready
, 1);
1440 if (crc
->run_threads
) {
1441 wait_event(crc
->done
, atomic_read(&crc
->stop
));
1442 atomic_set(&crc
->stop
, 0);
1446 pr_info("Image loading done\n");
1447 snapshot_write_finalize(snapshot
);
1448 if (!snapshot_image_loaded(snapshot
))
1451 if (swsusp_header
->flags
& SF_CRC32_MODE
) {
1452 if(handle
->crc32
!= swsusp_header
->crc32
) {
1453 pr_err("Invalid image CRC32!\n");
1459 swsusp_show_speed(start
, stop
, nr_to_read
, "Read");
1461 hib_finish_batch(&hb
);
1462 for (i
= 0; i
< ring_size
; i
++)
1463 free_page((unsigned long)page
[i
]);
1466 kthread_stop(crc
->thr
);
1470 for (thr
= 0; thr
< nr_threads
; thr
++)
1472 kthread_stop(data
[thr
].thr
);
1481 * swsusp_read - read the hibernation image.
1482 * @flags_p: flags passed by the "frozen" kernel in the image header should
1483 * be written into this memory location
1486 int swsusp_read(unsigned int *flags_p
)
1489 struct swap_map_handle handle
;
1490 struct snapshot_handle snapshot
;
1491 struct swsusp_info
*header
;
1493 memset(&snapshot
, 0, sizeof(struct snapshot_handle
));
1494 error
= snapshot_write_next(&snapshot
);
1495 if (error
< (int)PAGE_SIZE
)
1496 return error
< 0 ? error
: -EFAULT
;
1497 header
= (struct swsusp_info
*)data_of(snapshot
);
1498 error
= get_swap_reader(&handle
, flags_p
);
1502 error
= swap_read_page(&handle
, header
, NULL
);
1504 error
= (*flags_p
& SF_NOCOMPRESS_MODE
) ?
1505 load_image(&handle
, &snapshot
, header
->pages
- 1) :
1506 load_image_lzo(&handle
, &snapshot
, header
->pages
- 1);
1508 swap_reader_finish(&handle
);
1511 pr_debug("Image successfully loaded\n");
1513 pr_debug("Error %d resuming\n", error
);
1518 * swsusp_check - Check for swsusp signature in the resume device
1521 int swsusp_check(void)
1525 hib_resume_bdev
= blkdev_get_by_dev(swsusp_resume_device
,
1527 if (!IS_ERR(hib_resume_bdev
)) {
1528 set_blocksize(hib_resume_bdev
, PAGE_SIZE
);
1529 clear_page(swsusp_header
);
1530 error
= hib_submit_io(REQ_OP_READ
, 0,
1531 swsusp_resume_block
,
1532 swsusp_header
, NULL
);
1536 if (!memcmp(HIBERNATE_SIG
, swsusp_header
->sig
, 10)) {
1537 memcpy(swsusp_header
->sig
, swsusp_header
->orig_sig
, 10);
1538 /* Reset swap signature now */
1539 error
= hib_submit_io(REQ_OP_WRITE
, REQ_SYNC
,
1540 swsusp_resume_block
,
1541 swsusp_header
, NULL
);
1548 blkdev_put(hib_resume_bdev
, FMODE_READ
);
1550 pr_debug("Image signature found, resuming\n");
1552 error
= PTR_ERR(hib_resume_bdev
);
1556 pr_debug("Image not found (code %d)\n", error
);
1562 * swsusp_close - close swap device.
1565 void swsusp_close(fmode_t mode
)
1567 if (IS_ERR(hib_resume_bdev
)) {
1568 pr_debug("Image device not initialised\n");
1572 blkdev_put(hib_resume_bdev
, mode
);
1576 * swsusp_unmark - Unmark swsusp signature in the resume device
1579 #ifdef CONFIG_SUSPEND
1580 int swsusp_unmark(void)
1584 hib_submit_io(REQ_OP_READ
, 0, swsusp_resume_block
,
1585 swsusp_header
, NULL
);
1586 if (!memcmp(HIBERNATE_SIG
,swsusp_header
->sig
, 10)) {
1587 memcpy(swsusp_header
->sig
,swsusp_header
->orig_sig
, 10);
1588 error
= hib_submit_io(REQ_OP_WRITE
, REQ_SYNC
,
1589 swsusp_resume_block
,
1590 swsusp_header
, NULL
);
1592 pr_err("Cannot find swsusp signature!\n");
1597 * We just returned from suspend, we don't need the image any more.
1599 free_all_swap_pages(root_swap
);
1605 static int __init
swsusp_header_init(void)
1607 swsusp_header
= (struct swsusp_header
*) __get_free_page(GFP_KERNEL
);
1609 panic("Could not allocate memory for swsusp_header\n");
1613 core_initcall(swsusp_header_init
);