Merge tag 'x86-asm-2024-03-11' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip
[linux-2.6-block.git] / kernel / power / swap.c
CommitLineData
55716d26 1// SPDX-License-Identifier: GPL-2.0-only
61159a31
RW
2/*
3 * linux/kernel/power/swap.c
4 *
5 * This file provides functions for reading the suspend image from
6 * and writing it to a swap partition.
7 *
a2531293 8 * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@ucw.cz>
61159a31 9 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
5a21d489 10 * Copyright (C) 2010-2012 Bojan Smojver <bojan@rexursive.com>
61159a31
RW
11 */
12
64ec72a1
JP
13#define pr_fmt(fmt) "PM: " fmt
14
61159a31 15#include <linux/module.h>
61159a31 16#include <linux/file.h>
61159a31
RW
17#include <linux/delay.h>
18#include <linux/bitops.h>
61159a31 19#include <linux/device.h>
61159a31 20#include <linux/bio.h>
546e0d27 21#include <linux/blkdev.h>
61159a31
RW
22#include <linux/swap.h>
23#include <linux/swapops.h>
24#include <linux/pm.h>
5a0e3ad6 25#include <linux/slab.h>
f996fc96
BS
26#include <linux/lzo.h>
27#include <linux/vmalloc.h>
081a9d04
BS
28#include <linux/cpumask.h>
29#include <linux/atomic.h>
30#include <linux/kthread.h>
31#include <linux/crc32.h>
db597605 32#include <linux/ktime.h>
61159a31
RW
33
34#include "power.h"
35
be8cd644 36#define HIBERNATE_SIG "S1SUSPEND"
61159a31 37
74d95555
DW
38u32 swsusp_hardware_signature;
39
f6cf0545
JM
40/*
41 * When reading an {un,}compressed image, we may restore pages in place,
42 * in which case some architectures need these pages cleaning before they
43 * can be executed. We don't know which pages these may be, so clean the lot.
44 */
45static bool clean_pages_on_read;
46static bool clean_pages_on_decompress;
47
51fb352b
JS
48/*
49 * The swap map is a data structure used for keeping track of each page
50 * written to a swap partition. It consists of many swap_map_page
90133673 51 * structures, each of which contains an array of MAP_PAGE_ENTRIES swap entries.
51fb352b
JS
52 * These structures are stored on the swap and linked together with the
53 * help of the .next_swap member.
54 *
55 * The swap map is created during suspend. The swap map pages are
56 * allocated and populated one at a time, so we only need one memory
57 * page to set up the entire structure.
58 *
081a9d04 59 * During resume we pick up all swap_map_page structures into a list.
51fb352b
JS
60 */
61
62#define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(sector_t) - 1)
63
f8262d47
BS
/*
 * Count the free pages that are not highmem pages: all free pages minus
 * the free highmem pages.
 */
static inline unsigned long low_free_pages(void)
{
	unsigned long all_free = nr_free_pages();
	unsigned long high_free = nr_free_highpages();

	return all_free - high_free;
}
71
/*
 * Number of pages that must stay free while the image is being written.
 * This is half of the low free pages available at the time of the call.
 */
static inline unsigned long reqd_free_pages(void)
{
	unsigned long low = low_free_pages();

	return low / 2;
}
80
51fb352b
JS
81struct swap_map_page {
82 sector_t entries[MAP_PAGE_ENTRIES];
83 sector_t next_swap;
84};
85
081a9d04
BS
/* Node of the in-memory, singly linked list of swap map pages. */
struct swap_map_page_list {
	struct swap_map_page *map;		/* the map page held by this node */
	struct swap_map_page_list *next;	/* following node in the list */
};
90
444e1154 91/*
51fb352b
JS
92 * The swap_map_handle structure is used for handling swap in
93 * a file-alike way
94 */
95
96struct swap_map_handle {
97 struct swap_map_page *cur;
081a9d04 98 struct swap_map_page_list *maps;
51fb352b
JS
99 sector_t cur_swap;
100 sector_t first_sector;
101 unsigned int k;
f8262d47 102 unsigned long reqd_free_pages;
081a9d04 103 u32 crc32;
51fb352b
JS
104};
105
1b29c164 106struct swsusp_header {
081a9d04 107 char reserved[PAGE_SIZE - 20 - sizeof(sector_t) - sizeof(int) -
74d95555
DW
108 sizeof(u32) - sizeof(u32)];
109 u32 hw_sig;
081a9d04 110 u32 crc32;
3aef83e0 111 sector_t image;
a634cc10 112 unsigned int flags; /* Flags to pass to the "boot" kernel */
61159a31
RW
113 char orig_sig[10];
114 char sig[10];
52f5684c 115} __packed;
1b29c164
VG
116
117static struct swsusp_header *swsusp_header;
61159a31 118
444e1154 119/*
0414f2ec
NC
120 * The following functions are used for tracing the allocated
121 * swap pages, so that they can be freed in case of an error.
122 */
123
124struct swsusp_extent {
125 struct rb_node node;
126 unsigned long start;
127 unsigned long end;
128};
129
130static struct rb_root swsusp_extents = RB_ROOT;
131
132static int swsusp_extents_insert(unsigned long swap_offset)
133{
134 struct rb_node **new = &(swsusp_extents.rb_node);
135 struct rb_node *parent = NULL;
136 struct swsusp_extent *ext;
137
138 /* Figure out where to put the new node */
139 while (*new) {
8316bd72 140 ext = rb_entry(*new, struct swsusp_extent, node);
0414f2ec
NC
141 parent = *new;
142 if (swap_offset < ext->start) {
143 /* Try to merge */
144 if (swap_offset == ext->start - 1) {
145 ext->start--;
146 return 0;
147 }
148 new = &((*new)->rb_left);
149 } else if (swap_offset > ext->end) {
150 /* Try to merge */
151 if (swap_offset == ext->end + 1) {
152 ext->end++;
153 return 0;
154 }
155 new = &((*new)->rb_right);
156 } else {
157 /* It already is in the tree */
158 return -EINVAL;
159 }
160 }
161 /* Add the new node and rebalance the tree. */
162 ext = kzalloc(sizeof(struct swsusp_extent), GFP_KERNEL);
163 if (!ext)
164 return -ENOMEM;
165
166 ext->start = swap_offset;
167 ext->end = swap_offset;
168 rb_link_node(&ext->node, parent, new);
169 rb_insert_color(&ext->node, &swsusp_extents);
170 return 0;
171}
172
444e1154 173/*
0414f2ec
NC
174 * alloc_swapdev_block - allocate a swap page and register that it has
175 * been allocated, so that it can be freed in case of an error.
176 */
177
178sector_t alloc_swapdev_block(int swap)
179{
180 unsigned long offset;
181
910321ea 182 offset = swp_offset(get_swap_page_of_type(swap));
0414f2ec
NC
183 if (offset) {
184 if (swsusp_extents_insert(offset))
910321ea 185 swap_free(swp_entry(swap, offset));
0414f2ec
NC
186 else
187 return swapdev_block(swap, offset);
188 }
189 return 0;
190}
191
444e1154 192/*
0414f2ec 193 * free_all_swap_pages - free swap pages allocated for saving image data.
90133673 194 * It also frees the extents used to register which swap entries had been
0414f2ec
NC
195 * allocated.
196 */
197
198void free_all_swap_pages(int swap)
199{
200 struct rb_node *node;
201
202 while ((node = swsusp_extents.rb_node)) {
203 struct swsusp_extent *ext;
204 unsigned long offset;
205
47087eeb 206 ext = rb_entry(node, struct swsusp_extent, node);
0414f2ec
NC
207 rb_erase(node, &swsusp_extents);
208 for (offset = ext->start; offset <= ext->end; offset++)
910321ea 209 swap_free(swp_entry(swap, offset));
0414f2ec
NC
210
211 kfree(ext);
212 }
213}
214
215int swsusp_swap_in_use(void)
216{
217 return (swsusp_extents.rb_node != NULL);
218}
219
61159a31 220/*
3fc6b34f 221 * General things
61159a31
RW
222 */
223
224static unsigned short root_swap = 0xffff;
4379f911 225static struct file *hib_resume_bdev_file;
343df3c7
CH
226
227struct hib_bio_batch {
228 atomic_t count;
229 wait_queue_head_t wait;
4e4cbee9 230 blk_status_t error;
55c4478a 231 struct blk_plug plug;
343df3c7
CH
232};
233
234static void hib_init_batch(struct hib_bio_batch *hb)
235{
236 atomic_set(&hb->count, 0);
237 init_waitqueue_head(&hb->wait);
4e4cbee9 238 hb->error = BLK_STS_OK;
55c4478a
XC
239 blk_start_plug(&hb->plug);
240}
241
242static void hib_finish_batch(struct hib_bio_batch *hb)
243{
244 blk_finish_plug(&hb->plug);
343df3c7
CH
245}
246
4246a0b6 247static void hib_end_io(struct bio *bio)
343df3c7
CH
248{
249 struct hib_bio_batch *hb = bio->bi_private;
263663cd 250 struct page *page = bio_first_page_all(bio);
343df3c7 251
4e4cbee9 252 if (bio->bi_status) {
64ec72a1
JP
253 pr_alert("Read-error on swap-device (%u:%u:%Lu)\n",
254 MAJOR(bio_dev(bio)), MINOR(bio_dev(bio)),
255 (unsigned long long)bio->bi_iter.bi_sector);
343df3c7
CH
256 }
257
258 if (bio_data_dir(bio) == WRITE)
259 put_page(page);
f6cf0545
JM
260 else if (clean_pages_on_read)
261 flush_icache_range((unsigned long)page_address(page),
262 (unsigned long)page_address(page) + PAGE_SIZE);
343df3c7 263
4e4cbee9
CH
264 if (bio->bi_status && !hb->error)
265 hb->error = bio->bi_status;
343df3c7
CH
266 if (atomic_dec_and_test(&hb->count))
267 wake_up(&hb->wait);
268
269 bio_put(bio);
270}
271
568e34ed
BVA
272static int hib_submit_io(blk_opf_t opf, pgoff_t page_off, void *addr,
273 struct hib_bio_batch *hb)
343df3c7
CH
274{
275 struct page *page = virt_to_page(addr);
276 struct bio *bio;
277 int error = 0;
278
4379f911 279 bio = bio_alloc(file_bdev(hib_resume_bdev_file), 1, opf,
e017d304 280 GFP_NOIO | __GFP_HIGH);
343df3c7 281 bio->bi_iter.bi_sector = page_off * (PAGE_SIZE >> 9);
343df3c7
CH
282
283 if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
64ec72a1
JP
284 pr_err("Adding page to bio failed at %llu\n",
285 (unsigned long long)bio->bi_iter.bi_sector);
343df3c7
CH
286 bio_put(bio);
287 return -EFAULT;
288 }
289
290 if (hb) {
291 bio->bi_end_io = hib_end_io;
292 bio->bi_private = hb;
293 atomic_inc(&hb->count);
4e49ea4a 294 submit_bio(bio);
343df3c7 295 } else {
4e49ea4a 296 error = submit_bio_wait(bio);
343df3c7
CH
297 bio_put(bio);
298 }
299
300 return error;
301}
302
01de5fcd 303static int hib_wait_io(struct hib_bio_batch *hb)
343df3c7 304{
55c4478a
XC
305 /*
306 * We are relying on the behavior of blk_plug that a thread with
307 * a plug will flush the plug list before sleeping.
308 */
343df3c7 309 wait_event(hb->wait, atomic_read(&hb->count) == 0);
01de5fcd 310 return blk_status_to_errno(hb->error);
343df3c7 311}
3fc6b34f 312
3fc6b34f
RW
313/*
314 * Saving part
315 */
51fb352b 316static int mark_swapfiles(struct swap_map_handle *handle, unsigned int flags)
61159a31
RW
317{
318 int error;
319
568e34ed 320 hib_submit_io(REQ_OP_READ, swsusp_resume_block, swsusp_header, NULL);
1b29c164
VG
321 if (!memcmp("SWAP-SPACE",swsusp_header->sig, 10) ||
322 !memcmp("SWAPSPACE2",swsusp_header->sig, 10)) {
323 memcpy(swsusp_header->orig_sig,swsusp_header->sig, 10);
3624eb04 324 memcpy(swsusp_header->sig, HIBERNATE_SIG, 10);
51fb352b 325 swsusp_header->image = handle->first_sector;
74d95555
DW
326 if (swsusp_hardware_signature) {
327 swsusp_header->hw_sig = swsusp_hardware_signature;
328 flags |= SF_HW_SIG;
329 }
a634cc10 330 swsusp_header->flags = flags;
081a9d04
BS
331 if (flags & SF_CRC32_MODE)
332 swsusp_header->crc32 = handle->crc32;
568e34ed 333 error = hib_submit_io(REQ_OP_WRITE | REQ_SYNC,
162b99e3 334 swsusp_resume_block, swsusp_header, NULL);
61159a31 335 } else {
64ec72a1 336 pr_err("Swap header not found!\n");
61159a31
RW
337 error = -ENODEV;
338 }
339 return error;
340}
341
342/**
343 * swsusp_swap_check - check if the resume device is a swap device
344 * and get its index (if so)
6f612af5
JS
345 *
346 * This is called before saving image
61159a31 347 */
6f612af5 348static int swsusp_swap_check(void)
61159a31 349{
3aef83e0
RW
350 int res;
351
21bd9005
CH
352 if (swsusp_resume_device)
353 res = swap_type_of(swsusp_resume_device, swsusp_resume_block);
354 else
355 res = find_first_swap(&swsusp_resume_device);
3aef83e0
RW
356 if (res < 0)
357 return res;
3aef83e0 358 root_swap = res;
21bd9005 359
4379f911 360 hib_resume_bdev_file = bdev_file_open_by_dev(swsusp_resume_device,
05bdb996 361 BLK_OPEN_WRITE, NULL, NULL);
4379f911
CB
362 if (IS_ERR(hib_resume_bdev_file))
363 return PTR_ERR(hib_resume_bdev_file);
3aef83e0 364
4379f911 365 res = set_blocksize(file_bdev(hib_resume_bdev_file), PAGE_SIZE);
3aef83e0 366 if (res < 0)
4379f911 367 fput(hib_resume_bdev_file);
61159a31 368
61159a31
RW
369 return res;
370}
371
372/**
373 * write_page - Write one page to given swap location.
374 * @buf: Address we're writing.
375 * @offset: Offset of the swap page we're writing to.
343df3c7 376 * @hb: bio completion batch
61159a31
RW
377 */
378
343df3c7 379static int write_page(void *buf, sector_t offset, struct hib_bio_batch *hb)
61159a31 380{
3aef83e0 381 void *src;
081a9d04 382 int ret;
3aef83e0
RW
383
384 if (!offset)
385 return -ENOSPC;
386
343df3c7 387 if (hb) {
0eb0b63c 388 src = (void *)__get_free_page(GFP_NOIO | __GFP_NOWARN |
5a21d489 389 __GFP_NORETRY);
3aef83e0 390 if (src) {
3ecb01df 391 copy_page(src, buf);
3aef83e0 392 } else {
343df3c7 393 ret = hib_wait_io(hb); /* Free pages */
081a9d04
BS
394 if (ret)
395 return ret;
0eb0b63c 396 src = (void *)__get_free_page(GFP_NOIO |
5a21d489
BS
397 __GFP_NOWARN |
398 __GFP_NORETRY);
081a9d04
BS
399 if (src) {
400 copy_page(src, buf);
401 } else {
402 WARN_ON_ONCE(1);
343df3c7 403 hb = NULL; /* Go synchronous */
081a9d04
BS
404 src = buf;
405 }
ab954160 406 }
3aef83e0
RW
407 } else {
408 src = buf;
61159a31 409 }
568e34ed 410 return hib_submit_io(REQ_OP_WRITE | REQ_SYNC, offset, src, hb);
61159a31
RW
411}
412
61159a31
RW
413static void release_swap_writer(struct swap_map_handle *handle)
414{
415 if (handle->cur)
416 free_page((unsigned long)handle->cur);
417 handle->cur = NULL;
61159a31
RW
418}
419
420static int get_swap_writer(struct swap_map_handle *handle)
421{
6f612af5
JS
422 int ret;
423
424 ret = swsusp_swap_check();
425 if (ret) {
426 if (ret != -ENOSPC)
64ec72a1 427 pr_err("Cannot find swap device, try swapon -a\n");
6f612af5
JS
428 return ret;
429 }
61159a31 430 handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_KERNEL);
6f612af5
JS
431 if (!handle->cur) {
432 ret = -ENOMEM;
433 goto err_close;
434 }
d1d241cc 435 handle->cur_swap = alloc_swapdev_block(root_swap);
61159a31 436 if (!handle->cur_swap) {
6f612af5
JS
437 ret = -ENOSPC;
438 goto err_rel;
61159a31
RW
439 }
440 handle->k = 0;
f8262d47 441 handle->reqd_free_pages = reqd_free_pages();
51fb352b 442 handle->first_sector = handle->cur_swap;
61159a31 443 return 0;
6f612af5
JS
444err_rel:
445 release_swap_writer(handle);
446err_close:
93745df1 447 swsusp_close();
6f612af5 448 return ret;
61159a31
RW
449}
450
ab954160 451static int swap_write_page(struct swap_map_handle *handle, void *buf,
343df3c7 452 struct hib_bio_batch *hb)
ab954160 453{
bbeaa469 454 int error;
3aef83e0 455 sector_t offset;
61159a31
RW
456
457 if (!handle->cur)
458 return -EINVAL;
d1d241cc 459 offset = alloc_swapdev_block(root_swap);
343df3c7 460 error = write_page(buf, offset, hb);
61159a31
RW
461 if (error)
462 return error;
463 handle->cur->entries[handle->k++] = offset;
464 if (handle->k >= MAP_PAGE_ENTRIES) {
d1d241cc 465 offset = alloc_swapdev_block(root_swap);
61159a31
RW
466 if (!offset)
467 return -ENOSPC;
468 handle->cur->next_swap = offset;
343df3c7 469 error = write_page(handle->cur, handle->cur_swap, hb);
61159a31 470 if (error)
ab954160 471 goto out;
3ecb01df 472 clear_page(handle->cur);
61159a31
RW
473 handle->cur_swap = offset;
474 handle->k = 0;
5a21d489 475
343df3c7
CH
476 if (hb && low_free_pages() <= handle->reqd_free_pages) {
477 error = hib_wait_io(hb);
5a21d489
BS
478 if (error)
479 goto out;
480 /*
481 * Recalculate the number of required free pages, to
482 * make sure we never take more than half.
483 */
484 handle->reqd_free_pages = reqd_free_pages();
485 }
081a9d04 486 }
59a49335 487 out:
ab954160 488 return error;
61159a31
RW
489}
490
491static int flush_swap_writer(struct swap_map_handle *handle)
492{
493 if (handle->cur && handle->cur_swap)
ab954160 494 return write_page(handle->cur, handle->cur_swap, NULL);
61159a31
RW
495 else
496 return -EINVAL;
497}
498
6f612af5
JS
499static int swap_writer_finish(struct swap_map_handle *handle,
500 unsigned int flags, int error)
501{
502 if (!error) {
64ec72a1 503 pr_info("S");
6f612af5 504 error = mark_swapfiles(handle, flags);
64ec72a1 505 pr_cont("|\n");
fef9c8d2 506 flush_swap_writer(handle);
6f612af5
JS
507 }
508
509 if (error)
510 free_all_swap_pages(root_swap);
511 release_swap_writer(handle);
93745df1 512 swsusp_close();
6f612af5
JS
513
514 return error;
515}
516
f996fc96
BS
517/* We need to remember how much compressed data we need to read. */
518#define LZO_HEADER sizeof(size_t)
519
520/* Number of pages/bytes we'll compress at one time. */
521#define LZO_UNC_PAGES 32
522#define LZO_UNC_SIZE (LZO_UNC_PAGES * PAGE_SIZE)
523
524/* Number of pages/bytes we need for compressed data (worst case). */
525#define LZO_CMP_PAGES DIV_ROUND_UP(lzo1x_worst_compress(LZO_UNC_SIZE) + \
526 LZO_HEADER, PAGE_SIZE)
527#define LZO_CMP_SIZE (LZO_CMP_PAGES * PAGE_SIZE)
528
081a9d04
BS
529/* Maximum number of threads for compression/decompression. */
530#define LZO_THREADS 3
531
5a21d489
BS
532/* Minimum/maximum number of pages for read buffering. */
533#define LZO_MIN_RD_PAGES 1024
534#define LZO_MAX_RD_PAGES 8192
081a9d04
BS
535
536
61159a31
RW
537/**
538 * save_image - save the suspend image data
539 */
540
541static int save_image(struct swap_map_handle *handle,
542 struct snapshot_handle *snapshot,
3a4f7577 543 unsigned int nr_to_write)
61159a31
RW
544{
545 unsigned int m;
546 int ret;
3a4f7577 547 int nr_pages;
ab954160 548 int err2;
343df3c7 549 struct hib_bio_batch hb;
db597605
TR
550 ktime_t start;
551 ktime_t stop;
61159a31 552
343df3c7
CH
553 hib_init_batch(&hb);
554
64ec72a1 555 pr_info("Saving image data pages (%u pages)...\n",
23976728 556 nr_to_write);
d8150d35 557 m = nr_to_write / 10;
61159a31
RW
558 if (!m)
559 m = 1;
560 nr_pages = 0;
db597605 561 start = ktime_get();
4ff277f9 562 while (1) {
d3c1b24c 563 ret = snapshot_read_next(snapshot);
4ff277f9
JS
564 if (ret <= 0)
565 break;
343df3c7 566 ret = swap_write_page(handle, data_of(*snapshot), &hb);
4ff277f9
JS
567 if (ret)
568 break;
569 if (!(nr_pages % m))
64ec72a1
JP
570 pr_info("Image saving progress: %3d%%\n",
571 nr_pages / m * 10);
4ff277f9
JS
572 nr_pages++;
573 }
343df3c7 574 err2 = hib_wait_io(&hb);
55c4478a 575 hib_finish_batch(&hb);
db597605 576 stop = ktime_get();
4ff277f9
JS
577 if (!ret)
578 ret = err2;
579 if (!ret)
64ec72a1 580 pr_info("Image saving done\n");
db597605 581 swsusp_show_speed(start, stop, nr_to_write, "Wrote");
4ff277f9 582 return ret;
61159a31
RW
583}
584
6b37dfcb 585/*
081a9d04
BS
586 * Structure used for CRC32.
587 */
588struct crc_data {
589 struct task_struct *thr; /* thread */
590 atomic_t ready; /* ready to start flag */
591 atomic_t stop; /* ready to stop flag */
592 unsigned run_threads; /* nr current threads */
593 wait_queue_head_t go; /* start crc update */
594 wait_queue_head_t done; /* crc update done */
595 u32 *crc32; /* points to handle's crc32 */
596 size_t *unc_len[LZO_THREADS]; /* uncompressed lengths */
597 unsigned char *unc[LZO_THREADS]; /* uncompressed data */
598};
599
6b37dfcb 600/*
081a9d04
BS
601 * CRC32 update function that runs in its own thread.
602 */
603static int crc32_threadfn(void *data)
604{
605 struct crc_data *d = data;
606 unsigned i;
607
608 while (1) {
71cd7e80 609 wait_event(d->go, atomic_read_acquire(&d->ready) ||
081a9d04
BS
610 kthread_should_stop());
611 if (kthread_should_stop()) {
612 d->thr = NULL;
71cd7e80 613 atomic_set_release(&d->stop, 1);
081a9d04
BS
614 wake_up(&d->done);
615 break;
616 }
617 atomic_set(&d->ready, 0);
618
619 for (i = 0; i < d->run_threads; i++)
620 *d->crc32 = crc32_le(*d->crc32,
621 d->unc[i], *d->unc_len[i]);
71cd7e80 622 atomic_set_release(&d->stop, 1);
081a9d04
BS
623 wake_up(&d->done);
624 }
625 return 0;
626}
6b37dfcb 627/*
081a9d04
BS
628 * Structure used for LZO data compression.
629 */
630struct cmp_data {
631 struct task_struct *thr; /* thread */
632 atomic_t ready; /* ready to start flag */
633 atomic_t stop; /* ready to stop flag */
634 int ret; /* return code */
635 wait_queue_head_t go; /* start compression */
636 wait_queue_head_t done; /* compression done */
637 size_t unc_len; /* uncompressed length */
638 size_t cmp_len; /* compressed length */
639 unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */
640 unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer */
641 unsigned char wrk[LZO1X_1_MEM_COMPRESS]; /* compression workspace */
642};
643
6b37dfcb 644/*
081a9d04
BS
645 * Compression function that runs in its own thread.
646 */
647static int lzo_compress_threadfn(void *data)
648{
649 struct cmp_data *d = data;
650
651 while (1) {
71cd7e80 652 wait_event(d->go, atomic_read_acquire(&d->ready) ||
081a9d04
BS
653 kthread_should_stop());
654 if (kthread_should_stop()) {
655 d->thr = NULL;
656 d->ret = -1;
71cd7e80 657 atomic_set_release(&d->stop, 1);
081a9d04
BS
658 wake_up(&d->done);
659 break;
660 }
661 atomic_set(&d->ready, 0);
662
663 d->ret = lzo1x_1_compress(d->unc, d->unc_len,
664 d->cmp + LZO_HEADER, &d->cmp_len,
665 d->wrk);
71cd7e80 666 atomic_set_release(&d->stop, 1);
081a9d04
BS
667 wake_up(&d->done);
668 }
669 return 0;
670}
f996fc96
BS
671
672/**
673 * save_image_lzo - Save the suspend image data compressed with LZO.
057b0a75 674 * @handle: Swap map handle to use for saving the image.
f996fc96
BS
675 * @snapshot: Image to read data from.
676 * @nr_to_write: Number of pages to save.
677 */
678static int save_image_lzo(struct swap_map_handle *handle,
679 struct snapshot_handle *snapshot,
680 unsigned int nr_to_write)
681{
682 unsigned int m;
683 int ret = 0;
684 int nr_pages;
685 int err2;
343df3c7 686 struct hib_bio_batch hb;
db597605
TR
687 ktime_t start;
688 ktime_t stop;
081a9d04
BS
689 size_t off;
690 unsigned thr, run_threads, nr_threads;
691 unsigned char *page = NULL;
692 struct cmp_data *data = NULL;
693 struct crc_data *crc = NULL;
694
343df3c7
CH
695 hib_init_batch(&hb);
696
081a9d04
BS
697 /*
698 * We'll limit the number of threads for compression to limit memory
699 * footprint.
700 */
701 nr_threads = num_online_cpus() - 1;
702 nr_threads = clamp_val(nr_threads, 1, LZO_THREADS);
f996fc96 703
0eb0b63c 704 page = (void *)__get_free_page(GFP_NOIO | __GFP_HIGH);
f996fc96 705 if (!page) {
64ec72a1 706 pr_err("Failed to allocate LZO page\n");
081a9d04
BS
707 ret = -ENOMEM;
708 goto out_clean;
f996fc96
BS
709 }
710
9437e393 711 data = vzalloc(array_size(nr_threads, sizeof(*data)));
081a9d04 712 if (!data) {
64ec72a1 713 pr_err("Failed to allocate LZO data\n");
081a9d04
BS
714 ret = -ENOMEM;
715 goto out_clean;
f996fc96
BS
716 }
717
9437e393 718 crc = kzalloc(sizeof(*crc), GFP_KERNEL);
081a9d04 719 if (!crc) {
64ec72a1 720 pr_err("Failed to allocate crc\n");
081a9d04
BS
721 ret = -ENOMEM;
722 goto out_clean;
723 }
081a9d04
BS
724
725 /*
726 * Start the compression threads.
727 */
728 for (thr = 0; thr < nr_threads; thr++) {
729 init_waitqueue_head(&data[thr].go);
730 init_waitqueue_head(&data[thr].done);
731
732 data[thr].thr = kthread_run(lzo_compress_threadfn,
733 &data[thr],
734 "image_compress/%u", thr);
735 if (IS_ERR(data[thr].thr)) {
736 data[thr].thr = NULL;
64ec72a1 737 pr_err("Cannot start compression threads\n");
081a9d04
BS
738 ret = -ENOMEM;
739 goto out_clean;
740 }
f996fc96
BS
741 }
742
081a9d04
BS
743 /*
744 * Start the CRC32 thread.
745 */
746 init_waitqueue_head(&crc->go);
747 init_waitqueue_head(&crc->done);
748
749 handle->crc32 = 0;
750 crc->crc32 = &handle->crc32;
751 for (thr = 0; thr < nr_threads; thr++) {
752 crc->unc[thr] = data[thr].unc;
753 crc->unc_len[thr] = &data[thr].unc_len;
754 }
755
756 crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32");
757 if (IS_ERR(crc->thr)) {
758 crc->thr = NULL;
64ec72a1 759 pr_err("Cannot start CRC32 thread\n");
081a9d04
BS
760 ret = -ENOMEM;
761 goto out_clean;
f996fc96
BS
762 }
763
5a21d489
BS
764 /*
765 * Adjust the number of required free pages after all allocations have
766 * been done. We don't want to run out of pages when writing.
767 */
768 handle->reqd_free_pages = reqd_free_pages();
769
64ec72a1
JP
770 pr_info("Using %u thread(s) for compression\n", nr_threads);
771 pr_info("Compressing and saving image data (%u pages)...\n",
772 nr_to_write);
d8150d35 773 m = nr_to_write / 10;
f996fc96
BS
774 if (!m)
775 m = 1;
776 nr_pages = 0;
db597605 777 start = ktime_get();
f996fc96 778 for (;;) {
081a9d04
BS
779 for (thr = 0; thr < nr_threads; thr++) {
780 for (off = 0; off < LZO_UNC_SIZE; off += PAGE_SIZE) {
781 ret = snapshot_read_next(snapshot);
782 if (ret < 0)
783 goto out_finish;
784
785 if (!ret)
786 break;
787
788 memcpy(data[thr].unc + off,
789 data_of(*snapshot), PAGE_SIZE);
790
791 if (!(nr_pages % m))
64ec72a1
JP
792 pr_info("Image saving progress: %3d%%\n",
793 nr_pages / m * 10);
081a9d04
BS
794 nr_pages++;
795 }
796 if (!off)
f996fc96
BS
797 break;
798
081a9d04 799 data[thr].unc_len = off;
f996fc96 800
71cd7e80 801 atomic_set_release(&data[thr].ready, 1);
081a9d04 802 wake_up(&data[thr].go);
f996fc96
BS
803 }
804
081a9d04 805 if (!thr)
f996fc96
BS
806 break;
807
081a9d04 808 crc->run_threads = thr;
71cd7e80 809 atomic_set_release(&crc->ready, 1);
081a9d04 810 wake_up(&crc->go);
f996fc96 811
081a9d04
BS
812 for (run_threads = thr, thr = 0; thr < run_threads; thr++) {
813 wait_event(data[thr].done,
71cd7e80 814 atomic_read_acquire(&data[thr].stop));
081a9d04 815 atomic_set(&data[thr].stop, 0);
f996fc96 816
081a9d04 817 ret = data[thr].ret;
f996fc96 818
081a9d04 819 if (ret < 0) {
64ec72a1 820 pr_err("LZO compression failed\n");
081a9d04
BS
821 goto out_finish;
822 }
f996fc96 823
081a9d04
BS
824 if (unlikely(!data[thr].cmp_len ||
825 data[thr].cmp_len >
826 lzo1x_worst_compress(data[thr].unc_len))) {
64ec72a1 827 pr_err("Invalid LZO compressed length\n");
081a9d04 828 ret = -1;
f996fc96 829 goto out_finish;
081a9d04
BS
830 }
831
832 *(size_t *)data[thr].cmp = data[thr].cmp_len;
833
834 /*
835 * Given we are writing one page at a time to disk, we
836 * copy that much from the buffer, although the last
837 * bit will likely be smaller than full page. This is
838 * OK - we saved the length of the compressed data, so
839 * any garbage at the end will be discarded when we
840 * read it.
841 */
842 for (off = 0;
843 off < LZO_HEADER + data[thr].cmp_len;
844 off += PAGE_SIZE) {
845 memcpy(page, data[thr].cmp + off, PAGE_SIZE);
846
343df3c7 847 ret = swap_write_page(handle, page, &hb);
081a9d04
BS
848 if (ret)
849 goto out_finish;
850 }
f996fc96 851 }
081a9d04 852
71cd7e80 853 wait_event(crc->done, atomic_read_acquire(&crc->stop));
081a9d04 854 atomic_set(&crc->stop, 0);
f996fc96
BS
855 }
856
857out_finish:
343df3c7 858 err2 = hib_wait_io(&hb);
db597605 859 stop = ktime_get();
f996fc96
BS
860 if (!ret)
861 ret = err2;
d8150d35 862 if (!ret)
64ec72a1 863 pr_info("Image saving done\n");
db597605 864 swsusp_show_speed(start, stop, nr_to_write, "Wrote");
081a9d04 865out_clean:
55c4478a 866 hib_finish_batch(&hb);
081a9d04
BS
867 if (crc) {
868 if (crc->thr)
869 kthread_stop(crc->thr);
870 kfree(crc);
871 }
872 if (data) {
873 for (thr = 0; thr < nr_threads; thr++)
874 if (data[thr].thr)
875 kthread_stop(data[thr].thr);
876 vfree(data);
877 }
878 if (page) free_page((unsigned long)page);
f996fc96
BS
879
880 return ret;
881}
882
61159a31
RW
883/**
884 * enough_swap - Make sure we have enough swap to save the image.
885 *
886 * Returns TRUE or FALSE after checking the total amount of swap
e4b2897a 887 * space available from the resume partition.
61159a31
RW
888 */
889
8ffdfe35 890static int enough_swap(unsigned int nr_pages)
61159a31
RW
891{
892 unsigned int free_swap = count_swap_pages(root_swap, 1);
f996fc96 893 unsigned int required;
61159a31 894
64ec72a1 895 pr_debug("Free swap pages: %u\n", free_swap);
f996fc96 896
ee34a370 897 required = PAGES_FOR_IO + nr_pages;
f996fc96 898 return free_swap > required;
61159a31
RW
899}
900
901/**
902 * swsusp_write - Write entire image and metadata.
a634cc10 903 * @flags: flags to pass to the "boot" kernel in the image header
61159a31
RW
904 *
905 * It is important _NOT_ to umount filesystems at this point. We want
906 * them synced (in case something goes wrong) but we DO not want to mark
907 * filesystem clean: it is not. (And it does not matter, if we resume
908 * correctly, we'll mark system clean, anyway.)
909 */
910
a634cc10 911int swsusp_write(unsigned int flags)
61159a31
RW
912{
913 struct swap_map_handle handle;
914 struct snapshot_handle snapshot;
915 struct swsusp_info *header;
6f612af5 916 unsigned long pages;
61159a31
RW
917 int error;
918
6f612af5
JS
919 pages = snapshot_get_image_size();
920 error = get_swap_writer(&handle);
3aef83e0 921 if (error) {
64ec72a1 922 pr_err("Cannot get swap writer\n");
61159a31
RW
923 return error;
924 }
ee34a370 925 if (flags & SF_NOCOMPRESS_MODE) {
8ffdfe35 926 if (!enough_swap(pages)) {
64ec72a1 927 pr_err("Not enough free swap\n");
ee34a370
BS
928 error = -ENOSPC;
929 goto out_finish;
930 }
6f612af5 931 }
61159a31 932 memset(&snapshot, 0, sizeof(struct snapshot_handle));
d3c1b24c 933 error = snapshot_read_next(&snapshot);
d5641c64 934 if (error < (int)PAGE_SIZE) {
3aef83e0
RW
935 if (error >= 0)
936 error = -EFAULT;
937
6f612af5 938 goto out_finish;
3aef83e0 939 }
61159a31 940 header = (struct swsusp_info *)data_of(snapshot);
6f612af5 941 error = swap_write_page(&handle, header, NULL);
f996fc96
BS
942 if (!error) {
943 error = (flags & SF_NOCOMPRESS_MODE) ?
944 save_image(&handle, &snapshot, pages - 1) :
945 save_image_lzo(&handle, &snapshot, pages - 1);
946 }
6f612af5
JS
947out_finish:
948 error = swap_writer_finish(&handle, flags, error);
61159a31
RW
949 return error;
950}
951
6b37dfcb 952/*
61159a31 953 * The following functions allow us to read data using a swap map
6b37dfcb 954 * in a file-like way.
61159a31
RW
955 */
956
957static void release_swap_reader(struct swap_map_handle *handle)
958{
081a9d04
BS
959 struct swap_map_page_list *tmp;
960
961 while (handle->maps) {
962 if (handle->maps->map)
963 free_page((unsigned long)handle->maps->map);
964 tmp = handle->maps;
965 handle->maps = handle->maps->next;
966 kfree(tmp);
967 }
61159a31
RW
968 handle->cur = NULL;
969}
970
6f612af5
JS
971static int get_swap_reader(struct swap_map_handle *handle,
972 unsigned int *flags_p)
61159a31
RW
973{
974 int error;
081a9d04
BS
975 struct swap_map_page_list *tmp, *last;
976 sector_t offset;
61159a31 977
6f612af5
JS
978 *flags_p = swsusp_header->flags;
979
980 if (!swsusp_header->image) /* how can this happen? */
61159a31 981 return -EINVAL;
3aef83e0 982
081a9d04
BS
983 handle->cur = NULL;
984 last = handle->maps = NULL;
985 offset = swsusp_header->image;
986 while (offset) {
2f02a7ec 987 tmp = kzalloc(sizeof(*handle->maps), GFP_KERNEL);
081a9d04
BS
988 if (!tmp) {
989 release_swap_reader(handle);
990 return -ENOMEM;
991 }
081a9d04
BS
992 if (!handle->maps)
993 handle->maps = tmp;
994 if (last)
995 last->next = tmp;
996 last = tmp;
997
998 tmp->map = (struct swap_map_page *)
0eb0b63c 999 __get_free_page(GFP_NOIO | __GFP_HIGH);
081a9d04
BS
1000 if (!tmp->map) {
1001 release_swap_reader(handle);
1002 return -ENOMEM;
1003 }
3aef83e0 1004
568e34ed 1005 error = hib_submit_io(REQ_OP_READ, offset, tmp->map, NULL);
081a9d04
BS
1006 if (error) {
1007 release_swap_reader(handle);
1008 return error;
1009 }
1010 offset = tmp->map->next_swap;
61159a31
RW
1011 }
1012 handle->k = 0;
081a9d04 1013 handle->cur = handle->maps->map;
61159a31
RW
1014 return 0;
1015}
1016
546e0d27 1017static int swap_read_page(struct swap_map_handle *handle, void *buf,
343df3c7 1018 struct hib_bio_batch *hb)
61159a31 1019{
3aef83e0 1020 sector_t offset;
61159a31 1021 int error;
081a9d04 1022 struct swap_map_page_list *tmp;
61159a31
RW
1023
1024 if (!handle->cur)
1025 return -EINVAL;
1026 offset = handle->cur->entries[handle->k];
1027 if (!offset)
1028 return -EFAULT;
568e34ed 1029 error = hib_submit_io(REQ_OP_READ, offset, buf, hb);
61159a31
RW
1030 if (error)
1031 return error;
1032 if (++handle->k >= MAP_PAGE_ENTRIES) {
1033 handle->k = 0;
081a9d04
BS
1034 free_page((unsigned long)handle->maps->map);
1035 tmp = handle->maps;
1036 handle->maps = handle->maps->next;
1037 kfree(tmp);
1038 if (!handle->maps)
61159a31 1039 release_swap_reader(handle);
081a9d04
BS
1040 else
1041 handle->cur = handle->maps->map;
61159a31
RW
1042 }
1043 return error;
1044}
1045
6f612af5
JS
/* Release everything the reader @handle still holds.  Always returns 0. */
static int swap_reader_finish(struct swap_map_handle *handle)
{
	release_swap_reader(handle);
	return 0;
}
1052
61159a31
RW
1053/**
1054 * load_image - load the image using the swap map handle
1055 * @handle and the snapshot handle @snapshot
1056 * (assume there are @nr_pages pages to load)
1057 */
1058
1059static int load_image(struct swap_map_handle *handle,
1060 struct snapshot_handle *snapshot,
546e0d27 1061 unsigned int nr_to_read)
61159a31
RW
1062{
1063 unsigned int m;
081a9d04 1064 int ret = 0;
db597605
TR
1065 ktime_t start;
1066 ktime_t stop;
343df3c7 1067 struct hib_bio_batch hb;
546e0d27
AM
1068 int err2;
1069 unsigned nr_pages;
61159a31 1070
343df3c7
CH
1071 hib_init_batch(&hb);
1072
f6cf0545 1073 clean_pages_on_read = true;
64ec72a1 1074 pr_info("Loading image data pages (%u pages)...\n", nr_to_read);
d8150d35 1075 m = nr_to_read / 10;
61159a31
RW
1076 if (!m)
1077 m = 1;
1078 nr_pages = 0;
db597605 1079 start = ktime_get();
546e0d27 1080 for ( ; ; ) {
081a9d04
BS
1081 ret = snapshot_write_next(snapshot);
1082 if (ret <= 0)
546e0d27 1083 break;
343df3c7 1084 ret = swap_read_page(handle, data_of(*snapshot), &hb);
081a9d04 1085 if (ret)
546e0d27
AM
1086 break;
1087 if (snapshot->sync_read)
343df3c7 1088 ret = hib_wait_io(&hb);
081a9d04 1089 if (ret)
546e0d27
AM
1090 break;
1091 if (!(nr_pages % m))
64ec72a1
JP
1092 pr_info("Image loading progress: %3d%%\n",
1093 nr_pages / m * 10);
546e0d27
AM
1094 nr_pages++;
1095 }
343df3c7 1096 err2 = hib_wait_io(&hb);
55c4478a 1097 hib_finish_batch(&hb);
db597605 1098 stop = ktime_get();
081a9d04
BS
1099 if (!ret)
1100 ret = err2;
1101 if (!ret) {
64ec72a1 1102 pr_info("Image loading done\n");
8357376d 1103 snapshot_write_finalize(snapshot);
e655a250 1104 if (!snapshot_image_loaded(snapshot))
081a9d04 1105 ret = -ENODATA;
d8150d35 1106 }
db597605 1107 swsusp_show_speed(start, stop, nr_to_read, "Read");
081a9d04
BS
1108 return ret;
1109}
1110
6b37dfcb 1111/*
081a9d04
BS
1112 * Structure used for LZO data decompression.
1113 */
1114struct dec_data {
1115 struct task_struct *thr; /* thread */
1116 atomic_t ready; /* ready to start flag */
1117 atomic_t stop; /* ready to stop flag */
1118 int ret; /* return code */
1119 wait_queue_head_t go; /* start decompression */
1120 wait_queue_head_t done; /* decompression done */
1121 size_t unc_len; /* uncompressed length */
1122 size_t cmp_len; /* compressed length */
1123 unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */
1124 unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer */
1125};
1126
6b37dfcb 1127/*
6be2408a 1128 * Decompression function that runs in its own thread.
081a9d04
BS
1129 */
1130static int lzo_decompress_threadfn(void *data)
1131{
1132 struct dec_data *d = data;
1133
1134 while (1) {
71cd7e80 1135 wait_event(d->go, atomic_read_acquire(&d->ready) ||
081a9d04
BS
1136 kthread_should_stop());
1137 if (kthread_should_stop()) {
1138 d->thr = NULL;
1139 d->ret = -1;
71cd7e80 1140 atomic_set_release(&d->stop, 1);
081a9d04
BS
1141 wake_up(&d->done);
1142 break;
1143 }
1144 atomic_set(&d->ready, 0);
1145
1146 d->unc_len = LZO_UNC_SIZE;
1147 d->ret = lzo1x_decompress_safe(d->cmp + LZO_HEADER, d->cmp_len,
1148 d->unc, &d->unc_len);
f6cf0545
JM
1149 if (clean_pages_on_decompress)
1150 flush_icache_range((unsigned long)d->unc,
1151 (unsigned long)d->unc + d->unc_len);
1152
71cd7e80 1153 atomic_set_release(&d->stop, 1);
081a9d04
BS
1154 wake_up(&d->done);
1155 }
1156 return 0;
61159a31
RW
1157}
1158
f996fc96
BS
1159/**
1160 * load_image_lzo - Load compressed image data and decompress them with LZO.
1161 * @handle: Swap map handle to use for loading data.
1162 * @snapshot: Image to copy uncompressed data into.
1163 * @nr_to_read: Number of pages to load.
1164 */
1165static int load_image_lzo(struct swap_map_handle *handle,
1166 struct snapshot_handle *snapshot,
1167 unsigned int nr_to_read)
1168{
1169 unsigned int m;
081a9d04
BS
1170 int ret = 0;
1171 int eof = 0;
343df3c7 1172 struct hib_bio_batch hb;
db597605
TR
1173 ktime_t start;
1174 ktime_t stop;
f996fc96 1175 unsigned nr_pages;
081a9d04
BS
1176 size_t off;
1177 unsigned i, thr, run_threads, nr_threads;
1178 unsigned ring = 0, pg = 0, ring_size = 0,
1179 have = 0, want, need, asked = 0;
5a21d489 1180 unsigned long read_pages = 0;
081a9d04
BS
1181 unsigned char **page = NULL;
1182 struct dec_data *data = NULL;
1183 struct crc_data *crc = NULL;
1184
343df3c7
CH
1185 hib_init_batch(&hb);
1186
081a9d04
BS
1187 /*
1188 * We'll limit the number of threads for decompression to limit memory
1189 * footprint.
1190 */
1191 nr_threads = num_online_cpus() - 1;
1192 nr_threads = clamp_val(nr_threads, 1, LZO_THREADS);
1193
42bc47b3 1194 page = vmalloc(array_size(LZO_MAX_RD_PAGES, sizeof(*page)));
081a9d04 1195 if (!page) {
64ec72a1 1196 pr_err("Failed to allocate LZO page\n");
081a9d04
BS
1197 ret = -ENOMEM;
1198 goto out_clean;
1199 }
9f339caf 1200
9437e393 1201 data = vzalloc(array_size(nr_threads, sizeof(*data)));
081a9d04 1202 if (!data) {
64ec72a1 1203 pr_err("Failed to allocate LZO data\n");
081a9d04
BS
1204 ret = -ENOMEM;
1205 goto out_clean;
1206 }
9f339caf 1207
9437e393 1208 crc = kzalloc(sizeof(*crc), GFP_KERNEL);
081a9d04 1209 if (!crc) {
64ec72a1 1210 pr_err("Failed to allocate crc\n");
081a9d04
BS
1211 ret = -ENOMEM;
1212 goto out_clean;
1213 }
081a9d04 1214
f6cf0545
JM
1215 clean_pages_on_decompress = true;
1216
081a9d04
BS
1217 /*
1218 * Start the decompression threads.
1219 */
1220 for (thr = 0; thr < nr_threads; thr++) {
1221 init_waitqueue_head(&data[thr].go);
1222 init_waitqueue_head(&data[thr].done);
1223
1224 data[thr].thr = kthread_run(lzo_decompress_threadfn,
1225 &data[thr],
1226 "image_decompress/%u", thr);
1227 if (IS_ERR(data[thr].thr)) {
1228 data[thr].thr = NULL;
64ec72a1 1229 pr_err("Cannot start decompression threads\n");
081a9d04
BS
1230 ret = -ENOMEM;
1231 goto out_clean;
9f339caf 1232 }
f996fc96
BS
1233 }
1234
081a9d04
BS
1235 /*
1236 * Start the CRC32 thread.
1237 */
1238 init_waitqueue_head(&crc->go);
1239 init_waitqueue_head(&crc->done);
1240
1241 handle->crc32 = 0;
1242 crc->crc32 = &handle->crc32;
1243 for (thr = 0; thr < nr_threads; thr++) {
1244 crc->unc[thr] = data[thr].unc;
1245 crc->unc_len[thr] = &data[thr].unc_len;
f996fc96
BS
1246 }
1247
081a9d04
BS
1248 crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32");
1249 if (IS_ERR(crc->thr)) {
1250 crc->thr = NULL;
64ec72a1 1251 pr_err("Cannot start CRC32 thread\n");
081a9d04
BS
1252 ret = -ENOMEM;
1253 goto out_clean;
1254 }
9f339caf 1255
081a9d04 1256 /*
5a21d489
BS
1257 * Set the number of pages for read buffering.
1258 * This is complete guesswork, because we'll only know the real
1259 * picture once prepare_image() is called, which is much later on
1260 * during the image load phase. We'll assume the worst case and
1261 * say that none of the image pages are from high memory.
081a9d04 1262 */
5a21d489
BS
1263 if (low_free_pages() > snapshot_get_image_size())
1264 read_pages = (low_free_pages() - snapshot_get_image_size()) / 2;
1265 read_pages = clamp_val(read_pages, LZO_MIN_RD_PAGES, LZO_MAX_RD_PAGES);
9f339caf 1266
081a9d04
BS
1267 for (i = 0; i < read_pages; i++) {
1268 page[i] = (void *)__get_free_page(i < LZO_CMP_PAGES ?
0eb0b63c
CH
1269 GFP_NOIO | __GFP_HIGH :
1270 GFP_NOIO | __GFP_NOWARN |
71baba4b 1271 __GFP_NORETRY);
5a21d489 1272
081a9d04
BS
1273 if (!page[i]) {
1274 if (i < LZO_CMP_PAGES) {
1275 ring_size = i;
64ec72a1 1276 pr_err("Failed to allocate LZO pages\n");
081a9d04
BS
1277 ret = -ENOMEM;
1278 goto out_clean;
1279 } else {
1280 break;
1281 }
1282 }
f996fc96 1283 }
081a9d04 1284 want = ring_size = i;
f996fc96 1285
64ec72a1
JP
1286 pr_info("Using %u thread(s) for decompression\n", nr_threads);
1287 pr_info("Loading and decompressing image data (%u pages)...\n",
1288 nr_to_read);
d8150d35 1289 m = nr_to_read / 10;
f996fc96
BS
1290 if (!m)
1291 m = 1;
1292 nr_pages = 0;
db597605 1293 start = ktime_get();
f996fc96 1294
081a9d04
BS
1295 ret = snapshot_write_next(snapshot);
1296 if (ret <= 0)
f996fc96
BS
1297 goto out_finish;
1298
081a9d04
BS
1299 for(;;) {
1300 for (i = 0; !eof && i < want; i++) {
343df3c7 1301 ret = swap_read_page(handle, page[ring], &hb);
081a9d04
BS
1302 if (ret) {
1303 /*
1304 * On real read error, finish. On end of data,
1305 * set EOF flag and just exit the read loop.
1306 */
1307 if (handle->cur &&
1308 handle->cur->entries[handle->k]) {
1309 goto out_finish;
1310 } else {
1311 eof = 1;
1312 break;
1313 }
1314 }
1315 if (++ring >= ring_size)
1316 ring = 0;
f996fc96 1317 }
081a9d04
BS
1318 asked += i;
1319 want -= i;
f996fc96 1320
081a9d04
BS
1321 /*
1322 * We are out of data, wait for some more.
1323 */
1324 if (!have) {
1325 if (!asked)
1326 break;
1327
343df3c7 1328 ret = hib_wait_io(&hb);
081a9d04 1329 if (ret)
f996fc96 1330 goto out_finish;
081a9d04
BS
1331 have += asked;
1332 asked = 0;
1333 if (eof)
1334 eof = 2;
9f339caf 1335 }
f996fc96 1336
081a9d04 1337 if (crc->run_threads) {
71cd7e80 1338 wait_event(crc->done, atomic_read_acquire(&crc->stop));
081a9d04
BS
1339 atomic_set(&crc->stop, 0);
1340 crc->run_threads = 0;
f996fc96
BS
1341 }
1342
081a9d04
BS
1343 for (thr = 0; have && thr < nr_threads; thr++) {
1344 data[thr].cmp_len = *(size_t *)page[pg];
1345 if (unlikely(!data[thr].cmp_len ||
1346 data[thr].cmp_len >
1347 lzo1x_worst_compress(LZO_UNC_SIZE))) {
64ec72a1 1348 pr_err("Invalid LZO compressed length\n");
081a9d04
BS
1349 ret = -1;
1350 goto out_finish;
1351 }
1352
1353 need = DIV_ROUND_UP(data[thr].cmp_len + LZO_HEADER,
1354 PAGE_SIZE);
1355 if (need > have) {
1356 if (eof > 1) {
1357 ret = -1;
1358 goto out_finish;
1359 }
1360 break;
1361 }
1362
1363 for (off = 0;
1364 off < LZO_HEADER + data[thr].cmp_len;
1365 off += PAGE_SIZE) {
1366 memcpy(data[thr].cmp + off,
1367 page[pg], PAGE_SIZE);
1368 have--;
1369 want++;
1370 if (++pg >= ring_size)
1371 pg = 0;
1372 }
1373
71cd7e80 1374 atomic_set_release(&data[thr].ready, 1);
081a9d04 1375 wake_up(&data[thr].go);
f996fc96
BS
1376 }
1377
081a9d04
BS
1378 /*
1379 * Wait for more data while we are decompressing.
1380 */
1381 if (have < LZO_CMP_PAGES && asked) {
343df3c7 1382 ret = hib_wait_io(&hb);
081a9d04
BS
1383 if (ret)
1384 goto out_finish;
1385 have += asked;
1386 asked = 0;
1387 if (eof)
1388 eof = 2;
f996fc96
BS
1389 }
1390
081a9d04
BS
1391 for (run_threads = thr, thr = 0; thr < run_threads; thr++) {
1392 wait_event(data[thr].done,
71cd7e80 1393 atomic_read_acquire(&data[thr].stop));
081a9d04
BS
1394 atomic_set(&data[thr].stop, 0);
1395
1396 ret = data[thr].ret;
f996fc96 1397
081a9d04 1398 if (ret < 0) {
64ec72a1 1399 pr_err("LZO decompression failed\n");
081a9d04
BS
1400 goto out_finish;
1401 }
f996fc96 1402
081a9d04
BS
1403 if (unlikely(!data[thr].unc_len ||
1404 data[thr].unc_len > LZO_UNC_SIZE ||
1405 data[thr].unc_len & (PAGE_SIZE - 1))) {
64ec72a1 1406 pr_err("Invalid LZO uncompressed length\n");
081a9d04 1407 ret = -1;
f996fc96 1408 goto out_finish;
081a9d04
BS
1409 }
1410
1411 for (off = 0;
1412 off < data[thr].unc_len; off += PAGE_SIZE) {
1413 memcpy(data_of(*snapshot),
1414 data[thr].unc + off, PAGE_SIZE);
1415
1416 if (!(nr_pages % m))
64ec72a1
JP
1417 pr_info("Image loading progress: %3d%%\n",
1418 nr_pages / m * 10);
081a9d04
BS
1419 nr_pages++;
1420
1421 ret = snapshot_write_next(snapshot);
1422 if (ret <= 0) {
1423 crc->run_threads = thr + 1;
71cd7e80 1424 atomic_set_release(&crc->ready, 1);
081a9d04
BS
1425 wake_up(&crc->go);
1426 goto out_finish;
1427 }
1428 }
f996fc96 1429 }
081a9d04
BS
1430
1431 crc->run_threads = thr;
71cd7e80 1432 atomic_set_release(&crc->ready, 1);
081a9d04 1433 wake_up(&crc->go);
f996fc96
BS
1434 }
1435
1436out_finish:
081a9d04 1437 if (crc->run_threads) {
71cd7e80 1438 wait_event(crc->done, atomic_read_acquire(&crc->stop));
081a9d04
BS
1439 atomic_set(&crc->stop, 0);
1440 }
db597605 1441 stop = ktime_get();
081a9d04 1442 if (!ret) {
64ec72a1 1443 pr_info("Image loading done\n");
f996fc96
BS
1444 snapshot_write_finalize(snapshot);
1445 if (!snapshot_image_loaded(snapshot))
081a9d04
BS
1446 ret = -ENODATA;
1447 if (!ret) {
1448 if (swsusp_header->flags & SF_CRC32_MODE) {
1449 if(handle->crc32 != swsusp_header->crc32) {
64ec72a1 1450 pr_err("Invalid image CRC32!\n");
081a9d04
BS
1451 ret = -ENODATA;
1452 }
1453 }
1454 }
d8150d35 1455 }
db597605 1456 swsusp_show_speed(start, stop, nr_to_read, "Read");
081a9d04 1457out_clean:
55c4478a 1458 hib_finish_batch(&hb);
081a9d04 1459 for (i = 0; i < ring_size; i++)
9f339caf 1460 free_page((unsigned long)page[i]);
081a9d04
BS
1461 if (crc) {
1462 if (crc->thr)
1463 kthread_stop(crc->thr);
1464 kfree(crc);
1465 }
1466 if (data) {
1467 for (thr = 0; thr < nr_threads; thr++)
1468 if (data[thr].thr)
1469 kthread_stop(data[thr].thr);
1470 vfree(data);
1471 }
6c45de0d 1472 vfree(page);
f996fc96 1473
081a9d04 1474 return ret;
f996fc96
BS
1475}
1476
a634cc10
RW
1477/**
1478 * swsusp_read - read the hibernation image.
1479 * @flags_p: flags passed by the "frozen" kernel in the image header should
b595076a 1480 * be written into this memory location
a634cc10
RW
1481 */
1482
1483int swsusp_read(unsigned int *flags_p)
61159a31
RW
1484{
1485 int error;
1486 struct swap_map_handle handle;
1487 struct snapshot_handle snapshot;
1488 struct swsusp_info *header;
1489
61159a31 1490 memset(&snapshot, 0, sizeof(struct snapshot_handle));
d3c1b24c 1491 error = snapshot_write_next(&snapshot);
d5641c64 1492 if (error < (int)PAGE_SIZE)
61159a31
RW
1493 return error < 0 ? error : -EFAULT;
1494 header = (struct swsusp_info *)data_of(snapshot);
6f612af5
JS
1495 error = get_swap_reader(&handle, flags_p);
1496 if (error)
1497 goto end;
61159a31 1498 if (!error)
546e0d27 1499 error = swap_read_page(&handle, header, NULL);
f996fc96
BS
1500 if (!error) {
1501 error = (*flags_p & SF_NOCOMPRESS_MODE) ?
1502 load_image(&handle, &snapshot, header->pages - 1) :
1503 load_image_lzo(&handle, &snapshot, header->pages - 1);
1504 }
6f612af5
JS
1505 swap_reader_finish(&handle);
1506end:
61159a31 1507 if (!error)
64ec72a1 1508 pr_debug("Image successfully loaded\n");
61159a31 1509 else
64ec72a1 1510 pr_debug("Error %d resuming\n", error);
61159a31
RW
1511 return error;
1512}
1513
c889d079
CH
1514static void *swsusp_holder;
1515
61159a31 1516/**
7bf770f7 1517 * swsusp_check - Open the resume device and check for the swsusp signature.
40d84e19 1518 * @exclusive: Open the resume device exclusively.
61159a31
RW
1519 */
1520
40d84e19 1521int swsusp_check(bool exclusive)
61159a31 1522{
40d84e19 1523 void *holder = exclusive ? &swsusp_holder : NULL;
61159a31 1524 int error;
5904de0d 1525
4379f911 1526 hib_resume_bdev_file = bdev_file_open_by_dev(swsusp_resume_device,
e017d304 1527 BLK_OPEN_READ, holder, NULL);
4379f911
CB
1528 if (!IS_ERR(hib_resume_bdev_file)) {
1529 set_blocksize(file_bdev(hib_resume_bdev_file), PAGE_SIZE);
3ecb01df 1530 clear_page(swsusp_header);
568e34ed 1531 error = hib_submit_io(REQ_OP_READ, swsusp_resume_block,
1b29c164 1532 swsusp_header, NULL);
9a154d9d 1533 if (error)
76b57e61 1534 goto put;
9a154d9d 1535
3624eb04 1536 if (!memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) {
1b29c164 1537 memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10);
61159a31 1538 /* Reset swap signature now */
568e34ed 1539 error = hib_submit_io(REQ_OP_WRITE | REQ_SYNC,
162b99e3 1540 swsusp_resume_block,
1b29c164 1541 swsusp_header, NULL);
61159a31 1542 } else {
76b57e61 1543 error = -EINVAL;
61159a31 1544 }
74d95555
DW
1545 if (!error && swsusp_header->flags & SF_HW_SIG &&
1546 swsusp_header->hw_sig != swsusp_hardware_signature) {
1547 pr_info("Suspend image hardware signature mismatch (%08x now %08x); aborting resume.\n",
1548 swsusp_header->hw_sig, swsusp_hardware_signature);
1549 error = -EINVAL;
1550 }
76b57e61
JS
1551
1552put:
61159a31 1553 if (error)
4379f911 1554 fput(hib_resume_bdev_file);
61159a31 1555 else
64ec72a1 1556 pr_debug("Image signature found, resuming\n");
61159a31 1557 } else {
4379f911 1558 error = PTR_ERR(hib_resume_bdev_file);
61159a31
RW
1559 }
1560
1561 if (error)
64ec72a1 1562 pr_debug("Image not found (code %d)\n", error);
61159a31
RW
1563
1564 return error;
1565}
1566
1567/**
7bf770f7 1568 * swsusp_close - close resume device.
61159a31
RW
1569 */
1570
93745df1 1571void swsusp_close(void)
61159a31 1572{
4379f911 1573 if (IS_ERR(hib_resume_bdev_file)) {
64ec72a1 1574 pr_debug("Image device not initialised\n");
61159a31
RW
1575 return;
1576 }
1577
4379f911 1578 fput(hib_resume_bdev_file);
61159a31 1579}
1b29c164 1580
62c552cc
BS
/**
 * swsusp_unmark - Unmark swsusp signature in the resume device
 *
 * Re-reads the swap header and, if it still carries HIBERNATE_SIG, puts
 * the original swap signature back and writes the header out.  The swap
 * pages used for the image are freed in every case.
 *
 * Return: 0 on success, the error from reading or writing the header, or
 * -ENODEV if the header does not carry the hibernation signature.
 */

#ifdef CONFIG_SUSPEND
int swsusp_unmark(void)
{
	int error;

	/*
	 * Do not act on the buffer if the read failed: its contents are then
	 * not known to match what is on the device, and writing them back
	 * could damage the swap header.
	 */
	error = hib_submit_io(REQ_OP_READ, swsusp_resume_block,
			      swsusp_header, NULL);
	if (error) {
		pr_err("Cannot read swsusp header (error %d)\n", error);
	} else if (!memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) {
		memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10);
		error = hib_submit_io(REQ_OP_WRITE | REQ_SYNC,
				      swsusp_resume_block,
				      swsusp_header, NULL);
	} else {
		pr_err("Cannot find swsusp signature!\n");
		error = -ENODEV;
	}

	/*
	 * We just returned from suspend, we don't need the image any more.
	 */
	free_all_swap_pages(root_swap);

	return error;
}
#endif
1610
afd8d7c7 1611static int __init swsusp_header_init(void)
1b29c164
VG
1612{
1613 swsusp_header = (struct swsusp_header*) __get_free_page(GFP_KERNEL);
1614 if (!swsusp_header)
1615 panic("Could not allocate memory for swsusp_header\n");
1616 return 0;
1617}
1618
1619core_initcall(swsusp_header_init);