PM: hibernate: swap: Use vzalloc() and kzalloc()
[linux-2.6-block.git] / kernel / power / swap.c
CommitLineData
55716d26 1// SPDX-License-Identifier: GPL-2.0-only
61159a31
RW
2/*
3 * linux/kernel/power/swap.c
4 *
5 * This file provides functions for reading the suspend image from
6 * and writing it to a swap partition.
7 *
a2531293 8 * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@ucw.cz>
61159a31 9 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
5a21d489 10 * Copyright (C) 2010-2012 Bojan Smojver <bojan@rexursive.com>
61159a31
RW
11 */
12
64ec72a1
JP
13#define pr_fmt(fmt) "PM: " fmt
14
61159a31 15#include <linux/module.h>
61159a31 16#include <linux/file.h>
61159a31
RW
17#include <linux/delay.h>
18#include <linux/bitops.h>
19#include <linux/genhd.h>
20#include <linux/device.h>
61159a31 21#include <linux/bio.h>
546e0d27 22#include <linux/blkdev.h>
61159a31
RW
23#include <linux/swap.h>
24#include <linux/swapops.h>
25#include <linux/pm.h>
5a0e3ad6 26#include <linux/slab.h>
f996fc96
BS
27#include <linux/lzo.h>
28#include <linux/vmalloc.h>
081a9d04
BS
29#include <linux/cpumask.h>
30#include <linux/atomic.h>
31#include <linux/kthread.h>
32#include <linux/crc32.h>
db597605 33#include <linux/ktime.h>
61159a31
RW
34
35#include "power.h"
36
be8cd644 37#define HIBERNATE_SIG "S1SUSPEND"
61159a31 38
f6cf0545
JM
39/*
40 * When reading an {un,}compressed image, we may restore pages in place,
41 * in which case some architectures need these pages cleaning before they
42 * can be executed. We don't know which pages these may be, so clean the lot.
43 */
44static bool clean_pages_on_read;
45static bool clean_pages_on_decompress;
46
51fb352b
JS
/*
 *	The swap map is a data structure used for keeping track of each page
 *	written to a swap partition.  It consists of many swap_map_page
 *	structures, each of which contains an array of MAP_PAGE_ENTRIES swap
 *	entries.  These structures are stored on the swap and linked together
 *	with the help of the .next_swap member.
 *
 *	The swap map is created during suspend.  The swap map pages are
 *	allocated and populated one at a time, so we only need one memory
 *	page to set up the entire structure.
 *
 *	During resume we pick up all swap_map_page structures into a list.
 */
60
61#define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(sector_t) - 1)
62
f8262d47
BS
/*
 *	Count the free pages that are not highmem pages.
 */
static inline unsigned long low_free_pages(void)
{
	unsigned long total_free = nr_free_pages();
	unsigned long high_free = nr_free_highpages();

	return total_free - high_free;
}
70
/*
 *	Number of pages that must be kept free while the image is written:
 *	half of the low pages that are free at the moment of the call.
 */
static inline unsigned long reqd_free_pages(void)
{
	unsigned long low = low_free_pages();

	return low / 2;
}
79
51fb352b
JS
80struct swap_map_page {
81 sector_t entries[MAP_PAGE_ENTRIES];
82 sector_t next_swap;
83};
84
081a9d04
BS
/*
 *	Singly linked list node holding one swap map page in memory.
 */
struct swap_map_page_list {
	struct swap_map_page *map;		/* the map page itself */
	struct swap_map_page_list *next;	/* following node, or NULL */
};
89
51fb352b
JS
90/**
91 * The swap_map_handle structure is used for handling swap in
92 * a file-alike way
93 */
94
95struct swap_map_handle {
96 struct swap_map_page *cur;
081a9d04 97 struct swap_map_page_list *maps;
51fb352b
JS
98 sector_t cur_swap;
99 sector_t first_sector;
100 unsigned int k;
f8262d47 101 unsigned long reqd_free_pages;
081a9d04 102 u32 crc32;
51fb352b
JS
103};
104
1b29c164 105struct swsusp_header {
081a9d04
BS
106 char reserved[PAGE_SIZE - 20 - sizeof(sector_t) - sizeof(int) -
107 sizeof(u32)];
108 u32 crc32;
3aef83e0 109 sector_t image;
a634cc10 110 unsigned int flags; /* Flags to pass to the "boot" kernel */
61159a31
RW
111 char orig_sig[10];
112 char sig[10];
52f5684c 113} __packed;
1b29c164
VG
114
115static struct swsusp_header *swsusp_header;
61159a31 116
0414f2ec
NC
/**
 *	The following functions are used for tracking the allocated
 *	swap pages, so that they can be freed in case of an error.
 */
121
122struct swsusp_extent {
123 struct rb_node node;
124 unsigned long start;
125 unsigned long end;
126};
127
128static struct rb_root swsusp_extents = RB_ROOT;
129
130static int swsusp_extents_insert(unsigned long swap_offset)
131{
132 struct rb_node **new = &(swsusp_extents.rb_node);
133 struct rb_node *parent = NULL;
134 struct swsusp_extent *ext;
135
136 /* Figure out where to put the new node */
137 while (*new) {
8316bd72 138 ext = rb_entry(*new, struct swsusp_extent, node);
0414f2ec
NC
139 parent = *new;
140 if (swap_offset < ext->start) {
141 /* Try to merge */
142 if (swap_offset == ext->start - 1) {
143 ext->start--;
144 return 0;
145 }
146 new = &((*new)->rb_left);
147 } else if (swap_offset > ext->end) {
148 /* Try to merge */
149 if (swap_offset == ext->end + 1) {
150 ext->end++;
151 return 0;
152 }
153 new = &((*new)->rb_right);
154 } else {
155 /* It already is in the tree */
156 return -EINVAL;
157 }
158 }
159 /* Add the new node and rebalance the tree. */
160 ext = kzalloc(sizeof(struct swsusp_extent), GFP_KERNEL);
161 if (!ext)
162 return -ENOMEM;
163
164 ext->start = swap_offset;
165 ext->end = swap_offset;
166 rb_link_node(&ext->node, parent, new);
167 rb_insert_color(&ext->node, &swsusp_extents);
168 return 0;
169}
170
171/**
172 * alloc_swapdev_block - allocate a swap page and register that it has
173 * been allocated, so that it can be freed in case of an error.
174 */
175
176sector_t alloc_swapdev_block(int swap)
177{
178 unsigned long offset;
179
910321ea 180 offset = swp_offset(get_swap_page_of_type(swap));
0414f2ec
NC
181 if (offset) {
182 if (swsusp_extents_insert(offset))
910321ea 183 swap_free(swp_entry(swap, offset));
0414f2ec
NC
184 else
185 return swapdev_block(swap, offset);
186 }
187 return 0;
188}
189
190/**
191 * free_all_swap_pages - free swap pages allocated for saving image data.
90133673 192 * It also frees the extents used to register which swap entries had been
0414f2ec
NC
193 * allocated.
194 */
195
196void free_all_swap_pages(int swap)
197{
198 struct rb_node *node;
199
200 while ((node = swsusp_extents.rb_node)) {
201 struct swsusp_extent *ext;
202 unsigned long offset;
203
47087eeb 204 ext = rb_entry(node, struct swsusp_extent, node);
0414f2ec
NC
205 rb_erase(node, &swsusp_extents);
206 for (offset = ext->start; offset <= ext->end; offset++)
910321ea 207 swap_free(swp_entry(swap, offset));
0414f2ec
NC
208
209 kfree(ext);
210 }
211}
212
213int swsusp_swap_in_use(void)
214{
215 return (swsusp_extents.rb_node != NULL);
216}
217
61159a31 218/*
3fc6b34f 219 * General things
61159a31
RW
220 */
221
222static unsigned short root_swap = 0xffff;
343df3c7
CH
223static struct block_device *hib_resume_bdev;
224
225struct hib_bio_batch {
226 atomic_t count;
227 wait_queue_head_t wait;
4e4cbee9 228 blk_status_t error;
55c4478a 229 struct blk_plug plug;
343df3c7
CH
230};
231
232static void hib_init_batch(struct hib_bio_batch *hb)
233{
234 atomic_set(&hb->count, 0);
235 init_waitqueue_head(&hb->wait);
4e4cbee9 236 hb->error = BLK_STS_OK;
55c4478a
XC
237 blk_start_plug(&hb->plug);
238}
239
240static void hib_finish_batch(struct hib_bio_batch *hb)
241{
242 blk_finish_plug(&hb->plug);
343df3c7
CH
243}
244
4246a0b6 245static void hib_end_io(struct bio *bio)
343df3c7
CH
246{
247 struct hib_bio_batch *hb = bio->bi_private;
263663cd 248 struct page *page = bio_first_page_all(bio);
343df3c7 249
4e4cbee9 250 if (bio->bi_status) {
64ec72a1
JP
251 pr_alert("Read-error on swap-device (%u:%u:%Lu)\n",
252 MAJOR(bio_dev(bio)), MINOR(bio_dev(bio)),
253 (unsigned long long)bio->bi_iter.bi_sector);
343df3c7
CH
254 }
255
256 if (bio_data_dir(bio) == WRITE)
257 put_page(page);
f6cf0545
JM
258 else if (clean_pages_on_read)
259 flush_icache_range((unsigned long)page_address(page),
260 (unsigned long)page_address(page) + PAGE_SIZE);
343df3c7 261
4e4cbee9
CH
262 if (bio->bi_status && !hb->error)
263 hb->error = bio->bi_status;
343df3c7
CH
264 if (atomic_dec_and_test(&hb->count))
265 wake_up(&hb->wait);
266
267 bio_put(bio);
268}
269
162b99e3 270static int hib_submit_io(int op, int op_flags, pgoff_t page_off, void *addr,
343df3c7
CH
271 struct hib_bio_batch *hb)
272{
273 struct page *page = virt_to_page(addr);
274 struct bio *bio;
275 int error = 0;
276
0eb0b63c 277 bio = bio_alloc(GFP_NOIO | __GFP_HIGH, 1);
343df3c7 278 bio->bi_iter.bi_sector = page_off * (PAGE_SIZE >> 9);
74d46992 279 bio_set_dev(bio, hib_resume_bdev);
162b99e3 280 bio_set_op_attrs(bio, op, op_flags);
343df3c7
CH
281
282 if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
64ec72a1
JP
283 pr_err("Adding page to bio failed at %llu\n",
284 (unsigned long long)bio->bi_iter.bi_sector);
343df3c7
CH
285 bio_put(bio);
286 return -EFAULT;
287 }
288
289 if (hb) {
290 bio->bi_end_io = hib_end_io;
291 bio->bi_private = hb;
292 atomic_inc(&hb->count);
4e49ea4a 293 submit_bio(bio);
343df3c7 294 } else {
4e49ea4a 295 error = submit_bio_wait(bio);
343df3c7
CH
296 bio_put(bio);
297 }
298
299 return error;
300}
301
01de5fcd 302static int hib_wait_io(struct hib_bio_batch *hb)
343df3c7 303{
55c4478a
XC
304 /*
305 * We are relying on the behavior of blk_plug that a thread with
306 * a plug will flush the plug list before sleeping.
307 */
343df3c7 308 wait_event(hb->wait, atomic_read(&hb->count) == 0);
01de5fcd 309 return blk_status_to_errno(hb->error);
343df3c7 310}
3fc6b34f 311
3fc6b34f
RW
312/*
313 * Saving part
314 */
61159a31 315
51fb352b 316static int mark_swapfiles(struct swap_map_handle *handle, unsigned int flags)
61159a31
RW
317{
318 int error;
319
70fd7614 320 hib_submit_io(REQ_OP_READ, 0, swsusp_resume_block,
162b99e3 321 swsusp_header, NULL);
1b29c164
VG
322 if (!memcmp("SWAP-SPACE",swsusp_header->sig, 10) ||
323 !memcmp("SWAPSPACE2",swsusp_header->sig, 10)) {
324 memcpy(swsusp_header->orig_sig,swsusp_header->sig, 10);
3624eb04 325 memcpy(swsusp_header->sig, HIBERNATE_SIG, 10);
51fb352b 326 swsusp_header->image = handle->first_sector;
a634cc10 327 swsusp_header->flags = flags;
081a9d04
BS
328 if (flags & SF_CRC32_MODE)
329 swsusp_header->crc32 = handle->crc32;
70fd7614 330 error = hib_submit_io(REQ_OP_WRITE, REQ_SYNC,
162b99e3 331 swsusp_resume_block, swsusp_header, NULL);
61159a31 332 } else {
64ec72a1 333 pr_err("Swap header not found!\n");
61159a31
RW
334 error = -ENODEV;
335 }
336 return error;
337}
338
339/**
340 * swsusp_swap_check - check if the resume device is a swap device
341 * and get its index (if so)
6f612af5
JS
342 *
343 * This is called before saving image
61159a31 344 */
6f612af5 345static int swsusp_swap_check(void)
61159a31 346{
3aef83e0
RW
347 int res;
348
21bd9005
CH
349 if (swsusp_resume_device)
350 res = swap_type_of(swsusp_resume_device, swsusp_resume_block);
351 else
352 res = find_first_swap(&swsusp_resume_device);
3aef83e0
RW
353 if (res < 0)
354 return res;
3aef83e0 355 root_swap = res;
21bd9005 356
36daaa98
CH
357 hib_resume_bdev = blkdev_get_by_dev(swsusp_resume_device, FMODE_WRITE,
358 NULL);
359 if (IS_ERR(hib_resume_bdev))
360 return PTR_ERR(hib_resume_bdev);
3aef83e0 361
8a0d613f 362 res = set_blocksize(hib_resume_bdev, PAGE_SIZE);
3aef83e0 363 if (res < 0)
8a0d613f 364 blkdev_put(hib_resume_bdev, FMODE_WRITE);
61159a31 365
61159a31
RW
366 return res;
367}
368
369/**
370 * write_page - Write one page to given swap location.
371 * @buf: Address we're writing.
372 * @offset: Offset of the swap page we're writing to.
343df3c7 373 * @hb: bio completion batch
61159a31
RW
374 */
375
343df3c7 376static int write_page(void *buf, sector_t offset, struct hib_bio_batch *hb)
61159a31 377{
3aef83e0 378 void *src;
081a9d04 379 int ret;
3aef83e0
RW
380
381 if (!offset)
382 return -ENOSPC;
383
343df3c7 384 if (hb) {
0eb0b63c 385 src = (void *)__get_free_page(GFP_NOIO | __GFP_NOWARN |
5a21d489 386 __GFP_NORETRY);
3aef83e0 387 if (src) {
3ecb01df 388 copy_page(src, buf);
3aef83e0 389 } else {
343df3c7 390 ret = hib_wait_io(hb); /* Free pages */
081a9d04
BS
391 if (ret)
392 return ret;
0eb0b63c 393 src = (void *)__get_free_page(GFP_NOIO |
5a21d489
BS
394 __GFP_NOWARN |
395 __GFP_NORETRY);
081a9d04
BS
396 if (src) {
397 copy_page(src, buf);
398 } else {
399 WARN_ON_ONCE(1);
343df3c7 400 hb = NULL; /* Go synchronous */
081a9d04
BS
401 src = buf;
402 }
ab954160 403 }
3aef83e0
RW
404 } else {
405 src = buf;
61159a31 406 }
70fd7614 407 return hib_submit_io(REQ_OP_WRITE, REQ_SYNC, offset, src, hb);
61159a31
RW
408}
409
61159a31
RW
410static void release_swap_writer(struct swap_map_handle *handle)
411{
412 if (handle->cur)
413 free_page((unsigned long)handle->cur);
414 handle->cur = NULL;
61159a31
RW
415}
416
417static int get_swap_writer(struct swap_map_handle *handle)
418{
6f612af5
JS
419 int ret;
420
421 ret = swsusp_swap_check();
422 if (ret) {
423 if (ret != -ENOSPC)
64ec72a1 424 pr_err("Cannot find swap device, try swapon -a\n");
6f612af5
JS
425 return ret;
426 }
61159a31 427 handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_KERNEL);
6f612af5
JS
428 if (!handle->cur) {
429 ret = -ENOMEM;
430 goto err_close;
431 }
d1d241cc 432 handle->cur_swap = alloc_swapdev_block(root_swap);
61159a31 433 if (!handle->cur_swap) {
6f612af5
JS
434 ret = -ENOSPC;
435 goto err_rel;
61159a31
RW
436 }
437 handle->k = 0;
f8262d47 438 handle->reqd_free_pages = reqd_free_pages();
51fb352b 439 handle->first_sector = handle->cur_swap;
61159a31 440 return 0;
6f612af5
JS
441err_rel:
442 release_swap_writer(handle);
443err_close:
444 swsusp_close(FMODE_WRITE);
445 return ret;
61159a31
RW
446}
447
ab954160 448static int swap_write_page(struct swap_map_handle *handle, void *buf,
343df3c7 449 struct hib_bio_batch *hb)
ab954160
AM
450{
451 int error = 0;
3aef83e0 452 sector_t offset;
61159a31
RW
453
454 if (!handle->cur)
455 return -EINVAL;
d1d241cc 456 offset = alloc_swapdev_block(root_swap);
343df3c7 457 error = write_page(buf, offset, hb);
61159a31
RW
458 if (error)
459 return error;
460 handle->cur->entries[handle->k++] = offset;
461 if (handle->k >= MAP_PAGE_ENTRIES) {
d1d241cc 462 offset = alloc_swapdev_block(root_swap);
61159a31
RW
463 if (!offset)
464 return -ENOSPC;
465 handle->cur->next_swap = offset;
343df3c7 466 error = write_page(handle->cur, handle->cur_swap, hb);
61159a31 467 if (error)
ab954160 468 goto out;
3ecb01df 469 clear_page(handle->cur);
61159a31
RW
470 handle->cur_swap = offset;
471 handle->k = 0;
5a21d489 472
343df3c7
CH
473 if (hb && low_free_pages() <= handle->reqd_free_pages) {
474 error = hib_wait_io(hb);
5a21d489
BS
475 if (error)
476 goto out;
477 /*
478 * Recalculate the number of required free pages, to
479 * make sure we never take more than half.
480 */
481 handle->reqd_free_pages = reqd_free_pages();
482 }
081a9d04 483 }
59a49335 484 out:
ab954160 485 return error;
61159a31
RW
486}
487
488static int flush_swap_writer(struct swap_map_handle *handle)
489{
490 if (handle->cur && handle->cur_swap)
ab954160 491 return write_page(handle->cur, handle->cur_swap, NULL);
61159a31
RW
492 else
493 return -EINVAL;
494}
495
6f612af5
JS
496static int swap_writer_finish(struct swap_map_handle *handle,
497 unsigned int flags, int error)
498{
499 if (!error) {
64ec72a1 500 pr_info("S");
6f612af5 501 error = mark_swapfiles(handle, flags);
64ec72a1 502 pr_cont("|\n");
fef9c8d2 503 flush_swap_writer(handle);
6f612af5
JS
504 }
505
506 if (error)
507 free_all_swap_pages(root_swap);
508 release_swap_writer(handle);
509 swsusp_close(FMODE_WRITE);
510
511 return error;
512}
513
f996fc96
BS
514/* We need to remember how much compressed data we need to read. */
515#define LZO_HEADER sizeof(size_t)
516
517/* Number of pages/bytes we'll compress at one time. */
518#define LZO_UNC_PAGES 32
519#define LZO_UNC_SIZE (LZO_UNC_PAGES * PAGE_SIZE)
520
521/* Number of pages/bytes we need for compressed data (worst case). */
522#define LZO_CMP_PAGES DIV_ROUND_UP(lzo1x_worst_compress(LZO_UNC_SIZE) + \
523 LZO_HEADER, PAGE_SIZE)
524#define LZO_CMP_SIZE (LZO_CMP_PAGES * PAGE_SIZE)
525
081a9d04
BS
526/* Maximum number of threads for compression/decompression. */
527#define LZO_THREADS 3
528
5a21d489
BS
529/* Minimum/maximum number of pages for read buffering. */
530#define LZO_MIN_RD_PAGES 1024
531#define LZO_MAX_RD_PAGES 8192
081a9d04
BS
532
533
61159a31
RW
534/**
535 * save_image - save the suspend image data
536 */
537
538static int save_image(struct swap_map_handle *handle,
539 struct snapshot_handle *snapshot,
3a4f7577 540 unsigned int nr_to_write)
61159a31
RW
541{
542 unsigned int m;
543 int ret;
3a4f7577 544 int nr_pages;
ab954160 545 int err2;
343df3c7 546 struct hib_bio_batch hb;
db597605
TR
547 ktime_t start;
548 ktime_t stop;
61159a31 549
343df3c7
CH
550 hib_init_batch(&hb);
551
64ec72a1 552 pr_info("Saving image data pages (%u pages)...\n",
23976728 553 nr_to_write);
d8150d35 554 m = nr_to_write / 10;
61159a31
RW
555 if (!m)
556 m = 1;
557 nr_pages = 0;
db597605 558 start = ktime_get();
4ff277f9 559 while (1) {
d3c1b24c 560 ret = snapshot_read_next(snapshot);
4ff277f9
JS
561 if (ret <= 0)
562 break;
343df3c7 563 ret = swap_write_page(handle, data_of(*snapshot), &hb);
4ff277f9
JS
564 if (ret)
565 break;
566 if (!(nr_pages % m))
64ec72a1
JP
567 pr_info("Image saving progress: %3d%%\n",
568 nr_pages / m * 10);
4ff277f9
JS
569 nr_pages++;
570 }
343df3c7 571 err2 = hib_wait_io(&hb);
55c4478a 572 hib_finish_batch(&hb);
db597605 573 stop = ktime_get();
4ff277f9
JS
574 if (!ret)
575 ret = err2;
576 if (!ret)
64ec72a1 577 pr_info("Image saving done\n");
db597605 578 swsusp_show_speed(start, stop, nr_to_write, "Wrote");
4ff277f9 579 return ret;
61159a31
RW
580}
581
081a9d04
BS
582/**
583 * Structure used for CRC32.
584 */
585struct crc_data {
586 struct task_struct *thr; /* thread */
587 atomic_t ready; /* ready to start flag */
588 atomic_t stop; /* ready to stop flag */
589 unsigned run_threads; /* nr current threads */
590 wait_queue_head_t go; /* start crc update */
591 wait_queue_head_t done; /* crc update done */
592 u32 *crc32; /* points to handle's crc32 */
593 size_t *unc_len[LZO_THREADS]; /* uncompressed lengths */
594 unsigned char *unc[LZO_THREADS]; /* uncompressed data */
595};
596
597/**
598 * CRC32 update function that runs in its own thread.
599 */
600static int crc32_threadfn(void *data)
601{
602 struct crc_data *d = data;
603 unsigned i;
604
605 while (1) {
606 wait_event(d->go, atomic_read(&d->ready) ||
607 kthread_should_stop());
608 if (kthread_should_stop()) {
609 d->thr = NULL;
610 atomic_set(&d->stop, 1);
611 wake_up(&d->done);
612 break;
613 }
614 atomic_set(&d->ready, 0);
615
616 for (i = 0; i < d->run_threads; i++)
617 *d->crc32 = crc32_le(*d->crc32,
618 d->unc[i], *d->unc_len[i]);
619 atomic_set(&d->stop, 1);
620 wake_up(&d->done);
621 }
622 return 0;
623}
624/**
625 * Structure used for LZO data compression.
626 */
627struct cmp_data {
628 struct task_struct *thr; /* thread */
629 atomic_t ready; /* ready to start flag */
630 atomic_t stop; /* ready to stop flag */
631 int ret; /* return code */
632 wait_queue_head_t go; /* start compression */
633 wait_queue_head_t done; /* compression done */
634 size_t unc_len; /* uncompressed length */
635 size_t cmp_len; /* compressed length */
636 unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */
637 unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer */
638 unsigned char wrk[LZO1X_1_MEM_COMPRESS]; /* compression workspace */
639};
640
641/**
642 * Compression function that runs in its own thread.
643 */
644static int lzo_compress_threadfn(void *data)
645{
646 struct cmp_data *d = data;
647
648 while (1) {
649 wait_event(d->go, atomic_read(&d->ready) ||
650 kthread_should_stop());
651 if (kthread_should_stop()) {
652 d->thr = NULL;
653 d->ret = -1;
654 atomic_set(&d->stop, 1);
655 wake_up(&d->done);
656 break;
657 }
658 atomic_set(&d->ready, 0);
659
660 d->ret = lzo1x_1_compress(d->unc, d->unc_len,
661 d->cmp + LZO_HEADER, &d->cmp_len,
662 d->wrk);
663 atomic_set(&d->stop, 1);
664 wake_up(&d->done);
665 }
666 return 0;
667}
f996fc96
BS
668
669/**
670 * save_image_lzo - Save the suspend image data compressed with LZO.
057b0a75 671 * @handle: Swap map handle to use for saving the image.
f996fc96
BS
672 * @snapshot: Image to read data from.
673 * @nr_to_write: Number of pages to save.
674 */
675static int save_image_lzo(struct swap_map_handle *handle,
676 struct snapshot_handle *snapshot,
677 unsigned int nr_to_write)
678{
679 unsigned int m;
680 int ret = 0;
681 int nr_pages;
682 int err2;
343df3c7 683 struct hib_bio_batch hb;
db597605
TR
684 ktime_t start;
685 ktime_t stop;
081a9d04
BS
686 size_t off;
687 unsigned thr, run_threads, nr_threads;
688 unsigned char *page = NULL;
689 struct cmp_data *data = NULL;
690 struct crc_data *crc = NULL;
691
343df3c7
CH
692 hib_init_batch(&hb);
693
081a9d04
BS
694 /*
695 * We'll limit the number of threads for compression to limit memory
696 * footprint.
697 */
698 nr_threads = num_online_cpus() - 1;
699 nr_threads = clamp_val(nr_threads, 1, LZO_THREADS);
f996fc96 700
0eb0b63c 701 page = (void *)__get_free_page(GFP_NOIO | __GFP_HIGH);
f996fc96 702 if (!page) {
64ec72a1 703 pr_err("Failed to allocate LZO page\n");
081a9d04
BS
704 ret = -ENOMEM;
705 goto out_clean;
f996fc96
BS
706 }
707
9437e393 708 data = vzalloc(array_size(nr_threads, sizeof(*data)));
081a9d04 709 if (!data) {
64ec72a1 710 pr_err("Failed to allocate LZO data\n");
081a9d04
BS
711 ret = -ENOMEM;
712 goto out_clean;
f996fc96
BS
713 }
714
9437e393 715 crc = kzalloc(sizeof(*crc), GFP_KERNEL);
081a9d04 716 if (!crc) {
64ec72a1 717 pr_err("Failed to allocate crc\n");
081a9d04
BS
718 ret = -ENOMEM;
719 goto out_clean;
720 }
081a9d04
BS
721
722 /*
723 * Start the compression threads.
724 */
725 for (thr = 0; thr < nr_threads; thr++) {
726 init_waitqueue_head(&data[thr].go);
727 init_waitqueue_head(&data[thr].done);
728
729 data[thr].thr = kthread_run(lzo_compress_threadfn,
730 &data[thr],
731 "image_compress/%u", thr);
732 if (IS_ERR(data[thr].thr)) {
733 data[thr].thr = NULL;
64ec72a1 734 pr_err("Cannot start compression threads\n");
081a9d04
BS
735 ret = -ENOMEM;
736 goto out_clean;
737 }
f996fc96
BS
738 }
739
081a9d04
BS
740 /*
741 * Start the CRC32 thread.
742 */
743 init_waitqueue_head(&crc->go);
744 init_waitqueue_head(&crc->done);
745
746 handle->crc32 = 0;
747 crc->crc32 = &handle->crc32;
748 for (thr = 0; thr < nr_threads; thr++) {
749 crc->unc[thr] = data[thr].unc;
750 crc->unc_len[thr] = &data[thr].unc_len;
751 }
752
753 crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32");
754 if (IS_ERR(crc->thr)) {
755 crc->thr = NULL;
64ec72a1 756 pr_err("Cannot start CRC32 thread\n");
081a9d04
BS
757 ret = -ENOMEM;
758 goto out_clean;
f996fc96
BS
759 }
760
5a21d489
BS
761 /*
762 * Adjust the number of required free pages after all allocations have
763 * been done. We don't want to run out of pages when writing.
764 */
765 handle->reqd_free_pages = reqd_free_pages();
766
64ec72a1
JP
767 pr_info("Using %u thread(s) for compression\n", nr_threads);
768 pr_info("Compressing and saving image data (%u pages)...\n",
769 nr_to_write);
d8150d35 770 m = nr_to_write / 10;
f996fc96
BS
771 if (!m)
772 m = 1;
773 nr_pages = 0;
db597605 774 start = ktime_get();
f996fc96 775 for (;;) {
081a9d04
BS
776 for (thr = 0; thr < nr_threads; thr++) {
777 for (off = 0; off < LZO_UNC_SIZE; off += PAGE_SIZE) {
778 ret = snapshot_read_next(snapshot);
779 if (ret < 0)
780 goto out_finish;
781
782 if (!ret)
783 break;
784
785 memcpy(data[thr].unc + off,
786 data_of(*snapshot), PAGE_SIZE);
787
788 if (!(nr_pages % m))
64ec72a1
JP
789 pr_info("Image saving progress: %3d%%\n",
790 nr_pages / m * 10);
081a9d04
BS
791 nr_pages++;
792 }
793 if (!off)
f996fc96
BS
794 break;
795
081a9d04 796 data[thr].unc_len = off;
f996fc96 797
081a9d04
BS
798 atomic_set(&data[thr].ready, 1);
799 wake_up(&data[thr].go);
f996fc96
BS
800 }
801
081a9d04 802 if (!thr)
f996fc96
BS
803 break;
804
081a9d04
BS
805 crc->run_threads = thr;
806 atomic_set(&crc->ready, 1);
807 wake_up(&crc->go);
f996fc96 808
081a9d04
BS
809 for (run_threads = thr, thr = 0; thr < run_threads; thr++) {
810 wait_event(data[thr].done,
811 atomic_read(&data[thr].stop));
812 atomic_set(&data[thr].stop, 0);
f996fc96 813
081a9d04 814 ret = data[thr].ret;
f996fc96 815
081a9d04 816 if (ret < 0) {
64ec72a1 817 pr_err("LZO compression failed\n");
081a9d04
BS
818 goto out_finish;
819 }
f996fc96 820
081a9d04
BS
821 if (unlikely(!data[thr].cmp_len ||
822 data[thr].cmp_len >
823 lzo1x_worst_compress(data[thr].unc_len))) {
64ec72a1 824 pr_err("Invalid LZO compressed length\n");
081a9d04 825 ret = -1;
f996fc96 826 goto out_finish;
081a9d04
BS
827 }
828
829 *(size_t *)data[thr].cmp = data[thr].cmp_len;
830
831 /*
832 * Given we are writing one page at a time to disk, we
833 * copy that much from the buffer, although the last
834 * bit will likely be smaller than full page. This is
835 * OK - we saved the length of the compressed data, so
836 * any garbage at the end will be discarded when we
837 * read it.
838 */
839 for (off = 0;
840 off < LZO_HEADER + data[thr].cmp_len;
841 off += PAGE_SIZE) {
842 memcpy(page, data[thr].cmp + off, PAGE_SIZE);
843
343df3c7 844 ret = swap_write_page(handle, page, &hb);
081a9d04
BS
845 if (ret)
846 goto out_finish;
847 }
f996fc96 848 }
081a9d04
BS
849
850 wait_event(crc->done, atomic_read(&crc->stop));
851 atomic_set(&crc->stop, 0);
f996fc96
BS
852 }
853
854out_finish:
343df3c7 855 err2 = hib_wait_io(&hb);
db597605 856 stop = ktime_get();
f996fc96
BS
857 if (!ret)
858 ret = err2;
d8150d35 859 if (!ret)
64ec72a1 860 pr_info("Image saving done\n");
db597605 861 swsusp_show_speed(start, stop, nr_to_write, "Wrote");
081a9d04 862out_clean:
55c4478a 863 hib_finish_batch(&hb);
081a9d04
BS
864 if (crc) {
865 if (crc->thr)
866 kthread_stop(crc->thr);
867 kfree(crc);
868 }
869 if (data) {
870 for (thr = 0; thr < nr_threads; thr++)
871 if (data[thr].thr)
872 kthread_stop(data[thr].thr);
873 vfree(data);
874 }
875 if (page) free_page((unsigned long)page);
f996fc96
BS
876
877 return ret;
878}
879
61159a31
RW
880/**
881 * enough_swap - Make sure we have enough swap to save the image.
882 *
883 * Returns TRUE or FALSE after checking the total amount of swap
e4b2897a 884 * space available from the resume partition.
61159a31
RW
885 */
886
8ffdfe35 887static int enough_swap(unsigned int nr_pages)
61159a31
RW
888{
889 unsigned int free_swap = count_swap_pages(root_swap, 1);
f996fc96 890 unsigned int required;
61159a31 891
64ec72a1 892 pr_debug("Free swap pages: %u\n", free_swap);
f996fc96 893
ee34a370 894 required = PAGES_FOR_IO + nr_pages;
f996fc96 895 return free_swap > required;
61159a31
RW
896}
897
898/**
899 * swsusp_write - Write entire image and metadata.
a634cc10 900 * @flags: flags to pass to the "boot" kernel in the image header
61159a31
RW
901 *
902 * It is important _NOT_ to umount filesystems at this point. We want
903 * them synced (in case something goes wrong) but we DO not want to mark
904 * filesystem clean: it is not. (And it does not matter, if we resume
905 * correctly, we'll mark system clean, anyway.)
906 */
907
a634cc10 908int swsusp_write(unsigned int flags)
61159a31
RW
909{
910 struct swap_map_handle handle;
911 struct snapshot_handle snapshot;
912 struct swsusp_info *header;
6f612af5 913 unsigned long pages;
61159a31
RW
914 int error;
915
6f612af5
JS
916 pages = snapshot_get_image_size();
917 error = get_swap_writer(&handle);
3aef83e0 918 if (error) {
64ec72a1 919 pr_err("Cannot get swap writer\n");
61159a31
RW
920 return error;
921 }
ee34a370 922 if (flags & SF_NOCOMPRESS_MODE) {
8ffdfe35 923 if (!enough_swap(pages)) {
64ec72a1 924 pr_err("Not enough free swap\n");
ee34a370
BS
925 error = -ENOSPC;
926 goto out_finish;
927 }
6f612af5 928 }
61159a31 929 memset(&snapshot, 0, sizeof(struct snapshot_handle));
d3c1b24c 930 error = snapshot_read_next(&snapshot);
d5641c64 931 if (error < (int)PAGE_SIZE) {
3aef83e0
RW
932 if (error >= 0)
933 error = -EFAULT;
934
6f612af5 935 goto out_finish;
3aef83e0 936 }
61159a31 937 header = (struct swsusp_info *)data_of(snapshot);
6f612af5 938 error = swap_write_page(&handle, header, NULL);
f996fc96
BS
939 if (!error) {
940 error = (flags & SF_NOCOMPRESS_MODE) ?
941 save_image(&handle, &snapshot, pages - 1) :
942 save_image_lzo(&handle, &snapshot, pages - 1);
943 }
6f612af5
JS
944out_finish:
945 error = swap_writer_finish(&handle, flags, error);
61159a31
RW
946 return error;
947}
948
61159a31
RW
949/**
950 * The following functions allow us to read data using a swap map
951 * in a file-alike way
952 */
953
954static void release_swap_reader(struct swap_map_handle *handle)
955{
081a9d04
BS
956 struct swap_map_page_list *tmp;
957
958 while (handle->maps) {
959 if (handle->maps->map)
960 free_page((unsigned long)handle->maps->map);
961 tmp = handle->maps;
962 handle->maps = handle->maps->next;
963 kfree(tmp);
964 }
61159a31
RW
965 handle->cur = NULL;
966}
967
6f612af5
JS
968static int get_swap_reader(struct swap_map_handle *handle,
969 unsigned int *flags_p)
61159a31
RW
970{
971 int error;
081a9d04
BS
972 struct swap_map_page_list *tmp, *last;
973 sector_t offset;
61159a31 974
6f612af5
JS
975 *flags_p = swsusp_header->flags;
976
977 if (!swsusp_header->image) /* how can this happen? */
61159a31 978 return -EINVAL;
3aef83e0 979
081a9d04
BS
980 handle->cur = NULL;
981 last = handle->maps = NULL;
982 offset = swsusp_header->image;
983 while (offset) {
2f02a7ec 984 tmp = kzalloc(sizeof(*handle->maps), GFP_KERNEL);
081a9d04
BS
985 if (!tmp) {
986 release_swap_reader(handle);
987 return -ENOMEM;
988 }
081a9d04
BS
989 if (!handle->maps)
990 handle->maps = tmp;
991 if (last)
992 last->next = tmp;
993 last = tmp;
994
995 tmp->map = (struct swap_map_page *)
0eb0b63c 996 __get_free_page(GFP_NOIO | __GFP_HIGH);
081a9d04
BS
997 if (!tmp->map) {
998 release_swap_reader(handle);
999 return -ENOMEM;
1000 }
3aef83e0 1001
70fd7614 1002 error = hib_submit_io(REQ_OP_READ, 0, offset, tmp->map, NULL);
081a9d04
BS
1003 if (error) {
1004 release_swap_reader(handle);
1005 return error;
1006 }
1007 offset = tmp->map->next_swap;
61159a31
RW
1008 }
1009 handle->k = 0;
081a9d04 1010 handle->cur = handle->maps->map;
61159a31
RW
1011 return 0;
1012}
1013
546e0d27 1014static int swap_read_page(struct swap_map_handle *handle, void *buf,
343df3c7 1015 struct hib_bio_batch *hb)
61159a31 1016{
3aef83e0 1017 sector_t offset;
61159a31 1018 int error;
081a9d04 1019 struct swap_map_page_list *tmp;
61159a31
RW
1020
1021 if (!handle->cur)
1022 return -EINVAL;
1023 offset = handle->cur->entries[handle->k];
1024 if (!offset)
1025 return -EFAULT;
70fd7614 1026 error = hib_submit_io(REQ_OP_READ, 0, offset, buf, hb);
61159a31
RW
1027 if (error)
1028 return error;
1029 if (++handle->k >= MAP_PAGE_ENTRIES) {
1030 handle->k = 0;
081a9d04
BS
1031 free_page((unsigned long)handle->maps->map);
1032 tmp = handle->maps;
1033 handle->maps = handle->maps->next;
1034 kfree(tmp);
1035 if (!handle->maps)
61159a31 1036 release_swap_reader(handle);
081a9d04
BS
1037 else
1038 handle->cur = handle->maps->map;
61159a31
RW
1039 }
1040 return error;
1041}
1042
6f612af5
JS
/*
 *	Release whatever the swap reader still holds.  Always returns 0.
 */
static int swap_reader_finish(struct swap_map_handle *handle)
{
	release_swap_reader(handle);
	return 0;
}
1049
61159a31
RW
1050/**
1051 * load_image - load the image using the swap map handle
1052 * @handle and the snapshot handle @snapshot
1053 * (assume there are @nr_pages pages to load)
1054 */
1055
1056static int load_image(struct swap_map_handle *handle,
1057 struct snapshot_handle *snapshot,
546e0d27 1058 unsigned int nr_to_read)
61159a31
RW
1059{
1060 unsigned int m;
081a9d04 1061 int ret = 0;
db597605
TR
1062 ktime_t start;
1063 ktime_t stop;
343df3c7 1064 struct hib_bio_batch hb;
546e0d27
AM
1065 int err2;
1066 unsigned nr_pages;
61159a31 1067
343df3c7
CH
1068 hib_init_batch(&hb);
1069
f6cf0545 1070 clean_pages_on_read = true;
64ec72a1 1071 pr_info("Loading image data pages (%u pages)...\n", nr_to_read);
d8150d35 1072 m = nr_to_read / 10;
61159a31
RW
1073 if (!m)
1074 m = 1;
1075 nr_pages = 0;
db597605 1076 start = ktime_get();
546e0d27 1077 for ( ; ; ) {
081a9d04
BS
1078 ret = snapshot_write_next(snapshot);
1079 if (ret <= 0)
546e0d27 1080 break;
343df3c7 1081 ret = swap_read_page(handle, data_of(*snapshot), &hb);
081a9d04 1082 if (ret)
546e0d27
AM
1083 break;
1084 if (snapshot->sync_read)
343df3c7 1085 ret = hib_wait_io(&hb);
081a9d04 1086 if (ret)
546e0d27
AM
1087 break;
1088 if (!(nr_pages % m))
64ec72a1
JP
1089 pr_info("Image loading progress: %3d%%\n",
1090 nr_pages / m * 10);
546e0d27
AM
1091 nr_pages++;
1092 }
343df3c7 1093 err2 = hib_wait_io(&hb);
55c4478a 1094 hib_finish_batch(&hb);
db597605 1095 stop = ktime_get();
081a9d04
BS
1096 if (!ret)
1097 ret = err2;
1098 if (!ret) {
64ec72a1 1099 pr_info("Image loading done\n");
8357376d 1100 snapshot_write_finalize(snapshot);
e655a250 1101 if (!snapshot_image_loaded(snapshot))
081a9d04 1102 ret = -ENODATA;
d8150d35 1103 }
db597605 1104 swsusp_show_speed(start, stop, nr_to_read, "Read");
081a9d04
BS
1105 return ret;
1106}
1107
1108/**
1109 * Structure used for LZO data decompression.
1110 */
1111struct dec_data {
1112 struct task_struct *thr; /* thread */
1113 atomic_t ready; /* ready to start flag */
1114 atomic_t stop; /* ready to stop flag */
1115 int ret; /* return code */
1116 wait_queue_head_t go; /* start decompression */
1117 wait_queue_head_t done; /* decompression done */
1118 size_t unc_len; /* uncompressed length */
1119 size_t cmp_len; /* compressed length */
1120 unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */
1121 unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer */
1122};
1123
1124/**
6be2408a 1125 * Decompression function that runs in its own thread.
081a9d04
BS
1126 */
1127static int lzo_decompress_threadfn(void *data)
1128{
1129 struct dec_data *d = data;
1130
1131 while (1) {
1132 wait_event(d->go, atomic_read(&d->ready) ||
1133 kthread_should_stop());
1134 if (kthread_should_stop()) {
1135 d->thr = NULL;
1136 d->ret = -1;
1137 atomic_set(&d->stop, 1);
1138 wake_up(&d->done);
1139 break;
1140 }
1141 atomic_set(&d->ready, 0);
1142
1143 d->unc_len = LZO_UNC_SIZE;
1144 d->ret = lzo1x_decompress_safe(d->cmp + LZO_HEADER, d->cmp_len,
1145 d->unc, &d->unc_len);
f6cf0545
JM
1146 if (clean_pages_on_decompress)
1147 flush_icache_range((unsigned long)d->unc,
1148 (unsigned long)d->unc + d->unc_len);
1149
081a9d04
BS
1150 atomic_set(&d->stop, 1);
1151 wake_up(&d->done);
1152 }
1153 return 0;
61159a31
RW
1154}
1155
f996fc96
BS
1156/**
1157 * load_image_lzo - Load compressed image data and decompress them with LZO.
1158 * @handle: Swap map handle to use for loading data.
1159 * @snapshot: Image to copy uncompressed data into.
1160 * @nr_to_read: Number of pages to load.
1161 */
1162static int load_image_lzo(struct swap_map_handle *handle,
1163 struct snapshot_handle *snapshot,
1164 unsigned int nr_to_read)
1165{
1166 unsigned int m;
081a9d04
BS
1167 int ret = 0;
1168 int eof = 0;
343df3c7 1169 struct hib_bio_batch hb;
db597605
TR
1170 ktime_t start;
1171 ktime_t stop;
f996fc96 1172 unsigned nr_pages;
081a9d04
BS
1173 size_t off;
1174 unsigned i, thr, run_threads, nr_threads;
1175 unsigned ring = 0, pg = 0, ring_size = 0,
1176 have = 0, want, need, asked = 0;
5a21d489 1177 unsigned long read_pages = 0;
081a9d04
BS
1178 unsigned char **page = NULL;
1179 struct dec_data *data = NULL;
1180 struct crc_data *crc = NULL;
1181
343df3c7
CH
1182 hib_init_batch(&hb);
1183
081a9d04
BS
1184 /*
1185 * We'll limit the number of threads for decompression to limit memory
1186 * footprint.
1187 */
1188 nr_threads = num_online_cpus() - 1;
1189 nr_threads = clamp_val(nr_threads, 1, LZO_THREADS);
1190
42bc47b3 1191 page = vmalloc(array_size(LZO_MAX_RD_PAGES, sizeof(*page)));
081a9d04 1192 if (!page) {
64ec72a1 1193 pr_err("Failed to allocate LZO page\n");
081a9d04
BS
1194 ret = -ENOMEM;
1195 goto out_clean;
1196 }
9f339caf 1197
9437e393 1198 data = vzalloc(array_size(nr_threads, sizeof(*data)));
081a9d04 1199 if (!data) {
64ec72a1 1200 pr_err("Failed to allocate LZO data\n");
081a9d04
BS
1201 ret = -ENOMEM;
1202 goto out_clean;
1203 }
9f339caf 1204
9437e393 1205 crc = kzalloc(sizeof(*crc), GFP_KERNEL);
081a9d04 1206 if (!crc) {
64ec72a1 1207 pr_err("Failed to allocate crc\n");
081a9d04
BS
1208 ret = -ENOMEM;
1209 goto out_clean;
1210 }
081a9d04 1211
f6cf0545
JM
1212 clean_pages_on_decompress = true;
1213
081a9d04
BS
1214 /*
1215 * Start the decompression threads.
1216 */
1217 for (thr = 0; thr < nr_threads; thr++) {
1218 init_waitqueue_head(&data[thr].go);
1219 init_waitqueue_head(&data[thr].done);
1220
1221 data[thr].thr = kthread_run(lzo_decompress_threadfn,
1222 &data[thr],
1223 "image_decompress/%u", thr);
1224 if (IS_ERR(data[thr].thr)) {
1225 data[thr].thr = NULL;
64ec72a1 1226 pr_err("Cannot start decompression threads\n");
081a9d04
BS
1227 ret = -ENOMEM;
1228 goto out_clean;
9f339caf 1229 }
f996fc96
BS
1230 }
1231
081a9d04
BS
1232 /*
1233 * Start the CRC32 thread.
1234 */
1235 init_waitqueue_head(&crc->go);
1236 init_waitqueue_head(&crc->done);
1237
1238 handle->crc32 = 0;
1239 crc->crc32 = &handle->crc32;
1240 for (thr = 0; thr < nr_threads; thr++) {
1241 crc->unc[thr] = data[thr].unc;
1242 crc->unc_len[thr] = &data[thr].unc_len;
f996fc96
BS
1243 }
1244
081a9d04
BS
1245 crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32");
1246 if (IS_ERR(crc->thr)) {
1247 crc->thr = NULL;
64ec72a1 1248 pr_err("Cannot start CRC32 thread\n");
081a9d04
BS
1249 ret = -ENOMEM;
1250 goto out_clean;
1251 }
9f339caf 1252
081a9d04 1253 /*
5a21d489
BS
1254 * Set the number of pages for read buffering.
1255 * This is complete guesswork, because we'll only know the real
1256 * picture once prepare_image() is called, which is much later on
1257 * during the image load phase. We'll assume the worst case and
1258 * say that none of the image pages are from high memory.
081a9d04 1259 */
5a21d489
BS
1260 if (low_free_pages() > snapshot_get_image_size())
1261 read_pages = (low_free_pages() - snapshot_get_image_size()) / 2;
1262 read_pages = clamp_val(read_pages, LZO_MIN_RD_PAGES, LZO_MAX_RD_PAGES);
9f339caf 1263
081a9d04
BS
1264 for (i = 0; i < read_pages; i++) {
1265 page[i] = (void *)__get_free_page(i < LZO_CMP_PAGES ?
0eb0b63c
CH
1266 GFP_NOIO | __GFP_HIGH :
1267 GFP_NOIO | __GFP_NOWARN |
71baba4b 1268 __GFP_NORETRY);
5a21d489 1269
081a9d04
BS
1270 if (!page[i]) {
1271 if (i < LZO_CMP_PAGES) {
1272 ring_size = i;
64ec72a1 1273 pr_err("Failed to allocate LZO pages\n");
081a9d04
BS
1274 ret = -ENOMEM;
1275 goto out_clean;
1276 } else {
1277 break;
1278 }
1279 }
f996fc96 1280 }
081a9d04 1281 want = ring_size = i;
f996fc96 1282
64ec72a1
JP
1283 pr_info("Using %u thread(s) for decompression\n", nr_threads);
1284 pr_info("Loading and decompressing image data (%u pages)...\n",
1285 nr_to_read);
d8150d35 1286 m = nr_to_read / 10;
f996fc96
BS
1287 if (!m)
1288 m = 1;
1289 nr_pages = 0;
db597605 1290 start = ktime_get();
f996fc96 1291
081a9d04
BS
1292 ret = snapshot_write_next(snapshot);
1293 if (ret <= 0)
f996fc96
BS
1294 goto out_finish;
1295
081a9d04
BS
1296 for(;;) {
1297 for (i = 0; !eof && i < want; i++) {
343df3c7 1298 ret = swap_read_page(handle, page[ring], &hb);
081a9d04
BS
1299 if (ret) {
1300 /*
1301 * On real read error, finish. On end of data,
1302 * set EOF flag and just exit the read loop.
1303 */
1304 if (handle->cur &&
1305 handle->cur->entries[handle->k]) {
1306 goto out_finish;
1307 } else {
1308 eof = 1;
1309 break;
1310 }
1311 }
1312 if (++ring >= ring_size)
1313 ring = 0;
f996fc96 1314 }
081a9d04
BS
1315 asked += i;
1316 want -= i;
f996fc96 1317
081a9d04
BS
1318 /*
1319 * We are out of data, wait for some more.
1320 */
1321 if (!have) {
1322 if (!asked)
1323 break;
1324
343df3c7 1325 ret = hib_wait_io(&hb);
081a9d04 1326 if (ret)
f996fc96 1327 goto out_finish;
081a9d04
BS
1328 have += asked;
1329 asked = 0;
1330 if (eof)
1331 eof = 2;
9f339caf 1332 }
f996fc96 1333
081a9d04
BS
1334 if (crc->run_threads) {
1335 wait_event(crc->done, atomic_read(&crc->stop));
1336 atomic_set(&crc->stop, 0);
1337 crc->run_threads = 0;
f996fc96
BS
1338 }
1339
081a9d04
BS
1340 for (thr = 0; have && thr < nr_threads; thr++) {
1341 data[thr].cmp_len = *(size_t *)page[pg];
1342 if (unlikely(!data[thr].cmp_len ||
1343 data[thr].cmp_len >
1344 lzo1x_worst_compress(LZO_UNC_SIZE))) {
64ec72a1 1345 pr_err("Invalid LZO compressed length\n");
081a9d04
BS
1346 ret = -1;
1347 goto out_finish;
1348 }
1349
1350 need = DIV_ROUND_UP(data[thr].cmp_len + LZO_HEADER,
1351 PAGE_SIZE);
1352 if (need > have) {
1353 if (eof > 1) {
1354 ret = -1;
1355 goto out_finish;
1356 }
1357 break;
1358 }
1359
1360 for (off = 0;
1361 off < LZO_HEADER + data[thr].cmp_len;
1362 off += PAGE_SIZE) {
1363 memcpy(data[thr].cmp + off,
1364 page[pg], PAGE_SIZE);
1365 have--;
1366 want++;
1367 if (++pg >= ring_size)
1368 pg = 0;
1369 }
1370
1371 atomic_set(&data[thr].ready, 1);
1372 wake_up(&data[thr].go);
f996fc96
BS
1373 }
1374
081a9d04
BS
1375 /*
1376 * Wait for more data while we are decompressing.
1377 */
1378 if (have < LZO_CMP_PAGES && asked) {
343df3c7 1379 ret = hib_wait_io(&hb);
081a9d04
BS
1380 if (ret)
1381 goto out_finish;
1382 have += asked;
1383 asked = 0;
1384 if (eof)
1385 eof = 2;
f996fc96
BS
1386 }
1387
081a9d04
BS
1388 for (run_threads = thr, thr = 0; thr < run_threads; thr++) {
1389 wait_event(data[thr].done,
1390 atomic_read(&data[thr].stop));
1391 atomic_set(&data[thr].stop, 0);
1392
1393 ret = data[thr].ret;
f996fc96 1394
081a9d04 1395 if (ret < 0) {
64ec72a1 1396 pr_err("LZO decompression failed\n");
081a9d04
BS
1397 goto out_finish;
1398 }
f996fc96 1399
081a9d04
BS
1400 if (unlikely(!data[thr].unc_len ||
1401 data[thr].unc_len > LZO_UNC_SIZE ||
1402 data[thr].unc_len & (PAGE_SIZE - 1))) {
64ec72a1 1403 pr_err("Invalid LZO uncompressed length\n");
081a9d04 1404 ret = -1;
f996fc96 1405 goto out_finish;
081a9d04
BS
1406 }
1407
1408 for (off = 0;
1409 off < data[thr].unc_len; off += PAGE_SIZE) {
1410 memcpy(data_of(*snapshot),
1411 data[thr].unc + off, PAGE_SIZE);
1412
1413 if (!(nr_pages % m))
64ec72a1
JP
1414 pr_info("Image loading progress: %3d%%\n",
1415 nr_pages / m * 10);
081a9d04
BS
1416 nr_pages++;
1417
1418 ret = snapshot_write_next(snapshot);
1419 if (ret <= 0) {
1420 crc->run_threads = thr + 1;
1421 atomic_set(&crc->ready, 1);
1422 wake_up(&crc->go);
1423 goto out_finish;
1424 }
1425 }
f996fc96 1426 }
081a9d04
BS
1427
1428 crc->run_threads = thr;
1429 atomic_set(&crc->ready, 1);
1430 wake_up(&crc->go);
f996fc96
BS
1431 }
1432
1433out_finish:
081a9d04
BS
1434 if (crc->run_threads) {
1435 wait_event(crc->done, atomic_read(&crc->stop));
1436 atomic_set(&crc->stop, 0);
1437 }
db597605 1438 stop = ktime_get();
081a9d04 1439 if (!ret) {
64ec72a1 1440 pr_info("Image loading done\n");
f996fc96
BS
1441 snapshot_write_finalize(snapshot);
1442 if (!snapshot_image_loaded(snapshot))
081a9d04
BS
1443 ret = -ENODATA;
1444 if (!ret) {
1445 if (swsusp_header->flags & SF_CRC32_MODE) {
1446 if(handle->crc32 != swsusp_header->crc32) {
64ec72a1 1447 pr_err("Invalid image CRC32!\n");
081a9d04
BS
1448 ret = -ENODATA;
1449 }
1450 }
1451 }
d8150d35 1452 }
db597605 1453 swsusp_show_speed(start, stop, nr_to_read, "Read");
081a9d04 1454out_clean:
55c4478a 1455 hib_finish_batch(&hb);
081a9d04 1456 for (i = 0; i < ring_size; i++)
9f339caf 1457 free_page((unsigned long)page[i]);
081a9d04
BS
1458 if (crc) {
1459 if (crc->thr)
1460 kthread_stop(crc->thr);
1461 kfree(crc);
1462 }
1463 if (data) {
1464 for (thr = 0; thr < nr_threads; thr++)
1465 if (data[thr].thr)
1466 kthread_stop(data[thr].thr);
1467 vfree(data);
1468 }
6c45de0d 1469 vfree(page);
f996fc96 1470
081a9d04 1471 return ret;
f996fc96
BS
1472}
1473
a634cc10
RW
1474/**
1475 * swsusp_read - read the hibernation image.
1476 * @flags_p: flags passed by the "frozen" kernel in the image header should
b595076a 1477 * be written into this memory location
a634cc10
RW
1478 */
1479
1480int swsusp_read(unsigned int *flags_p)
61159a31
RW
1481{
1482 int error;
1483 struct swap_map_handle handle;
1484 struct snapshot_handle snapshot;
1485 struct swsusp_info *header;
1486
61159a31 1487 memset(&snapshot, 0, sizeof(struct snapshot_handle));
d3c1b24c 1488 error = snapshot_write_next(&snapshot);
d5641c64 1489 if (error < (int)PAGE_SIZE)
61159a31
RW
1490 return error < 0 ? error : -EFAULT;
1491 header = (struct swsusp_info *)data_of(snapshot);
6f612af5
JS
1492 error = get_swap_reader(&handle, flags_p);
1493 if (error)
1494 goto end;
61159a31 1495 if (!error)
546e0d27 1496 error = swap_read_page(&handle, header, NULL);
f996fc96
BS
1497 if (!error) {
1498 error = (*flags_p & SF_NOCOMPRESS_MODE) ?
1499 load_image(&handle, &snapshot, header->pages - 1) :
1500 load_image_lzo(&handle, &snapshot, header->pages - 1);
1501 }
6f612af5
JS
1502 swap_reader_finish(&handle);
1503end:
61159a31 1504 if (!error)
64ec72a1 1505 pr_debug("Image successfully loaded\n");
61159a31 1506 else
64ec72a1 1507 pr_debug("Error %d resuming\n", error);
61159a31
RW
1508 return error;
1509}
1510
1511/**
1512 * swsusp_check - Check for swsusp signature in the resume device
1513 */
1514
1515int swsusp_check(void)
1516{
1517 int error;
1518
d4d77629
TH
1519 hib_resume_bdev = blkdev_get_by_dev(swsusp_resume_device,
1520 FMODE_READ, NULL);
8a0d613f
JS
1521 if (!IS_ERR(hib_resume_bdev)) {
1522 set_blocksize(hib_resume_bdev, PAGE_SIZE);
3ecb01df 1523 clear_page(swsusp_header);
70fd7614 1524 error = hib_submit_io(REQ_OP_READ, 0,
162b99e3 1525 swsusp_resume_block,
1b29c164 1526 swsusp_header, NULL);
9a154d9d 1527 if (error)
76b57e61 1528 goto put;
9a154d9d 1529
3624eb04 1530 if (!memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) {
1b29c164 1531 memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10);
61159a31 1532 /* Reset swap signature now */
70fd7614 1533 error = hib_submit_io(REQ_OP_WRITE, REQ_SYNC,
162b99e3 1534 swsusp_resume_block,
1b29c164 1535 swsusp_header, NULL);
61159a31 1536 } else {
76b57e61 1537 error = -EINVAL;
61159a31 1538 }
76b57e61
JS
1539
1540put:
61159a31 1541 if (error)
8a0d613f 1542 blkdev_put(hib_resume_bdev, FMODE_READ);
61159a31 1543 else
64ec72a1 1544 pr_debug("Image signature found, resuming\n");
61159a31 1545 } else {
8a0d613f 1546 error = PTR_ERR(hib_resume_bdev);
61159a31
RW
1547 }
1548
1549 if (error)
64ec72a1 1550 pr_debug("Image not found (code %d)\n", error);
61159a31
RW
1551
1552 return error;
1553}
1554
1555/**
1556 * swsusp_close - close swap device.
1557 */
1558
c2dd0dae 1559void swsusp_close(fmode_t mode)
61159a31 1560{
8a0d613f 1561 if (IS_ERR(hib_resume_bdev)) {
64ec72a1 1562 pr_debug("Image device not initialised\n");
61159a31
RW
1563 return;
1564 }
1565
8a0d613f 1566 blkdev_put(hib_resume_bdev, mode);
61159a31 1567}
1b29c164 1568
/**
 * swsusp_unmark - Unmark swsusp signature in the resume device
 *
 * Reads the header block, and if it carries the hibernation signature,
 * restores the original signature and writes the block back.  The swap
 * pages are freed in every case.
 *
 * Returns 0 on success, the I/O error if the header cannot be read or
 * written, or -ENODEV if the hibernation signature is not present.
 */
#ifdef CONFIG_SUSPEND
int swsusp_unmark(void)
{
	int error;

	/*
	 * Do not trust (or write back) the header page if the read failed:
	 * its contents are undefined in that case.
	 */
	error = hib_submit_io(REQ_OP_READ, 0, swsusp_resume_block,
			      swsusp_header, NULL);
	if (error) {
		pr_err("Cannot read swsusp header (error %d)\n", error);
	} else if (!memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) {
		memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10);
		error = hib_submit_io(REQ_OP_WRITE, REQ_SYNC,
				      swsusp_resume_block,
				      swsusp_header, NULL);
	} else {
		pr_err("Cannot find swsusp signature!\n");
		error = -ENODEV;
	}

	/*
	 * We just returned from suspend, we don't need the image any more.
	 */
	free_all_swap_pages(root_swap);

	return error;
}
#endif
1598
afd8d7c7 1599static int __init swsusp_header_init(void)
1b29c164
VG
1600{
1601 swsusp_header = (struct swsusp_header*) __get_free_page(GFP_KERNEL);
1602 if (!swsusp_header)
1603 panic("Could not allocate memory for swsusp_header\n");
1604 return 0;
1605}
1606
1607core_initcall(swsusp_header_init);