]>
Commit | Line | Data |
---|---|---|
61159a31 RW |
1 | /* |
2 | * linux/kernel/power/swap.c | |
3 | * | |
4 | * This file provides functions for reading the suspend image from | |
5 | * and writing it to a swap partition. | |
6 | * | |
a2531293 | 7 | * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@ucw.cz> |
61159a31 | 8 | * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl> |
5a21d489 | 9 | * Copyright (C) 2010-2012 Bojan Smojver <bojan@rexursive.com> |
61159a31 RW |
10 | * |
11 | * This file is released under the GPLv2. | |
12 | * | |
13 | */ | |
14 | ||
15 | #include <linux/module.h> | |
61159a31 | 16 | #include <linux/file.h> |
61159a31 RW |
17 | #include <linux/delay.h> |
18 | #include <linux/bitops.h> | |
19 | #include <linux/genhd.h> | |
20 | #include <linux/device.h> | |
61159a31 | 21 | #include <linux/bio.h> |
546e0d27 | 22 | #include <linux/blkdev.h> |
61159a31 RW |
23 | #include <linux/swap.h> |
24 | #include <linux/swapops.h> | |
25 | #include <linux/pm.h> | |
5a0e3ad6 | 26 | #include <linux/slab.h> |
f996fc96 BS |
27 | #include <linux/lzo.h> |
28 | #include <linux/vmalloc.h> | |
081a9d04 BS |
29 | #include <linux/cpumask.h> |
30 | #include <linux/atomic.h> | |
31 | #include <linux/kthread.h> | |
32 | #include <linux/crc32.h> | |
db597605 | 33 | #include <linux/ktime.h> |
61159a31 RW |
34 | |
35 | #include "power.h" | |
36 | ||
be8cd644 | 37 | #define HIBERNATE_SIG "S1SUSPEND" |
61159a31 | 38 | |
51fb352b JS |
39 | /* |
40 | * The swap map is a data structure used for keeping track of each page | |
41 | * written to a swap partition. It consists of many swap_map_page | |
90133673 | 42 | * structures, each of which contains an array of MAP_PAGE_ENTRIES swap entries. |
51fb352b JS |
43 | * These structures are stored on the swap and linked together with the |
44 | * help of the .next_swap member. | |
45 | * | |
46 | * The swap map is created during suspend. The swap map pages are | |
47 | * allocated and populated one at a time, so we only need one memory | |
48 | * page to set up the entire structure. | |
49 | * | |
081a9d04 | 50 | * During resume we pick up all swap_map_page structures into a list. |
51fb352b JS |
51 | */ |
52 | ||
53 | #define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(sector_t) - 1) | |
54 | ||
f8262d47 BS |
/*
 * Count the currently free pages that are not highmem pages.
 */
static inline unsigned long low_free_pages(void)
{
	unsigned long all_free = nr_free_pages();

	return all_free - nr_free_highpages();
}
62 | ||
/*
 * Number of pages that must stay free while the image is being written:
 * one half of the low (non-highmem) pages that are free at the time of
 * the call.
 */
static inline unsigned long reqd_free_pages(void)
{
	unsigned long low = low_free_pages();

	return low / 2;
}
71 | ||
51fb352b JS |
72 | struct swap_map_page { |
73 | sector_t entries[MAP_PAGE_ENTRIES]; | |
74 | sector_t next_swap; | |
75 | }; | |
76 | ||
081a9d04 BS |
/*
 * Singly linked list node holding one swap map page in memory.
 */
struct swap_map_page_list {
	struct swap_map_page *map;		/* the map page itself */
	struct swap_map_page_list *next;	/* next node, NULL at the end */
};
81 | ||
51fb352b JS |
82 | /** |
83 | * The swap_map_handle structure is used for handling swap in | |
84 | * a file-alike way | |
85 | */ | |
86 | ||
87 | struct swap_map_handle { | |
88 | struct swap_map_page *cur; | |
081a9d04 | 89 | struct swap_map_page_list *maps; |
51fb352b JS |
90 | sector_t cur_swap; |
91 | sector_t first_sector; | |
92 | unsigned int k; | |
f8262d47 | 93 | unsigned long reqd_free_pages; |
081a9d04 | 94 | u32 crc32; |
51fb352b JS |
95 | }; |
96 | ||
1b29c164 | 97 | struct swsusp_header { |
081a9d04 BS |
98 | char reserved[PAGE_SIZE - 20 - sizeof(sector_t) - sizeof(int) - |
99 | sizeof(u32)]; | |
100 | u32 crc32; | |
3aef83e0 | 101 | sector_t image; |
a634cc10 | 102 | unsigned int flags; /* Flags to pass to the "boot" kernel */ |
61159a31 RW |
103 | char orig_sig[10]; |
104 | char sig[10]; | |
52f5684c | 105 | } __packed; |
1b29c164 VG |
106 | |
107 | static struct swsusp_header *swsusp_header; | |
61159a31 | 108 | |
0414f2ec NC |
109 | /** |
110 | * The following functions are used for tracing the allocated | |
111 | * swap pages, so that they can be freed in case of an error. | |
112 | */ | |
113 | ||
114 | struct swsusp_extent { | |
115 | struct rb_node node; | |
116 | unsigned long start; | |
117 | unsigned long end; | |
118 | }; | |
119 | ||
120 | static struct rb_root swsusp_extents = RB_ROOT; | |
121 | ||
122 | static int swsusp_extents_insert(unsigned long swap_offset) | |
123 | { | |
124 | struct rb_node **new = &(swsusp_extents.rb_node); | |
125 | struct rb_node *parent = NULL; | |
126 | struct swsusp_extent *ext; | |
127 | ||
128 | /* Figure out where to put the new node */ | |
129 | while (*new) { | |
8316bd72 | 130 | ext = rb_entry(*new, struct swsusp_extent, node); |
0414f2ec NC |
131 | parent = *new; |
132 | if (swap_offset < ext->start) { | |
133 | /* Try to merge */ | |
134 | if (swap_offset == ext->start - 1) { | |
135 | ext->start--; | |
136 | return 0; | |
137 | } | |
138 | new = &((*new)->rb_left); | |
139 | } else if (swap_offset > ext->end) { | |
140 | /* Try to merge */ | |
141 | if (swap_offset == ext->end + 1) { | |
142 | ext->end++; | |
143 | return 0; | |
144 | } | |
145 | new = &((*new)->rb_right); | |
146 | } else { | |
147 | /* It already is in the tree */ | |
148 | return -EINVAL; | |
149 | } | |
150 | } | |
151 | /* Add the new node and rebalance the tree. */ | |
152 | ext = kzalloc(sizeof(struct swsusp_extent), GFP_KERNEL); | |
153 | if (!ext) | |
154 | return -ENOMEM; | |
155 | ||
156 | ext->start = swap_offset; | |
157 | ext->end = swap_offset; | |
158 | rb_link_node(&ext->node, parent, new); | |
159 | rb_insert_color(&ext->node, &swsusp_extents); | |
160 | return 0; | |
161 | } | |
162 | ||
163 | /** | |
164 | * alloc_swapdev_block - allocate a swap page and register that it has | |
165 | * been allocated, so that it can be freed in case of an error. | |
166 | */ | |
167 | ||
168 | sector_t alloc_swapdev_block(int swap) | |
169 | { | |
170 | unsigned long offset; | |
171 | ||
910321ea | 172 | offset = swp_offset(get_swap_page_of_type(swap)); |
0414f2ec NC |
173 | if (offset) { |
174 | if (swsusp_extents_insert(offset)) | |
910321ea | 175 | swap_free(swp_entry(swap, offset)); |
0414f2ec NC |
176 | else |
177 | return swapdev_block(swap, offset); | |
178 | } | |
179 | return 0; | |
180 | } | |
181 | ||
182 | /** | |
183 | * free_all_swap_pages - free swap pages allocated for saving image data. | |
90133673 | 184 | * It also frees the extents used to register which swap entries had been |
0414f2ec NC |
185 | * allocated. |
186 | */ | |
187 | ||
188 | void free_all_swap_pages(int swap) | |
189 | { | |
190 | struct rb_node *node; | |
191 | ||
192 | while ((node = swsusp_extents.rb_node)) { | |
193 | struct swsusp_extent *ext; | |
194 | unsigned long offset; | |
195 | ||
196 | ext = container_of(node, struct swsusp_extent, node); | |
197 | rb_erase(node, &swsusp_extents); | |
198 | for (offset = ext->start; offset <= ext->end; offset++) | |
910321ea | 199 | swap_free(swp_entry(swap, offset)); |
0414f2ec NC |
200 | |
201 | kfree(ext); | |
202 | } | |
203 | } | |
204 | ||
205 | int swsusp_swap_in_use(void) | |
206 | { | |
207 | return (swsusp_extents.rb_node != NULL); | |
208 | } | |
209 | ||
61159a31 | 210 | /* |
3fc6b34f | 211 | * General things |
61159a31 RW |
212 | */ |
213 | ||
214 | static unsigned short root_swap = 0xffff; | |
343df3c7 CH |
215 | static struct block_device *hib_resume_bdev; |
216 | ||
217 | struct hib_bio_batch { | |
218 | atomic_t count; | |
219 | wait_queue_head_t wait; | |
220 | int error; | |
221 | }; | |
222 | ||
223 | static void hib_init_batch(struct hib_bio_batch *hb) | |
224 | { | |
225 | atomic_set(&hb->count, 0); | |
226 | init_waitqueue_head(&hb->wait); | |
227 | hb->error = 0; | |
228 | } | |
229 | ||
4246a0b6 | 230 | static void hib_end_io(struct bio *bio) |
343df3c7 CH |
231 | { |
232 | struct hib_bio_batch *hb = bio->bi_private; | |
343df3c7 CH |
233 | struct page *page = bio->bi_io_vec[0].bv_page; |
234 | ||
4246a0b6 | 235 | if (bio->bi_error) { |
343df3c7 CH |
236 | printk(KERN_ALERT "Read-error on swap-device (%u:%u:%Lu)\n", |
237 | imajor(bio->bi_bdev->bd_inode), | |
238 | iminor(bio->bi_bdev->bd_inode), | |
239 | (unsigned long long)bio->bi_iter.bi_sector); | |
343df3c7 CH |
240 | } |
241 | ||
242 | if (bio_data_dir(bio) == WRITE) | |
243 | put_page(page); | |
244 | ||
4246a0b6 CH |
245 | if (bio->bi_error && !hb->error) |
246 | hb->error = bio->bi_error; | |
343df3c7 CH |
247 | if (atomic_dec_and_test(&hb->count)) |
248 | wake_up(&hb->wait); | |
249 | ||
250 | bio_put(bio); | |
251 | } | |
252 | ||
253 | static int hib_submit_io(int rw, pgoff_t page_off, void *addr, | |
254 | struct hib_bio_batch *hb) | |
255 | { | |
256 | struct page *page = virt_to_page(addr); | |
257 | struct bio *bio; | |
258 | int error = 0; | |
259 | ||
71baba4b | 260 | bio = bio_alloc(__GFP_RECLAIM | __GFP_HIGH, 1); |
343df3c7 CH |
261 | bio->bi_iter.bi_sector = page_off * (PAGE_SIZE >> 9); |
262 | bio->bi_bdev = hib_resume_bdev; | |
263 | ||
264 | if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) { | |
265 | printk(KERN_ERR "PM: Adding page to bio failed at %llu\n", | |
266 | (unsigned long long)bio->bi_iter.bi_sector); | |
267 | bio_put(bio); | |
268 | return -EFAULT; | |
269 | } | |
270 | ||
271 | if (hb) { | |
272 | bio->bi_end_io = hib_end_io; | |
273 | bio->bi_private = hb; | |
274 | atomic_inc(&hb->count); | |
275 | submit_bio(rw, bio); | |
276 | } else { | |
277 | error = submit_bio_wait(rw, bio); | |
278 | bio_put(bio); | |
279 | } | |
280 | ||
281 | return error; | |
282 | } | |
283 | ||
284 | static int hib_wait_io(struct hib_bio_batch *hb) | |
285 | { | |
286 | wait_event(hb->wait, atomic_read(&hb->count) == 0); | |
287 | return hb->error; | |
288 | } | |
3fc6b34f | 289 | |
3fc6b34f RW |
290 | /* |
291 | * Saving part | |
292 | */ | |
61159a31 | 293 | |
51fb352b | 294 | static int mark_swapfiles(struct swap_map_handle *handle, unsigned int flags) |
61159a31 RW |
295 | { |
296 | int error; | |
297 | ||
343df3c7 | 298 | hib_submit_io(READ_SYNC, swsusp_resume_block, swsusp_header, NULL); |
1b29c164 VG |
299 | if (!memcmp("SWAP-SPACE",swsusp_header->sig, 10) || |
300 | !memcmp("SWAPSPACE2",swsusp_header->sig, 10)) { | |
301 | memcpy(swsusp_header->orig_sig,swsusp_header->sig, 10); | |
3624eb04 | 302 | memcpy(swsusp_header->sig, HIBERNATE_SIG, 10); |
51fb352b | 303 | swsusp_header->image = handle->first_sector; |
a634cc10 | 304 | swsusp_header->flags = flags; |
081a9d04 BS |
305 | if (flags & SF_CRC32_MODE) |
306 | swsusp_header->crc32 = handle->crc32; | |
343df3c7 | 307 | error = hib_submit_io(WRITE_SYNC, swsusp_resume_block, |
1b29c164 | 308 | swsusp_header, NULL); |
61159a31 | 309 | } else { |
23976728 | 310 | printk(KERN_ERR "PM: Swap header not found!\n"); |
61159a31 RW |
311 | error = -ENODEV; |
312 | } | |
313 | return error; | |
314 | } | |
315 | ||
316 | /** | |
317 | * swsusp_swap_check - check if the resume device is a swap device | |
318 | * and get its index (if so) | |
6f612af5 JS |
319 | * |
320 | * This is called before saving image | |
61159a31 | 321 | */ |
6f612af5 | 322 | static int swsusp_swap_check(void) |
61159a31 | 323 | { |
3aef83e0 RW |
324 | int res; |
325 | ||
7bf23687 | 326 | res = swap_type_of(swsusp_resume_device, swsusp_resume_block, |
8a0d613f | 327 | &hib_resume_bdev); |
3aef83e0 RW |
328 | if (res < 0) |
329 | return res; | |
330 | ||
331 | root_swap = res; | |
e525fd89 | 332 | res = blkdev_get(hib_resume_bdev, FMODE_WRITE, NULL); |
7bf23687 RW |
333 | if (res) |
334 | return res; | |
3aef83e0 | 335 | |
8a0d613f | 336 | res = set_blocksize(hib_resume_bdev, PAGE_SIZE); |
3aef83e0 | 337 | if (res < 0) |
8a0d613f | 338 | blkdev_put(hib_resume_bdev, FMODE_WRITE); |
61159a31 | 339 | |
61159a31 RW |
340 | return res; |
341 | } | |
342 | ||
343 | /** | |
344 | * write_page - Write one page to given swap location. | |
345 | * @buf: Address we're writing. | |
346 | * @offset: Offset of the swap page we're writing to. | |
343df3c7 | 347 | * @hb: bio completion batch |
61159a31 RW |
348 | */ |
349 | ||
343df3c7 | 350 | static int write_page(void *buf, sector_t offset, struct hib_bio_batch *hb) |
61159a31 | 351 | { |
3aef83e0 | 352 | void *src; |
081a9d04 | 353 | int ret; |
3aef83e0 RW |
354 | |
355 | if (!offset) | |
356 | return -ENOSPC; | |
357 | ||
343df3c7 | 358 | if (hb) { |
71baba4b | 359 | src = (void *)__get_free_page(__GFP_RECLAIM | __GFP_NOWARN | |
5a21d489 | 360 | __GFP_NORETRY); |
3aef83e0 | 361 | if (src) { |
3ecb01df | 362 | copy_page(src, buf); |
3aef83e0 | 363 | } else { |
343df3c7 | 364 | ret = hib_wait_io(hb); /* Free pages */ |
081a9d04 BS |
365 | if (ret) |
366 | return ret; | |
71baba4b | 367 | src = (void *)__get_free_page(__GFP_RECLAIM | |
5a21d489 BS |
368 | __GFP_NOWARN | |
369 | __GFP_NORETRY); | |
081a9d04 BS |
370 | if (src) { |
371 | copy_page(src, buf); | |
372 | } else { | |
373 | WARN_ON_ONCE(1); | |
343df3c7 | 374 | hb = NULL; /* Go synchronous */ |
081a9d04 BS |
375 | src = buf; |
376 | } | |
ab954160 | 377 | } |
3aef83e0 RW |
378 | } else { |
379 | src = buf; | |
61159a31 | 380 | } |
343df3c7 | 381 | return hib_submit_io(WRITE_SYNC, offset, src, hb); |
61159a31 RW |
382 | } |
383 | ||
61159a31 RW |
384 | static void release_swap_writer(struct swap_map_handle *handle) |
385 | { | |
386 | if (handle->cur) | |
387 | free_page((unsigned long)handle->cur); | |
388 | handle->cur = NULL; | |
61159a31 RW |
389 | } |
390 | ||
391 | static int get_swap_writer(struct swap_map_handle *handle) | |
392 | { | |
6f612af5 JS |
393 | int ret; |
394 | ||
395 | ret = swsusp_swap_check(); | |
396 | if (ret) { | |
397 | if (ret != -ENOSPC) | |
398 | printk(KERN_ERR "PM: Cannot find swap device, try " | |
399 | "swapon -a.\n"); | |
400 | return ret; | |
401 | } | |
61159a31 | 402 | handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_KERNEL); |
6f612af5 JS |
403 | if (!handle->cur) { |
404 | ret = -ENOMEM; | |
405 | goto err_close; | |
406 | } | |
d1d241cc | 407 | handle->cur_swap = alloc_swapdev_block(root_swap); |
61159a31 | 408 | if (!handle->cur_swap) { |
6f612af5 JS |
409 | ret = -ENOSPC; |
410 | goto err_rel; | |
61159a31 RW |
411 | } |
412 | handle->k = 0; | |
f8262d47 | 413 | handle->reqd_free_pages = reqd_free_pages(); |
51fb352b | 414 | handle->first_sector = handle->cur_swap; |
61159a31 | 415 | return 0; |
6f612af5 JS |
416 | err_rel: |
417 | release_swap_writer(handle); | |
418 | err_close: | |
419 | swsusp_close(FMODE_WRITE); | |
420 | return ret; | |
61159a31 RW |
421 | } |
422 | ||
ab954160 | 423 | static int swap_write_page(struct swap_map_handle *handle, void *buf, |
343df3c7 | 424 | struct hib_bio_batch *hb) |
ab954160 AM |
425 | { |
426 | int error = 0; | |
3aef83e0 | 427 | sector_t offset; |
61159a31 RW |
428 | |
429 | if (!handle->cur) | |
430 | return -EINVAL; | |
d1d241cc | 431 | offset = alloc_swapdev_block(root_swap); |
343df3c7 | 432 | error = write_page(buf, offset, hb); |
61159a31 RW |
433 | if (error) |
434 | return error; | |
435 | handle->cur->entries[handle->k++] = offset; | |
436 | if (handle->k >= MAP_PAGE_ENTRIES) { | |
d1d241cc | 437 | offset = alloc_swapdev_block(root_swap); |
61159a31 RW |
438 | if (!offset) |
439 | return -ENOSPC; | |
440 | handle->cur->next_swap = offset; | |
343df3c7 | 441 | error = write_page(handle->cur, handle->cur_swap, hb); |
61159a31 | 442 | if (error) |
ab954160 | 443 | goto out; |
3ecb01df | 444 | clear_page(handle->cur); |
61159a31 RW |
445 | handle->cur_swap = offset; |
446 | handle->k = 0; | |
5a21d489 | 447 | |
343df3c7 CH |
448 | if (hb && low_free_pages() <= handle->reqd_free_pages) { |
449 | error = hib_wait_io(hb); | |
5a21d489 BS |
450 | if (error) |
451 | goto out; | |
452 | /* | |
453 | * Recalculate the number of required free pages, to | |
454 | * make sure we never take more than half. | |
455 | */ | |
456 | handle->reqd_free_pages = reqd_free_pages(); | |
457 | } | |
081a9d04 | 458 | } |
59a49335 | 459 | out: |
ab954160 | 460 | return error; |
61159a31 RW |
461 | } |
462 | ||
463 | static int flush_swap_writer(struct swap_map_handle *handle) | |
464 | { | |
465 | if (handle->cur && handle->cur_swap) | |
ab954160 | 466 | return write_page(handle->cur, handle->cur_swap, NULL); |
61159a31 RW |
467 | else |
468 | return -EINVAL; | |
469 | } | |
470 | ||
6f612af5 JS |
471 | static int swap_writer_finish(struct swap_map_handle *handle, |
472 | unsigned int flags, int error) | |
473 | { | |
474 | if (!error) { | |
475 | flush_swap_writer(handle); | |
476 | printk(KERN_INFO "PM: S"); | |
477 | error = mark_swapfiles(handle, flags); | |
478 | printk("|\n"); | |
479 | } | |
480 | ||
481 | if (error) | |
482 | free_all_swap_pages(root_swap); | |
483 | release_swap_writer(handle); | |
484 | swsusp_close(FMODE_WRITE); | |
485 | ||
486 | return error; | |
487 | } | |
488 | ||
f996fc96 BS |
489 | /* We need to remember how much compressed data we need to read. */ |
490 | #define LZO_HEADER sizeof(size_t) | |
491 | ||
492 | /* Number of pages/bytes we'll compress at one time. */ | |
493 | #define LZO_UNC_PAGES 32 | |
494 | #define LZO_UNC_SIZE (LZO_UNC_PAGES * PAGE_SIZE) | |
495 | ||
496 | /* Number of pages/bytes we need for compressed data (worst case). */ | |
497 | #define LZO_CMP_PAGES DIV_ROUND_UP(lzo1x_worst_compress(LZO_UNC_SIZE) + \ | |
498 | LZO_HEADER, PAGE_SIZE) | |
499 | #define LZO_CMP_SIZE (LZO_CMP_PAGES * PAGE_SIZE) | |
500 | ||
081a9d04 BS |
501 | /* Maximum number of threads for compression/decompression. */ |
502 | #define LZO_THREADS 3 | |
503 | ||
5a21d489 BS |
504 | /* Minimum/maximum number of pages for read buffering. */ |
505 | #define LZO_MIN_RD_PAGES 1024 | |
506 | #define LZO_MAX_RD_PAGES 8192 | |
081a9d04 BS |
507 | |
508 | ||
61159a31 RW |
509 | /** |
510 | * save_image - save the suspend image data | |
511 | */ | |
512 | ||
513 | static int save_image(struct swap_map_handle *handle, | |
514 | struct snapshot_handle *snapshot, | |
3a4f7577 | 515 | unsigned int nr_to_write) |
61159a31 RW |
516 | { |
517 | unsigned int m; | |
518 | int ret; | |
3a4f7577 | 519 | int nr_pages; |
ab954160 | 520 | int err2; |
343df3c7 | 521 | struct hib_bio_batch hb; |
db597605 TR |
522 | ktime_t start; |
523 | ktime_t stop; | |
61159a31 | 524 | |
343df3c7 CH |
525 | hib_init_batch(&hb); |
526 | ||
d8150d35 | 527 | printk(KERN_INFO "PM: Saving image data pages (%u pages)...\n", |
23976728 | 528 | nr_to_write); |
d8150d35 | 529 | m = nr_to_write / 10; |
61159a31 RW |
530 | if (!m) |
531 | m = 1; | |
532 | nr_pages = 0; | |
db597605 | 533 | start = ktime_get(); |
4ff277f9 | 534 | while (1) { |
d3c1b24c | 535 | ret = snapshot_read_next(snapshot); |
4ff277f9 JS |
536 | if (ret <= 0) |
537 | break; | |
343df3c7 | 538 | ret = swap_write_page(handle, data_of(*snapshot), &hb); |
4ff277f9 JS |
539 | if (ret) |
540 | break; | |
541 | if (!(nr_pages % m)) | |
d8150d35 BS |
542 | printk(KERN_INFO "PM: Image saving progress: %3d%%\n", |
543 | nr_pages / m * 10); | |
4ff277f9 JS |
544 | nr_pages++; |
545 | } | |
343df3c7 | 546 | err2 = hib_wait_io(&hb); |
db597605 | 547 | stop = ktime_get(); |
4ff277f9 JS |
548 | if (!ret) |
549 | ret = err2; | |
550 | if (!ret) | |
d8150d35 | 551 | printk(KERN_INFO "PM: Image saving done.\n"); |
db597605 | 552 | swsusp_show_speed(start, stop, nr_to_write, "Wrote"); |
4ff277f9 | 553 | return ret; |
61159a31 RW |
554 | } |
555 | ||
081a9d04 BS |
556 | /** |
557 | * Structure used for CRC32. | |
558 | */ | |
559 | struct crc_data { | |
560 | struct task_struct *thr; /* thread */ | |
561 | atomic_t ready; /* ready to start flag */ | |
562 | atomic_t stop; /* ready to stop flag */ | |
563 | unsigned run_threads; /* nr current threads */ | |
564 | wait_queue_head_t go; /* start crc update */ | |
565 | wait_queue_head_t done; /* crc update done */ | |
566 | u32 *crc32; /* points to handle's crc32 */ | |
567 | size_t *unc_len[LZO_THREADS]; /* uncompressed lengths */ | |
568 | unsigned char *unc[LZO_THREADS]; /* uncompressed data */ | |
569 | }; | |
570 | ||
571 | /** | |
572 | * CRC32 update function that runs in its own thread. | |
573 | */ | |
574 | static int crc32_threadfn(void *data) | |
575 | { | |
576 | struct crc_data *d = data; | |
577 | unsigned i; | |
578 | ||
579 | while (1) { | |
580 | wait_event(d->go, atomic_read(&d->ready) || | |
581 | kthread_should_stop()); | |
582 | if (kthread_should_stop()) { | |
583 | d->thr = NULL; | |
584 | atomic_set(&d->stop, 1); | |
585 | wake_up(&d->done); | |
586 | break; | |
587 | } | |
588 | atomic_set(&d->ready, 0); | |
589 | ||
590 | for (i = 0; i < d->run_threads; i++) | |
591 | *d->crc32 = crc32_le(*d->crc32, | |
592 | d->unc[i], *d->unc_len[i]); | |
593 | atomic_set(&d->stop, 1); | |
594 | wake_up(&d->done); | |
595 | } | |
596 | return 0; | |
597 | } | |
598 | /** | |
599 | * Structure used for LZO data compression. | |
600 | */ | |
601 | struct cmp_data { | |
602 | struct task_struct *thr; /* thread */ | |
603 | atomic_t ready; /* ready to start flag */ | |
604 | atomic_t stop; /* ready to stop flag */ | |
605 | int ret; /* return code */ | |
606 | wait_queue_head_t go; /* start compression */ | |
607 | wait_queue_head_t done; /* compression done */ | |
608 | size_t unc_len; /* uncompressed length */ | |
609 | size_t cmp_len; /* compressed length */ | |
610 | unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */ | |
611 | unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer */ | |
612 | unsigned char wrk[LZO1X_1_MEM_COMPRESS]; /* compression workspace */ | |
613 | }; | |
614 | ||
615 | /** | |
616 | * Compression function that runs in its own thread. | |
617 | */ | |
618 | static int lzo_compress_threadfn(void *data) | |
619 | { | |
620 | struct cmp_data *d = data; | |
621 | ||
622 | while (1) { | |
623 | wait_event(d->go, atomic_read(&d->ready) || | |
624 | kthread_should_stop()); | |
625 | if (kthread_should_stop()) { | |
626 | d->thr = NULL; | |
627 | d->ret = -1; | |
628 | atomic_set(&d->stop, 1); | |
629 | wake_up(&d->done); | |
630 | break; | |
631 | } | |
632 | atomic_set(&d->ready, 0); | |
633 | ||
634 | d->ret = lzo1x_1_compress(d->unc, d->unc_len, | |
635 | d->cmp + LZO_HEADER, &d->cmp_len, | |
636 | d->wrk); | |
637 | atomic_set(&d->stop, 1); | |
638 | wake_up(&d->done); | |
639 | } | |
640 | return 0; | |
641 | } | |
f996fc96 BS |
642 | |
643 | /** | |
644 | * save_image_lzo - Save the suspend image data compressed with LZO. | |
057b0a75 | 645 | * @handle: Swap map handle to use for saving the image. |
f996fc96 BS |
646 | * @snapshot: Image to read data from. |
647 | * @nr_to_write: Number of pages to save. | |
648 | */ | |
649 | static int save_image_lzo(struct swap_map_handle *handle, | |
650 | struct snapshot_handle *snapshot, | |
651 | unsigned int nr_to_write) | |
652 | { | |
653 | unsigned int m; | |
654 | int ret = 0; | |
655 | int nr_pages; | |
656 | int err2; | |
343df3c7 | 657 | struct hib_bio_batch hb; |
db597605 TR |
658 | ktime_t start; |
659 | ktime_t stop; | |
081a9d04 BS |
660 | size_t off; |
661 | unsigned thr, run_threads, nr_threads; | |
662 | unsigned char *page = NULL; | |
663 | struct cmp_data *data = NULL; | |
664 | struct crc_data *crc = NULL; | |
665 | ||
343df3c7 CH |
666 | hib_init_batch(&hb); |
667 | ||
081a9d04 BS |
668 | /* |
669 | * We'll limit the number of threads for compression to limit memory | |
670 | * footprint. | |
671 | */ | |
672 | nr_threads = num_online_cpus() - 1; | |
673 | nr_threads = clamp_val(nr_threads, 1, LZO_THREADS); | |
f996fc96 | 674 | |
71baba4b | 675 | page = (void *)__get_free_page(__GFP_RECLAIM | __GFP_HIGH); |
f996fc96 BS |
676 | if (!page) { |
677 | printk(KERN_ERR "PM: Failed to allocate LZO page\n"); | |
081a9d04 BS |
678 | ret = -ENOMEM; |
679 | goto out_clean; | |
f996fc96 BS |
680 | } |
681 | ||
081a9d04 BS |
682 | data = vmalloc(sizeof(*data) * nr_threads); |
683 | if (!data) { | |
684 | printk(KERN_ERR "PM: Failed to allocate LZO data\n"); | |
685 | ret = -ENOMEM; | |
686 | goto out_clean; | |
f996fc96 | 687 | } |
081a9d04 BS |
688 | for (thr = 0; thr < nr_threads; thr++) |
689 | memset(&data[thr], 0, offsetof(struct cmp_data, go)); | |
f996fc96 | 690 | |
081a9d04 BS |
691 | crc = kmalloc(sizeof(*crc), GFP_KERNEL); |
692 | if (!crc) { | |
693 | printk(KERN_ERR "PM: Failed to allocate crc\n"); | |
694 | ret = -ENOMEM; | |
695 | goto out_clean; | |
696 | } | |
697 | memset(crc, 0, offsetof(struct crc_data, go)); | |
698 | ||
699 | /* | |
700 | * Start the compression threads. | |
701 | */ | |
702 | for (thr = 0; thr < nr_threads; thr++) { | |
703 | init_waitqueue_head(&data[thr].go); | |
704 | init_waitqueue_head(&data[thr].done); | |
705 | ||
706 | data[thr].thr = kthread_run(lzo_compress_threadfn, | |
707 | &data[thr], | |
708 | "image_compress/%u", thr); | |
709 | if (IS_ERR(data[thr].thr)) { | |
710 | data[thr].thr = NULL; | |
711 | printk(KERN_ERR | |
712 | "PM: Cannot start compression threads\n"); | |
713 | ret = -ENOMEM; | |
714 | goto out_clean; | |
715 | } | |
f996fc96 BS |
716 | } |
717 | ||
081a9d04 BS |
718 | /* |
719 | * Start the CRC32 thread. | |
720 | */ | |
721 | init_waitqueue_head(&crc->go); | |
722 | init_waitqueue_head(&crc->done); | |
723 | ||
724 | handle->crc32 = 0; | |
725 | crc->crc32 = &handle->crc32; | |
726 | for (thr = 0; thr < nr_threads; thr++) { | |
727 | crc->unc[thr] = data[thr].unc; | |
728 | crc->unc_len[thr] = &data[thr].unc_len; | |
729 | } | |
730 | ||
731 | crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32"); | |
732 | if (IS_ERR(crc->thr)) { | |
733 | crc->thr = NULL; | |
734 | printk(KERN_ERR "PM: Cannot start CRC32 thread\n"); | |
735 | ret = -ENOMEM; | |
736 | goto out_clean; | |
f996fc96 BS |
737 | } |
738 | ||
5a21d489 BS |
739 | /* |
740 | * Adjust the number of required free pages after all allocations have | |
741 | * been done. We don't want to run out of pages when writing. | |
742 | */ | |
743 | handle->reqd_free_pages = reqd_free_pages(); | |
744 | ||
f996fc96 | 745 | printk(KERN_INFO |
081a9d04 | 746 | "PM: Using %u thread(s) for compression.\n" |
d8150d35 | 747 | "PM: Compressing and saving image data (%u pages)...\n", |
081a9d04 | 748 | nr_threads, nr_to_write); |
d8150d35 | 749 | m = nr_to_write / 10; |
f996fc96 BS |
750 | if (!m) |
751 | m = 1; | |
752 | nr_pages = 0; | |
db597605 | 753 | start = ktime_get(); |
f996fc96 | 754 | for (;;) { |
081a9d04 BS |
755 | for (thr = 0; thr < nr_threads; thr++) { |
756 | for (off = 0; off < LZO_UNC_SIZE; off += PAGE_SIZE) { | |
757 | ret = snapshot_read_next(snapshot); | |
758 | if (ret < 0) | |
759 | goto out_finish; | |
760 | ||
761 | if (!ret) | |
762 | break; | |
763 | ||
764 | memcpy(data[thr].unc + off, | |
765 | data_of(*snapshot), PAGE_SIZE); | |
766 | ||
767 | if (!(nr_pages % m)) | |
d8150d35 BS |
768 | printk(KERN_INFO |
769 | "PM: Image saving progress: " | |
770 | "%3d%%\n", | |
771 | nr_pages / m * 10); | |
081a9d04 BS |
772 | nr_pages++; |
773 | } | |
774 | if (!off) | |
f996fc96 BS |
775 | break; |
776 | ||
081a9d04 | 777 | data[thr].unc_len = off; |
f996fc96 | 778 | |
081a9d04 BS |
779 | atomic_set(&data[thr].ready, 1); |
780 | wake_up(&data[thr].go); | |
f996fc96 BS |
781 | } |
782 | ||
081a9d04 | 783 | if (!thr) |
f996fc96 BS |
784 | break; |
785 | ||
081a9d04 BS |
786 | crc->run_threads = thr; |
787 | atomic_set(&crc->ready, 1); | |
788 | wake_up(&crc->go); | |
f996fc96 | 789 | |
081a9d04 BS |
790 | for (run_threads = thr, thr = 0; thr < run_threads; thr++) { |
791 | wait_event(data[thr].done, | |
792 | atomic_read(&data[thr].stop)); | |
793 | atomic_set(&data[thr].stop, 0); | |
f996fc96 | 794 | |
081a9d04 | 795 | ret = data[thr].ret; |
f996fc96 | 796 | |
081a9d04 BS |
797 | if (ret < 0) { |
798 | printk(KERN_ERR "PM: LZO compression failed\n"); | |
799 | goto out_finish; | |
800 | } | |
f996fc96 | 801 | |
081a9d04 BS |
802 | if (unlikely(!data[thr].cmp_len || |
803 | data[thr].cmp_len > | |
804 | lzo1x_worst_compress(data[thr].unc_len))) { | |
805 | printk(KERN_ERR | |
806 | "PM: Invalid LZO compressed length\n"); | |
807 | ret = -1; | |
f996fc96 | 808 | goto out_finish; |
081a9d04 BS |
809 | } |
810 | ||
811 | *(size_t *)data[thr].cmp = data[thr].cmp_len; | |
812 | ||
813 | /* | |
814 | * Given we are writing one page at a time to disk, we | |
815 | * copy that much from the buffer, although the last | |
816 | * bit will likely be smaller than full page. This is | |
817 | * OK - we saved the length of the compressed data, so | |
818 | * any garbage at the end will be discarded when we | |
819 | * read it. | |
820 | */ | |
821 | for (off = 0; | |
822 | off < LZO_HEADER + data[thr].cmp_len; | |
823 | off += PAGE_SIZE) { | |
824 | memcpy(page, data[thr].cmp + off, PAGE_SIZE); | |
825 | ||
343df3c7 | 826 | ret = swap_write_page(handle, page, &hb); |
081a9d04 BS |
827 | if (ret) |
828 | goto out_finish; | |
829 | } | |
f996fc96 | 830 | } |
081a9d04 BS |
831 | |
832 | wait_event(crc->done, atomic_read(&crc->stop)); | |
833 | atomic_set(&crc->stop, 0); | |
f996fc96 BS |
834 | } |
835 | ||
836 | out_finish: | |
343df3c7 | 837 | err2 = hib_wait_io(&hb); |
db597605 | 838 | stop = ktime_get(); |
f996fc96 BS |
839 | if (!ret) |
840 | ret = err2; | |
d8150d35 BS |
841 | if (!ret) |
842 | printk(KERN_INFO "PM: Image saving done.\n"); | |
db597605 | 843 | swsusp_show_speed(start, stop, nr_to_write, "Wrote"); |
081a9d04 BS |
844 | out_clean: |
845 | if (crc) { | |
846 | if (crc->thr) | |
847 | kthread_stop(crc->thr); | |
848 | kfree(crc); | |
849 | } | |
850 | if (data) { | |
851 | for (thr = 0; thr < nr_threads; thr++) | |
852 | if (data[thr].thr) | |
853 | kthread_stop(data[thr].thr); | |
854 | vfree(data); | |
855 | } | |
856 | if (page) free_page((unsigned long)page); | |
f996fc96 BS |
857 | |
858 | return ret; | |
859 | } | |
860 | ||
61159a31 RW |
861 | /** |
862 | * enough_swap - Make sure we have enough swap to save the image. | |
863 | * | |
864 | * Returns TRUE or FALSE after checking the total amount of swap | |
865 | * space avaiable from the resume partition. | |
866 | */ | |
867 | ||
f996fc96 | 868 | static int enough_swap(unsigned int nr_pages, unsigned int flags) |
61159a31 RW |
869 | { |
870 | unsigned int free_swap = count_swap_pages(root_swap, 1); | |
f996fc96 | 871 | unsigned int required; |
61159a31 | 872 | |
23976728 | 873 | pr_debug("PM: Free swap pages: %u\n", free_swap); |
f996fc96 | 874 | |
ee34a370 | 875 | required = PAGES_FOR_IO + nr_pages; |
f996fc96 | 876 | return free_swap > required; |
61159a31 RW |
877 | } |
878 | ||
879 | /** | |
880 | * swsusp_write - Write entire image and metadata. | |
a634cc10 | 881 | * @flags: flags to pass to the "boot" kernel in the image header |
61159a31 RW |
882 | * |
883 | * It is important _NOT_ to umount filesystems at this point. We want | |
884 | * them synced (in case something goes wrong) but we DO not want to mark | |
885 | * filesystem clean: it is not. (And it does not matter, if we resume | |
886 | * correctly, we'll mark system clean, anyway.) | |
887 | */ | |
888 | ||
a634cc10 | 889 | int swsusp_write(unsigned int flags) |
61159a31 RW |
890 | { |
891 | struct swap_map_handle handle; | |
892 | struct snapshot_handle snapshot; | |
893 | struct swsusp_info *header; | |
6f612af5 | 894 | unsigned long pages; |
61159a31 RW |
895 | int error; |
896 | ||
6f612af5 JS |
897 | pages = snapshot_get_image_size(); |
898 | error = get_swap_writer(&handle); | |
3aef83e0 | 899 | if (error) { |
6f612af5 | 900 | printk(KERN_ERR "PM: Cannot get swap writer\n"); |
61159a31 RW |
901 | return error; |
902 | } | |
ee34a370 BS |
903 | if (flags & SF_NOCOMPRESS_MODE) { |
904 | if (!enough_swap(pages, flags)) { | |
905 | printk(KERN_ERR "PM: Not enough free swap\n"); | |
906 | error = -ENOSPC; | |
907 | goto out_finish; | |
908 | } | |
6f612af5 | 909 | } |
61159a31 | 910 | memset(&snapshot, 0, sizeof(struct snapshot_handle)); |
d3c1b24c | 911 | error = snapshot_read_next(&snapshot); |
3aef83e0 RW |
912 | if (error < PAGE_SIZE) { |
913 | if (error >= 0) | |
914 | error = -EFAULT; | |
915 | ||
6f612af5 | 916 | goto out_finish; |
3aef83e0 | 917 | } |
61159a31 | 918 | header = (struct swsusp_info *)data_of(snapshot); |
6f612af5 | 919 | error = swap_write_page(&handle, header, NULL); |
f996fc96 BS |
920 | if (!error) { |
921 | error = (flags & SF_NOCOMPRESS_MODE) ? | |
922 | save_image(&handle, &snapshot, pages - 1) : | |
923 | save_image_lzo(&handle, &snapshot, pages - 1); | |
924 | } | |
6f612af5 JS |
925 | out_finish: |
926 | error = swap_writer_finish(&handle, flags, error); | |
61159a31 RW |
927 | return error; |
928 | } | |
929 | ||
61159a31 RW |
930 | /** |
931 | * The following functions allow us to read data using a swap map | |
932 | * in a file-alike way | |
933 | */ | |
934 | ||
935 | static void release_swap_reader(struct swap_map_handle *handle) | |
936 | { | |
081a9d04 BS |
937 | struct swap_map_page_list *tmp; |
938 | ||
939 | while (handle->maps) { | |
940 | if (handle->maps->map) | |
941 | free_page((unsigned long)handle->maps->map); | |
942 | tmp = handle->maps; | |
943 | handle->maps = handle->maps->next; | |
944 | kfree(tmp); | |
945 | } | |
61159a31 RW |
946 | handle->cur = NULL; |
947 | } | |
948 | ||
6f612af5 JS |
949 | static int get_swap_reader(struct swap_map_handle *handle, |
950 | unsigned int *flags_p) | |
61159a31 RW |
951 | { |
952 | int error; | |
081a9d04 BS |
953 | struct swap_map_page_list *tmp, *last; |
954 | sector_t offset; | |
61159a31 | 955 | |
6f612af5 JS |
956 | *flags_p = swsusp_header->flags; |
957 | ||
958 | if (!swsusp_header->image) /* how can this happen? */ | |
61159a31 | 959 | return -EINVAL; |
3aef83e0 | 960 | |
081a9d04 BS |
961 | handle->cur = NULL; |
962 | last = handle->maps = NULL; | |
963 | offset = swsusp_header->image; | |
964 | while (offset) { | |
965 | tmp = kmalloc(sizeof(*handle->maps), GFP_KERNEL); | |
966 | if (!tmp) { | |
967 | release_swap_reader(handle); | |
968 | return -ENOMEM; | |
969 | } | |
970 | memset(tmp, 0, sizeof(*tmp)); | |
971 | if (!handle->maps) | |
972 | handle->maps = tmp; | |
973 | if (last) | |
974 | last->next = tmp; | |
975 | last = tmp; | |
976 | ||
977 | tmp->map = (struct swap_map_page *) | |
71baba4b | 978 | __get_free_page(__GFP_RECLAIM | __GFP_HIGH); |
081a9d04 BS |
979 | if (!tmp->map) { |
980 | release_swap_reader(handle); | |
981 | return -ENOMEM; | |
982 | } | |
3aef83e0 | 983 | |
343df3c7 | 984 | error = hib_submit_io(READ_SYNC, offset, tmp->map, NULL); |
081a9d04 BS |
985 | if (error) { |
986 | release_swap_reader(handle); | |
987 | return error; | |
988 | } | |
989 | offset = tmp->map->next_swap; | |
61159a31 RW |
990 | } |
991 | handle->k = 0; | |
081a9d04 | 992 | handle->cur = handle->maps->map; |
61159a31 RW |
993 | return 0; |
994 | } | |
995 | ||
546e0d27 | 996 | static int swap_read_page(struct swap_map_handle *handle, void *buf, |
343df3c7 | 997 | struct hib_bio_batch *hb) |
61159a31 | 998 | { |
3aef83e0 | 999 | sector_t offset; |
61159a31 | 1000 | int error; |
081a9d04 | 1001 | struct swap_map_page_list *tmp; |
61159a31 RW |
1002 | |
1003 | if (!handle->cur) | |
1004 | return -EINVAL; | |
1005 | offset = handle->cur->entries[handle->k]; | |
1006 | if (!offset) | |
1007 | return -EFAULT; | |
343df3c7 | 1008 | error = hib_submit_io(READ_SYNC, offset, buf, hb); |
61159a31 RW |
1009 | if (error) |
1010 | return error; | |
1011 | if (++handle->k >= MAP_PAGE_ENTRIES) { | |
1012 | handle->k = 0; | |
081a9d04 BS |
1013 | free_page((unsigned long)handle->maps->map); |
1014 | tmp = handle->maps; | |
1015 | handle->maps = handle->maps->next; | |
1016 | kfree(tmp); | |
1017 | if (!handle->maps) | |
61159a31 | 1018 | release_swap_reader(handle); |
081a9d04 BS |
1019 | else |
1020 | handle->cur = handle->maps->map; | |
61159a31 RW |
1021 | } |
1022 | return error; | |
1023 | } | |
1024 | ||
/* Release everything still held by the reader @handle; always returns 0. */
static int swap_reader_finish(struct swap_map_handle *handle)
{
	release_swap_reader(handle);
	return 0;
}
1031 | ||
61159a31 RW |
1032 | /** |
1033 | * load_image - load the image using the swap map handle | |
1034 | * @handle and the snapshot handle @snapshot | |
1035 | * (assume there are @nr_pages pages to load) | |
1036 | */ | |
1037 | ||
1038 | static int load_image(struct swap_map_handle *handle, | |
1039 | struct snapshot_handle *snapshot, | |
546e0d27 | 1040 | unsigned int nr_to_read) |
61159a31 RW |
1041 | { |
1042 | unsigned int m; | |
081a9d04 | 1043 | int ret = 0; |
db597605 TR |
1044 | ktime_t start; |
1045 | ktime_t stop; | |
343df3c7 | 1046 | struct hib_bio_batch hb; |
546e0d27 AM |
1047 | int err2; |
1048 | unsigned nr_pages; | |
61159a31 | 1049 | |
343df3c7 CH |
1050 | hib_init_batch(&hb); |
1051 | ||
d8150d35 | 1052 | printk(KERN_INFO "PM: Loading image data pages (%u pages)...\n", |
23976728 | 1053 | nr_to_read); |
d8150d35 | 1054 | m = nr_to_read / 10; |
61159a31 RW |
1055 | if (!m) |
1056 | m = 1; | |
1057 | nr_pages = 0; | |
db597605 | 1058 | start = ktime_get(); |
546e0d27 | 1059 | for ( ; ; ) { |
081a9d04 BS |
1060 | ret = snapshot_write_next(snapshot); |
1061 | if (ret <= 0) | |
546e0d27 | 1062 | break; |
343df3c7 | 1063 | ret = swap_read_page(handle, data_of(*snapshot), &hb); |
081a9d04 | 1064 | if (ret) |
546e0d27 AM |
1065 | break; |
1066 | if (snapshot->sync_read) | |
343df3c7 | 1067 | ret = hib_wait_io(&hb); |
081a9d04 | 1068 | if (ret) |
546e0d27 AM |
1069 | break; |
1070 | if (!(nr_pages % m)) | |
d8150d35 BS |
1071 | printk(KERN_INFO "PM: Image loading progress: %3d%%\n", |
1072 | nr_pages / m * 10); | |
546e0d27 AM |
1073 | nr_pages++; |
1074 | } | |
343df3c7 | 1075 | err2 = hib_wait_io(&hb); |
db597605 | 1076 | stop = ktime_get(); |
081a9d04 BS |
1077 | if (!ret) |
1078 | ret = err2; | |
1079 | if (!ret) { | |
d8150d35 | 1080 | printk(KERN_INFO "PM: Image loading done.\n"); |
8357376d | 1081 | snapshot_write_finalize(snapshot); |
e655a250 | 1082 | if (!snapshot_image_loaded(snapshot)) |
081a9d04 | 1083 | ret = -ENODATA; |
d8150d35 | 1084 | } |
db597605 | 1085 | swsusp_show_speed(start, stop, nr_to_read, "Read"); |
081a9d04 BS |
1086 | return ret; |
1087 | } | |
1088 | ||
1089 | /** | |
1090 | * Structure used for LZO data decompression. | |
 * One instance is handed to each lzo_decompress_threadfn() worker.
 * load_image_lzo() zeroes only the members that precede @go, using
 * offsetof(struct dec_data, go), so the member order matters.
1091 | */ | |
1092 | struct dec_data { | |
1093 | struct task_struct *thr; /* worker thread; set to NULL by the worker when it is told to stop */ | |
1094 | atomic_t ready; /* set by the loader to start a run, cleared by the worker */ | |
1095 | atomic_t stop; /* set by the worker when a run has finished, cleared by the loader */ | |
1096 | int ret; /* lzo1x_decompress_safe() result, or -1 when the worker was stopped */ | |
1097 | wait_queue_head_t go; /* worker waits here for ready or a stop request */ | |
1098 | wait_queue_head_t done; /* loader waits here for stop to be set */ | |
1099 | size_t unc_len; /* uncompressed length; preset to LZO_UNC_SIZE before each run */ | |
1100 | size_t cmp_len; /* compressed length, taken from the start of the chunk */ | |
1101 | unsigned char unc[LZO_UNC_SIZE]; /* uncompressed buffer */ | |
1102 | unsigned char cmp[LZO_CMP_SIZE]; /* compressed buffer; payload begins at offset LZO_HEADER */ | |
1103 | }; | |
1104 | ||
1105 | /** | |
1106 | * Deompression function that runs in its own thread. | |
1107 | */ | |
1108 | static int lzo_decompress_threadfn(void *data) | |
1109 | { | |
1110 | struct dec_data *d = data; | |
1111 | ||
1112 | while (1) { | |
1113 | wait_event(d->go, atomic_read(&d->ready) || | |
1114 | kthread_should_stop()); | |
1115 | if (kthread_should_stop()) { | |
1116 | d->thr = NULL; | |
1117 | d->ret = -1; | |
1118 | atomic_set(&d->stop, 1); | |
1119 | wake_up(&d->done); | |
1120 | break; | |
1121 | } | |
1122 | atomic_set(&d->ready, 0); | |
1123 | ||
1124 | d->unc_len = LZO_UNC_SIZE; | |
1125 | d->ret = lzo1x_decompress_safe(d->cmp + LZO_HEADER, d->cmp_len, | |
1126 | d->unc, &d->unc_len); | |
1127 | atomic_set(&d->stop, 1); | |
1128 | wake_up(&d->done); | |
1129 | } | |
1130 | return 0; | |
61159a31 RW |
1131 | } |
1132 | ||
f996fc96 BS |
1133 | /** |
1134 | * load_image_lzo - Load compressed image data and decompress them with LZO. | |
1135 | * @handle: Swap map handle to use for loading data. | |
1136 | * @snapshot: Image to copy uncompressed data into. | |
1137 | * @nr_to_read: Number of pages to load. | |
1138 | */ | |
1139 | static int load_image_lzo(struct swap_map_handle *handle, | |
1140 | struct snapshot_handle *snapshot, | |
1141 | unsigned int nr_to_read) | |
1142 | { | |
1143 | unsigned int m; | |
081a9d04 BS |
1144 | int ret = 0; |
1145 | int eof = 0; | |
343df3c7 | 1146 | struct hib_bio_batch hb; |
db597605 TR |
1147 | ktime_t start; |
1148 | ktime_t stop; | |
f996fc96 | 1149 | unsigned nr_pages; |
081a9d04 BS |
1150 | size_t off; |
1151 | unsigned i, thr, run_threads, nr_threads; | |
1152 | unsigned ring = 0, pg = 0, ring_size = 0, | |
1153 | have = 0, want, need, asked = 0; | |
5a21d489 | 1154 | unsigned long read_pages = 0; |
081a9d04 BS |
1155 | unsigned char **page = NULL; |
1156 | struct dec_data *data = NULL; | |
1157 | struct crc_data *crc = NULL; | |
1158 | ||
343df3c7 CH |
1159 | hib_init_batch(&hb); |
1160 | ||
081a9d04 BS |
1161 | /* |
1162 | * We'll limit the number of threads for decompression to limit memory | |
1163 | * footprint. | |
1164 | */ | |
1165 | nr_threads = num_online_cpus() - 1; | |
1166 | nr_threads = clamp_val(nr_threads, 1, LZO_THREADS); | |
1167 | ||
5a21d489 | 1168 | page = vmalloc(sizeof(*page) * LZO_MAX_RD_PAGES); |
081a9d04 BS |
1169 | if (!page) { |
1170 | printk(KERN_ERR "PM: Failed to allocate LZO page\n"); | |
1171 | ret = -ENOMEM; | |
1172 | goto out_clean; | |
1173 | } | |
9f339caf | 1174 | |
081a9d04 BS |
1175 | data = vmalloc(sizeof(*data) * nr_threads); |
1176 | if (!data) { | |
1177 | printk(KERN_ERR "PM: Failed to allocate LZO data\n"); | |
1178 | ret = -ENOMEM; | |
1179 | goto out_clean; | |
1180 | } | |
1181 | for (thr = 0; thr < nr_threads; thr++) | |
1182 | memset(&data[thr], 0, offsetof(struct dec_data, go)); | |
9f339caf | 1183 | |
081a9d04 BS |
1184 | crc = kmalloc(sizeof(*crc), GFP_KERNEL); |
1185 | if (!crc) { | |
1186 | printk(KERN_ERR "PM: Failed to allocate crc\n"); | |
1187 | ret = -ENOMEM; | |
1188 | goto out_clean; | |
1189 | } | |
1190 | memset(crc, 0, offsetof(struct crc_data, go)); | |
1191 | ||
1192 | /* | |
1193 | * Start the decompression threads. | |
1194 | */ | |
1195 | for (thr = 0; thr < nr_threads; thr++) { | |
1196 | init_waitqueue_head(&data[thr].go); | |
1197 | init_waitqueue_head(&data[thr].done); | |
1198 | ||
1199 | data[thr].thr = kthread_run(lzo_decompress_threadfn, | |
1200 | &data[thr], | |
1201 | "image_decompress/%u", thr); | |
1202 | if (IS_ERR(data[thr].thr)) { | |
1203 | data[thr].thr = NULL; | |
1204 | printk(KERN_ERR | |
1205 | "PM: Cannot start decompression threads\n"); | |
1206 | ret = -ENOMEM; | |
1207 | goto out_clean; | |
9f339caf | 1208 | } |
f996fc96 BS |
1209 | } |
1210 | ||
081a9d04 BS |
1211 | /* |
1212 | * Start the CRC32 thread. | |
1213 | */ | |
1214 | init_waitqueue_head(&crc->go); | |
1215 | init_waitqueue_head(&crc->done); | |
1216 | ||
1217 | handle->crc32 = 0; | |
1218 | crc->crc32 = &handle->crc32; | |
1219 | for (thr = 0; thr < nr_threads; thr++) { | |
1220 | crc->unc[thr] = data[thr].unc; | |
1221 | crc->unc_len[thr] = &data[thr].unc_len; | |
f996fc96 BS |
1222 | } |
1223 | ||
081a9d04 BS |
1224 | crc->thr = kthread_run(crc32_threadfn, crc, "image_crc32"); |
1225 | if (IS_ERR(crc->thr)) { | |
1226 | crc->thr = NULL; | |
1227 | printk(KERN_ERR "PM: Cannot start CRC32 thread\n"); | |
1228 | ret = -ENOMEM; | |
1229 | goto out_clean; | |
1230 | } | |
9f339caf | 1231 | |
081a9d04 | 1232 | /* |
5a21d489 BS |
1233 | * Set the number of pages for read buffering. |
1234 | * This is complete guesswork, because we'll only know the real | |
1235 | * picture once prepare_image() is called, which is much later on | |
1236 | * during the image load phase. We'll assume the worst case and | |
1237 | * say that none of the image pages are from high memory. | |
081a9d04 | 1238 | */ |
5a21d489 BS |
1239 | if (low_free_pages() > snapshot_get_image_size()) |
1240 | read_pages = (low_free_pages() - snapshot_get_image_size()) / 2; | |
1241 | read_pages = clamp_val(read_pages, LZO_MIN_RD_PAGES, LZO_MAX_RD_PAGES); | |
9f339caf | 1242 | |
081a9d04 BS |
1243 | for (i = 0; i < read_pages; i++) { |
1244 | page[i] = (void *)__get_free_page(i < LZO_CMP_PAGES ? | |
71baba4b MG |
1245 | __GFP_RECLAIM | __GFP_HIGH : |
1246 | __GFP_RECLAIM | __GFP_NOWARN | | |
1247 | __GFP_NORETRY); | |
5a21d489 | 1248 | |
081a9d04 BS |
1249 | if (!page[i]) { |
1250 | if (i < LZO_CMP_PAGES) { | |
1251 | ring_size = i; | |
1252 | printk(KERN_ERR | |
1253 | "PM: Failed to allocate LZO pages\n"); | |
1254 | ret = -ENOMEM; | |
1255 | goto out_clean; | |
1256 | } else { | |
1257 | break; | |
1258 | } | |
1259 | } | |
f996fc96 | 1260 | } |
081a9d04 | 1261 | want = ring_size = i; |
f996fc96 BS |
1262 | |
1263 | printk(KERN_INFO | |
081a9d04 | 1264 | "PM: Using %u thread(s) for decompression.\n" |
d8150d35 | 1265 | "PM: Loading and decompressing image data (%u pages)...\n", |
081a9d04 | 1266 | nr_threads, nr_to_read); |
d8150d35 | 1267 | m = nr_to_read / 10; |
f996fc96 BS |
1268 | if (!m) |
1269 | m = 1; | |
1270 | nr_pages = 0; | |
db597605 | 1271 | start = ktime_get(); |
f996fc96 | 1272 | |
081a9d04 BS |
1273 | ret = snapshot_write_next(snapshot); |
1274 | if (ret <= 0) | |
f996fc96 BS |
1275 | goto out_finish; |
1276 | ||
081a9d04 BS |
1277 | for(;;) { |
1278 | for (i = 0; !eof && i < want; i++) { | |
343df3c7 | 1279 | ret = swap_read_page(handle, page[ring], &hb); |
081a9d04 BS |
1280 | if (ret) { |
1281 | /* | |
1282 | * On real read error, finish. On end of data, | |
1283 | * set EOF flag and just exit the read loop. | |
1284 | */ | |
1285 | if (handle->cur && | |
1286 | handle->cur->entries[handle->k]) { | |
1287 | goto out_finish; | |
1288 | } else { | |
1289 | eof = 1; | |
1290 | break; | |
1291 | } | |
1292 | } | |
1293 | if (++ring >= ring_size) | |
1294 | ring = 0; | |
f996fc96 | 1295 | } |
081a9d04 BS |
1296 | asked += i; |
1297 | want -= i; | |
f996fc96 | 1298 | |
081a9d04 BS |
1299 | /* |
1300 | * We are out of data, wait for some more. | |
1301 | */ | |
1302 | if (!have) { | |
1303 | if (!asked) | |
1304 | break; | |
1305 | ||
343df3c7 | 1306 | ret = hib_wait_io(&hb); |
081a9d04 | 1307 | if (ret) |
f996fc96 | 1308 | goto out_finish; |
081a9d04 BS |
1309 | have += asked; |
1310 | asked = 0; | |
1311 | if (eof) | |
1312 | eof = 2; | |
9f339caf | 1313 | } |
f996fc96 | 1314 | |
081a9d04 BS |
1315 | if (crc->run_threads) { |
1316 | wait_event(crc->done, atomic_read(&crc->stop)); | |
1317 | atomic_set(&crc->stop, 0); | |
1318 | crc->run_threads = 0; | |
f996fc96 BS |
1319 | } |
1320 | ||
081a9d04 BS |
1321 | for (thr = 0; have && thr < nr_threads; thr++) { |
1322 | data[thr].cmp_len = *(size_t *)page[pg]; | |
1323 | if (unlikely(!data[thr].cmp_len || | |
1324 | data[thr].cmp_len > | |
1325 | lzo1x_worst_compress(LZO_UNC_SIZE))) { | |
1326 | printk(KERN_ERR | |
1327 | "PM: Invalid LZO compressed length\n"); | |
1328 | ret = -1; | |
1329 | goto out_finish; | |
1330 | } | |
1331 | ||
1332 | need = DIV_ROUND_UP(data[thr].cmp_len + LZO_HEADER, | |
1333 | PAGE_SIZE); | |
1334 | if (need > have) { | |
1335 | if (eof > 1) { | |
1336 | ret = -1; | |
1337 | goto out_finish; | |
1338 | } | |
1339 | break; | |
1340 | } | |
1341 | ||
1342 | for (off = 0; | |
1343 | off < LZO_HEADER + data[thr].cmp_len; | |
1344 | off += PAGE_SIZE) { | |
1345 | memcpy(data[thr].cmp + off, | |
1346 | page[pg], PAGE_SIZE); | |
1347 | have--; | |
1348 | want++; | |
1349 | if (++pg >= ring_size) | |
1350 | pg = 0; | |
1351 | } | |
1352 | ||
1353 | atomic_set(&data[thr].ready, 1); | |
1354 | wake_up(&data[thr].go); | |
f996fc96 BS |
1355 | } |
1356 | ||
081a9d04 BS |
1357 | /* |
1358 | * Wait for more data while we are decompressing. | |
1359 | */ | |
1360 | if (have < LZO_CMP_PAGES && asked) { | |
343df3c7 | 1361 | ret = hib_wait_io(&hb); |
081a9d04 BS |
1362 | if (ret) |
1363 | goto out_finish; | |
1364 | have += asked; | |
1365 | asked = 0; | |
1366 | if (eof) | |
1367 | eof = 2; | |
f996fc96 BS |
1368 | } |
1369 | ||
081a9d04 BS |
1370 | for (run_threads = thr, thr = 0; thr < run_threads; thr++) { |
1371 | wait_event(data[thr].done, | |
1372 | atomic_read(&data[thr].stop)); | |
1373 | atomic_set(&data[thr].stop, 0); | |
1374 | ||
1375 | ret = data[thr].ret; | |
f996fc96 | 1376 | |
081a9d04 BS |
1377 | if (ret < 0) { |
1378 | printk(KERN_ERR | |
1379 | "PM: LZO decompression failed\n"); | |
1380 | goto out_finish; | |
1381 | } | |
f996fc96 | 1382 | |
081a9d04 BS |
1383 | if (unlikely(!data[thr].unc_len || |
1384 | data[thr].unc_len > LZO_UNC_SIZE || | |
1385 | data[thr].unc_len & (PAGE_SIZE - 1))) { | |
1386 | printk(KERN_ERR | |
1387 | "PM: Invalid LZO uncompressed length\n"); | |
1388 | ret = -1; | |
f996fc96 | 1389 | goto out_finish; |
081a9d04 BS |
1390 | } |
1391 | ||
1392 | for (off = 0; | |
1393 | off < data[thr].unc_len; off += PAGE_SIZE) { | |
1394 | memcpy(data_of(*snapshot), | |
1395 | data[thr].unc + off, PAGE_SIZE); | |
1396 | ||
1397 | if (!(nr_pages % m)) | |
d8150d35 BS |
1398 | printk(KERN_INFO |
1399 | "PM: Image loading progress: " | |
1400 | "%3d%%\n", | |
1401 | nr_pages / m * 10); | |
081a9d04 BS |
1402 | nr_pages++; |
1403 | ||
1404 | ret = snapshot_write_next(snapshot); | |
1405 | if (ret <= 0) { | |
1406 | crc->run_threads = thr + 1; | |
1407 | atomic_set(&crc->ready, 1); | |
1408 | wake_up(&crc->go); | |
1409 | goto out_finish; | |
1410 | } | |
1411 | } | |
f996fc96 | 1412 | } |
081a9d04 BS |
1413 | |
1414 | crc->run_threads = thr; | |
1415 | atomic_set(&crc->ready, 1); | |
1416 | wake_up(&crc->go); | |
f996fc96 BS |
1417 | } |
1418 | ||
1419 | out_finish: | |
081a9d04 BS |
1420 | if (crc->run_threads) { |
1421 | wait_event(crc->done, atomic_read(&crc->stop)); | |
1422 | atomic_set(&crc->stop, 0); | |
1423 | } | |
db597605 | 1424 | stop = ktime_get(); |
081a9d04 | 1425 | if (!ret) { |
d8150d35 | 1426 | printk(KERN_INFO "PM: Image loading done.\n"); |
f996fc96 BS |
1427 | snapshot_write_finalize(snapshot); |
1428 | if (!snapshot_image_loaded(snapshot)) | |
081a9d04 BS |
1429 | ret = -ENODATA; |
1430 | if (!ret) { | |
1431 | if (swsusp_header->flags & SF_CRC32_MODE) { | |
1432 | if(handle->crc32 != swsusp_header->crc32) { | |
1433 | printk(KERN_ERR | |
1434 | "PM: Invalid image CRC32!\n"); | |
1435 | ret = -ENODATA; | |
1436 | } | |
1437 | } | |
1438 | } | |
d8150d35 | 1439 | } |
db597605 | 1440 | swsusp_show_speed(start, stop, nr_to_read, "Read"); |
081a9d04 BS |
1441 | out_clean: |
1442 | for (i = 0; i < ring_size; i++) | |
9f339caf | 1443 | free_page((unsigned long)page[i]); |
081a9d04 BS |
1444 | if (crc) { |
1445 | if (crc->thr) | |
1446 | kthread_stop(crc->thr); | |
1447 | kfree(crc); | |
1448 | } | |
1449 | if (data) { | |
1450 | for (thr = 0; thr < nr_threads; thr++) | |
1451 | if (data[thr].thr) | |
1452 | kthread_stop(data[thr].thr); | |
1453 | vfree(data); | |
1454 | } | |
6c45de0d | 1455 | vfree(page); |
f996fc96 | 1456 | |
081a9d04 | 1457 | return ret; |
f996fc96 BS |
1458 | } |
1459 | ||
a634cc10 RW |
1460 | /** |
1461 | * swsusp_read - read the hibernation image. | |
1462 | * @flags_p: flags passed by the "frozen" kernel in the image header should | |
b595076a | 1463 | * be written into this memory location |
a634cc10 RW |
1464 | */ |
1465 | ||
1466 | int swsusp_read(unsigned int *flags_p) | |
61159a31 RW |
1467 | { |
1468 | int error; | |
1469 | struct swap_map_handle handle; | |
1470 | struct snapshot_handle snapshot; | |
1471 | struct swsusp_info *header; | |
1472 | ||
61159a31 | 1473 | memset(&snapshot, 0, sizeof(struct snapshot_handle)); |
d3c1b24c | 1474 | error = snapshot_write_next(&snapshot); |
61159a31 RW |
1475 | if (error < PAGE_SIZE) |
1476 | return error < 0 ? error : -EFAULT; | |
1477 | header = (struct swsusp_info *)data_of(snapshot); | |
6f612af5 JS |
1478 | error = get_swap_reader(&handle, flags_p); |
1479 | if (error) | |
1480 | goto end; | |
61159a31 | 1481 | if (!error) |
546e0d27 | 1482 | error = swap_read_page(&handle, header, NULL); |
f996fc96 BS |
1483 | if (!error) { |
1484 | error = (*flags_p & SF_NOCOMPRESS_MODE) ? | |
1485 | load_image(&handle, &snapshot, header->pages - 1) : | |
1486 | load_image_lzo(&handle, &snapshot, header->pages - 1); | |
1487 | } | |
6f612af5 JS |
1488 | swap_reader_finish(&handle); |
1489 | end: | |
61159a31 | 1490 | if (!error) |
23976728 | 1491 | pr_debug("PM: Image successfully loaded\n"); |
61159a31 | 1492 | else |
23976728 | 1493 | pr_debug("PM: Error %d resuming\n", error); |
61159a31 RW |
1494 | return error; |
1495 | } | |
1496 | ||
1497 | /** | |
1498 | * swsusp_check - Check for swsusp signature in the resume device | |
1499 | */ | |
1500 | ||
1501 | int swsusp_check(void) | |
1502 | { | |
1503 | int error; | |
1504 | ||
d4d77629 TH |
1505 | hib_resume_bdev = blkdev_get_by_dev(swsusp_resume_device, |
1506 | FMODE_READ, NULL); | |
8a0d613f JS |
1507 | if (!IS_ERR(hib_resume_bdev)) { |
1508 | set_blocksize(hib_resume_bdev, PAGE_SIZE); | |
3ecb01df | 1509 | clear_page(swsusp_header); |
343df3c7 | 1510 | error = hib_submit_io(READ_SYNC, swsusp_resume_block, |
1b29c164 | 1511 | swsusp_header, NULL); |
9a154d9d | 1512 | if (error) |
76b57e61 | 1513 | goto put; |
9a154d9d | 1514 | |
3624eb04 | 1515 | if (!memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) { |
1b29c164 | 1516 | memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10); |
61159a31 | 1517 | /* Reset swap signature now */ |
343df3c7 | 1518 | error = hib_submit_io(WRITE_SYNC, swsusp_resume_block, |
1b29c164 | 1519 | swsusp_header, NULL); |
61159a31 | 1520 | } else { |
76b57e61 | 1521 | error = -EINVAL; |
61159a31 | 1522 | } |
76b57e61 JS |
1523 | |
1524 | put: | |
61159a31 | 1525 | if (error) |
8a0d613f | 1526 | blkdev_put(hib_resume_bdev, FMODE_READ); |
61159a31 | 1527 | else |
d0941ead | 1528 | pr_debug("PM: Image signature found, resuming\n"); |
61159a31 | 1529 | } else { |
8a0d613f | 1530 | error = PTR_ERR(hib_resume_bdev); |
61159a31 RW |
1531 | } |
1532 | ||
1533 | if (error) | |
d0941ead | 1534 | pr_debug("PM: Image not found (code %d)\n", error); |
61159a31 RW |
1535 | |
1536 | return error; | |
1537 | } | |
1538 | ||
1539 | /** | |
1540 | * swsusp_close - close swap device. | |
1541 | */ | |
1542 | ||
c2dd0dae | 1543 | void swsusp_close(fmode_t mode) |
61159a31 | 1544 | { |
8a0d613f | 1545 | if (IS_ERR(hib_resume_bdev)) { |
23976728 | 1546 | pr_debug("PM: Image device not initialised\n"); |
61159a31 RW |
1547 | return; |
1548 | } | |
1549 | ||
8a0d613f | 1550 | blkdev_put(hib_resume_bdev, mode); |
61159a31 | 1551 | } |
1b29c164 | 1552 | |
/**
 *      swsusp_unmark - Unmark swsusp signature in the resume device
 *
 *      Re-reads the header block and, if it carries HIBERNATE_SIG, writes
 *      the original signature back.  The swap pages of root_swap are
 *      freed in either case.  Returns the result of the write, or
 *      -ENODEV when the signature is not present.
 */

#ifdef CONFIG_SUSPEND
int swsusp_unmark(void)
{
	int error;

	/* The result of this read is not checked. */
	hib_submit_io(READ_SYNC, swsusp_resume_block, swsusp_header, NULL);

	if (memcmp(HIBERNATE_SIG, swsusp_header->sig, 10)) {
		printk(KERN_ERR "PM: Cannot find swsusp signature!\n");
		error = -ENODEV;
	} else {
		memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10);
		error = hib_submit_io(WRITE_SYNC, swsusp_resume_block,
		                      swsusp_header, NULL);
	}

	/*
	 * We just returned from suspend, we don't need the image any more.
	 */
	free_all_swap_pages(root_swap);

	return error;
}
#endif
1580 | ||
1b29c164 VG |
1581 | static int swsusp_header_init(void) |
1582 | { | |
1583 | swsusp_header = (struct swsusp_header*) __get_free_page(GFP_KERNEL); | |
1584 | if (!swsusp_header) | |
1585 | panic("Could not allocate memory for swsusp_header\n"); | |
1586 | return 0; | |
1587 | } | |
1588 | ||
1589 | core_initcall(swsusp_header_init); |