1 /* 2 * linux/kernel/power/swap.c 3 * 4 * This file provides functions for reading the suspend image from 5 * and writing it to a swap partition. 6 * 7 * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@suse.cz> 8 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl> 9 * 10 * This file is released under the GPLv2. 11 * 12 */ 13 14 #include <linux/module.h> 15 #include <linux/file.h> 16 #include <linux/delay.h> 17 #include <linux/bitops.h> 18 #include <linux/genhd.h> 19 #include <linux/device.h> 20 #include <linux/buffer_head.h> 21 #include <linux/bio.h> 22 #include <linux/blkdev.h> 23 #include <linux/swap.h> 24 #include <linux/swapops.h> 25 #include <linux/pm.h> 26 #include <linux/slab.h> 27 28 #include "power.h" 29 30 #define SWSUSP_SIG "S1SUSPEND" 31 32 struct swsusp_header { 33 char reserved[PAGE_SIZE - 20 - sizeof(sector_t) - sizeof(int)]; 34 sector_t image; 35 unsigned int flags; /* Flags to pass to the "boot" kernel */ 36 char orig_sig[10]; 37 char sig[10]; 38 } __attribute__((packed)); 39 40 static struct swsusp_header *swsusp_header; 41 42 /** 43 * The following functions are used for tracing the allocated 44 * swap pages, so that they can be freed in case of an error. 45 */ 46 47 struct swsusp_extent { 48 struct rb_node node; 49 unsigned long start; 50 unsigned long end; 51 }; 52 53 static struct rb_root swsusp_extents = RB_ROOT; 54 55 static int swsusp_extents_insert(unsigned long swap_offset) 56 { 57 struct rb_node **new = &(swsusp_extents.rb_node); 58 struct rb_node *parent = NULL; 59 struct swsusp_extent *ext; 60 61 /* Figure out where to put the new node */ 62 while (*new) { 63 ext = container_of(*new, struct swsusp_extent, node); 64 parent = *new; 65 if (swap_offset < ext->start) { 66 /* Try to merge */ 67 if (swap_offset == ext->start - 1) { 68 ext->start--; 69 return 0; 70 } 71 new = &((*new)->rb_left); 72 } else if (swap_offset > ext->end) { 73 /* Try to merge */ 74 if (swap_offset == ext->end + 1) { 75 ext->end++; 76 return 0; 77 } 78 new = &((*new)->rb_right); 79 } else { 80 /* It already is in the tree */ 81 return -EINVAL; 82 } 83 } 84 /* Add the new node and rebalance the tree. */ 85 ext = kzalloc(sizeof(struct swsusp_extent), GFP_KERNEL); 86 if (!ext) 87 return -ENOMEM; 88 89 ext->start = swap_offset; 90 ext->end = swap_offset; 91 rb_link_node(&ext->node, parent, new); 92 rb_insert_color(&ext->node, &swsusp_extents); 93 return 0; 94 } 95 96 /** 97 * alloc_swapdev_block - allocate a swap page and register that it has 98 * been allocated, so that it can be freed in case of an error. 99 */ 100 101 sector_t alloc_swapdev_block(int swap) 102 { 103 unsigned long offset; 104 105 offset = swp_offset(get_swap_page_of_type(swap)); 106 if (offset) { 107 if (swsusp_extents_insert(offset)) 108 swap_free(swp_entry(swap, offset)); 109 else 110 return swapdev_block(swap, offset); 111 } 112 return 0; 113 } 114 115 /** 116 * free_all_swap_pages - free swap pages allocated for saving image data. 117 * It also frees the extents used to register which swap entres had been 118 * allocated. 119 */ 120 121 void free_all_swap_pages(int swap) 122 { 123 struct rb_node *node; 124 125 while ((node = swsusp_extents.rb_node)) { 126 struct swsusp_extent *ext; 127 unsigned long offset; 128 129 ext = container_of(node, struct swsusp_extent, node); 130 rb_erase(node, &swsusp_extents); 131 for (offset = ext->start; offset <= ext->end; offset++) 132 swap_free(swp_entry(swap, offset)); 133 134 kfree(ext); 135 } 136 } 137 138 int swsusp_swap_in_use(void) 139 { 140 return (swsusp_extents.rb_node != NULL); 141 } 142 143 /* 144 * General things 145 */ 146 147 static unsigned short root_swap = 0xffff; 148 static struct block_device *resume_bdev; 149 150 /** 151 * submit - submit BIO request. 152 * @rw: READ or WRITE. 153 * @off physical offset of page. 154 * @page: page we're reading or writing. 155 * @bio_chain: list of pending biod (for async reading) 156 * 157 * Straight from the textbook - allocate and initialize the bio. 158 * If we're reading, make sure the page is marked as dirty. 159 * Then submit it and, if @bio_chain == NULL, wait. 160 */ 161 static int submit(int rw, pgoff_t page_off, struct page *page, 162 struct bio **bio_chain) 163 { 164 const int bio_rw = rw | (1 << BIO_RW_SYNCIO) | (1 << BIO_RW_UNPLUG); 165 struct bio *bio; 166 167 bio = bio_alloc(__GFP_WAIT | __GFP_HIGH, 1); 168 bio->bi_sector = page_off * (PAGE_SIZE >> 9); 169 bio->bi_bdev = resume_bdev; 170 bio->bi_end_io = end_swap_bio_read; 171 172 if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) { 173 printk(KERN_ERR "PM: Adding page to bio failed at %ld\n", 174 page_off); 175 bio_put(bio); 176 return -EFAULT; 177 } 178 179 lock_page(page); 180 bio_get(bio); 181 182 if (bio_chain == NULL) { 183 submit_bio(bio_rw, bio); 184 wait_on_page_locked(page); 185 if (rw == READ) 186 bio_set_pages_dirty(bio); 187 bio_put(bio); 188 } else { 189 if (rw == READ) 190 get_page(page); /* These pages are freed later */ 191 bio->bi_private = *bio_chain; 192 *bio_chain = bio; 193 submit_bio(bio_rw, bio); 194 } 195 return 0; 196 } 197 198 static int bio_read_page(pgoff_t page_off, void *addr, struct bio **bio_chain) 199 { 200 return submit(READ, page_off, virt_to_page(addr), bio_chain); 201 } 202 203 static int bio_write_page(pgoff_t page_off, void *addr, struct bio **bio_chain) 204 { 205 return submit(WRITE, page_off, virt_to_page(addr), bio_chain); 206 } 207 208 static int wait_on_bio_chain(struct bio **bio_chain) 209 { 210 struct bio *bio; 211 struct bio *next_bio; 212 int ret = 0; 213 214 if (bio_chain == NULL) 215 return 0; 216 217 bio = *bio_chain; 218 if (bio == NULL) 219 return 0; 220 while (bio) { 221 struct page *page; 222 223 next_bio = bio->bi_private; 224 page = bio->bi_io_vec[0].bv_page; 225 wait_on_page_locked(page); 226 if (!PageUptodate(page) || PageError(page)) 227 ret = -EIO; 228 put_page(page); 229 bio_put(bio); 230 bio = next_bio; 231 } 232 *bio_chain = NULL; 233 return ret; 234 } 235 236 /* 237 * Saving part 238 */ 239 240 static int mark_swapfiles(sector_t start, unsigned int flags) 241 { 242 int error; 243 244 bio_read_page(swsusp_resume_block, swsusp_header, NULL); 245 if (!memcmp("SWAP-SPACE",swsusp_header->sig, 10) || 246 !memcmp("SWAPSPACE2",swsusp_header->sig, 10)) { 247 memcpy(swsusp_header->orig_sig,swsusp_header->sig, 10); 248 memcpy(swsusp_header->sig,SWSUSP_SIG, 10); 249 swsusp_header->image = start; 250 swsusp_header->flags = flags; 251 error = bio_write_page(swsusp_resume_block, 252 swsusp_header, NULL); 253 } else { 254 printk(KERN_ERR "PM: Swap header not found!\n"); 255 error = -ENODEV; 256 } 257 return error; 258 } 259 260 /** 261 * swsusp_swap_check - check if the resume device is a swap device 262 * and get its index (if so) 263 */ 264 265 static int swsusp_swap_check(void) /* This is called before saving image */ 266 { 267 int res; 268 269 res = swap_type_of(swsusp_resume_device, swsusp_resume_block, 270 &resume_bdev); 271 if (res < 0) 272 return res; 273 274 root_swap = res; 275 res = blkdev_get(resume_bdev, FMODE_WRITE); 276 if (res) 277 return res; 278 279 res = set_blocksize(resume_bdev, PAGE_SIZE); 280 if (res < 0) 281 blkdev_put(resume_bdev, FMODE_WRITE); 282 283 return res; 284 } 285 286 /** 287 * write_page - Write one page to given swap location. 288 * @buf: Address we're writing. 289 * @offset: Offset of the swap page we're writing to. 290 * @bio_chain: Link the next write BIO here 291 */ 292 293 static int write_page(void *buf, sector_t offset, struct bio **bio_chain) 294 { 295 void *src; 296 297 if (!offset) 298 return -ENOSPC; 299 300 if (bio_chain) { 301 src = (void *)__get_free_page(__GFP_WAIT | __GFP_HIGH); 302 if (src) { 303 memcpy(src, buf, PAGE_SIZE); 304 } else { 305 WARN_ON_ONCE(1); 306 bio_chain = NULL; /* Go synchronous */ 307 src = buf; 308 } 309 } else { 310 src = buf; 311 } 312 return bio_write_page(offset, src, bio_chain); 313 } 314 315 /* 316 * The swap map is a data structure used for keeping track of each page 317 * written to a swap partition. It consists of many swap_map_page 318 * structures that contain each an array of MAP_PAGE_SIZE swap entries. 319 * These structures are stored on the swap and linked together with the 320 * help of the .next_swap member. 321 * 322 * The swap map is created during suspend. The swap map pages are 323 * allocated and populated one at a time, so we only need one memory 324 * page to set up the entire structure. 325 * 326 * During resume we also only need to use one swap_map_page structure 327 * at a time. 328 */ 329 330 #define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(sector_t) - 1) 331 332 struct swap_map_page { 333 sector_t entries[MAP_PAGE_ENTRIES]; 334 sector_t next_swap; 335 }; 336 337 /** 338 * The swap_map_handle structure is used for handling swap in 339 * a file-alike way 340 */ 341 342 struct swap_map_handle { 343 struct swap_map_page *cur; 344 sector_t cur_swap; 345 unsigned int k; 346 }; 347 348 static void release_swap_writer(struct swap_map_handle *handle) 349 { 350 if (handle->cur) 351 free_page((unsigned long)handle->cur); 352 handle->cur = NULL; 353 } 354 355 static int get_swap_writer(struct swap_map_handle *handle) 356 { 357 handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_KERNEL); 358 if (!handle->cur) 359 return -ENOMEM; 360 handle->cur_swap = alloc_swapdev_block(root_swap); 361 if (!handle->cur_swap) { 362 release_swap_writer(handle); 363 return -ENOSPC; 364 } 365 handle->k = 0; 366 return 0; 367 } 368 369 static int swap_write_page(struct swap_map_handle *handle, void *buf, 370 struct bio **bio_chain) 371 { 372 int error = 0; 373 sector_t offset; 374 375 if (!handle->cur) 376 return -EINVAL; 377 offset = alloc_swapdev_block(root_swap); 378 error = write_page(buf, offset, bio_chain); 379 if (error) 380 return error; 381 handle->cur->entries[handle->k++] = offset; 382 if (handle->k >= MAP_PAGE_ENTRIES) { 383 error = wait_on_bio_chain(bio_chain); 384 if (error) 385 goto out; 386 offset = alloc_swapdev_block(root_swap); 387 if (!offset) 388 return -ENOSPC; 389 handle->cur->next_swap = offset; 390 error = write_page(handle->cur, handle->cur_swap, NULL); 391 if (error) 392 goto out; 393 memset(handle->cur, 0, PAGE_SIZE); 394 handle->cur_swap = offset; 395 handle->k = 0; 396 } 397 out: 398 return error; 399 } 400 401 static int flush_swap_writer(struct swap_map_handle *handle) 402 { 403 if (handle->cur && handle->cur_swap) 404 return write_page(handle->cur, handle->cur_swap, NULL); 405 else 406 return -EINVAL; 407 } 408 409 /** 410 * save_image - save the suspend image data 411 */ 412 413 static int save_image(struct swap_map_handle *handle, 414 struct snapshot_handle *snapshot, 415 unsigned int nr_to_write) 416 { 417 unsigned int m; 418 int ret; 419 int nr_pages; 420 int err2; 421 struct bio *bio; 422 struct timeval start; 423 struct timeval stop; 424 425 printk(KERN_INFO "PM: Saving image data pages (%u pages) ... ", 426 nr_to_write); 427 m = nr_to_write / 100; 428 if (!m) 429 m = 1; 430 nr_pages = 0; 431 bio = NULL; 432 do_gettimeofday(&start); 433 while (1) { 434 ret = snapshot_read_next(snapshot, PAGE_SIZE); 435 if (ret <= 0) 436 break; 437 ret = swap_write_page(handle, data_of(*snapshot), &bio); 438 if (ret) 439 break; 440 if (!(nr_pages % m)) 441 printk(KERN_CONT "\b\b\b\b%3d%%", nr_pages / m); 442 nr_pages++; 443 } 444 err2 = wait_on_bio_chain(&bio); 445 do_gettimeofday(&stop); 446 if (!ret) 447 ret = err2; 448 if (!ret) 449 printk(KERN_CONT "\b\b\b\bdone\n"); 450 else 451 printk(KERN_CONT "\n"); 452 swsusp_show_speed(&start, &stop, nr_to_write, "Wrote"); 453 return ret; 454 } 455 456 /** 457 * enough_swap - Make sure we have enough swap to save the image. 458 * 459 * Returns TRUE or FALSE after checking the total amount of swap 460 * space avaiable from the resume partition. 461 */ 462 463 static int enough_swap(unsigned int nr_pages) 464 { 465 unsigned int free_swap = count_swap_pages(root_swap, 1); 466 467 pr_debug("PM: Free swap pages: %u\n", free_swap); 468 return free_swap > nr_pages + PAGES_FOR_IO; 469 } 470 471 /** 472 * swsusp_write - Write entire image and metadata. 473 * @flags: flags to pass to the "boot" kernel in the image header 474 * 475 * It is important _NOT_ to umount filesystems at this point. We want 476 * them synced (in case something goes wrong) but we DO not want to mark 477 * filesystem clean: it is not. (And it does not matter, if we resume 478 * correctly, we'll mark system clean, anyway.) 479 */ 480 481 int swsusp_write(unsigned int flags) 482 { 483 struct swap_map_handle handle; 484 struct snapshot_handle snapshot; 485 struct swsusp_info *header; 486 int error; 487 488 error = swsusp_swap_check(); 489 if (error) { 490 printk(KERN_ERR "PM: Cannot find swap device, try " 491 "swapon -a.\n"); 492 return error; 493 } 494 memset(&snapshot, 0, sizeof(struct snapshot_handle)); 495 error = snapshot_read_next(&snapshot, PAGE_SIZE); 496 if (error < PAGE_SIZE) { 497 if (error >= 0) 498 error = -EFAULT; 499 500 goto out; 501 } 502 header = (struct swsusp_info *)data_of(snapshot); 503 if (!enough_swap(header->pages)) { 504 printk(KERN_ERR "PM: Not enough free swap\n"); 505 error = -ENOSPC; 506 goto out; 507 } 508 error = get_swap_writer(&handle); 509 if (!error) { 510 sector_t start = handle.cur_swap; 511 512 error = swap_write_page(&handle, header, NULL); 513 if (!error) 514 error = save_image(&handle, &snapshot, 515 header->pages - 1); 516 517 if (!error) { 518 flush_swap_writer(&handle); 519 printk(KERN_INFO "PM: S"); 520 error = mark_swapfiles(start, flags); 521 printk("|\n"); 522 } 523 } 524 if (error) 525 free_all_swap_pages(root_swap); 526 527 release_swap_writer(&handle); 528 out: 529 swsusp_close(FMODE_WRITE); 530 return error; 531 } 532 533 /** 534 * The following functions allow us to read data using a swap map 535 * in a file-alike way 536 */ 537 538 static void release_swap_reader(struct swap_map_handle *handle) 539 { 540 if (handle->cur) 541 free_page((unsigned long)handle->cur); 542 handle->cur = NULL; 543 } 544 545 static int get_swap_reader(struct swap_map_handle *handle, sector_t start) 546 { 547 int error; 548 549 if (!start) 550 return -EINVAL; 551 552 handle->cur = (struct swap_map_page *)get_zeroed_page(__GFP_WAIT | __GFP_HIGH); 553 if (!handle->cur) 554 return -ENOMEM; 555 556 error = bio_read_page(start, handle->cur, NULL); 557 if (error) { 558 release_swap_reader(handle); 559 return error; 560 } 561 handle->k = 0; 562 return 0; 563 } 564 565 static int swap_read_page(struct swap_map_handle *handle, void *buf, 566 struct bio **bio_chain) 567 { 568 sector_t offset; 569 int error; 570 571 if (!handle->cur) 572 return -EINVAL; 573 offset = handle->cur->entries[handle->k]; 574 if (!offset) 575 return -EFAULT; 576 error = bio_read_page(offset, buf, bio_chain); 577 if (error) 578 return error; 579 if (++handle->k >= MAP_PAGE_ENTRIES) { 580 error = wait_on_bio_chain(bio_chain); 581 handle->k = 0; 582 offset = handle->cur->next_swap; 583 if (!offset) 584 release_swap_reader(handle); 585 else if (!error) 586 error = bio_read_page(offset, handle->cur, NULL); 587 } 588 return error; 589 } 590 591 /** 592 * load_image - load the image using the swap map handle 593 * @handle and the snapshot handle @snapshot 594 * (assume there are @nr_pages pages to load) 595 */ 596 597 static int load_image(struct swap_map_handle *handle, 598 struct snapshot_handle *snapshot, 599 unsigned int nr_to_read) 600 { 601 unsigned int m; 602 int error = 0; 603 struct timeval start; 604 struct timeval stop; 605 struct bio *bio; 606 int err2; 607 unsigned nr_pages; 608 609 printk(KERN_INFO "PM: Loading image data pages (%u pages) ... ", 610 nr_to_read); 611 m = nr_to_read / 100; 612 if (!m) 613 m = 1; 614 nr_pages = 0; 615 bio = NULL; 616 do_gettimeofday(&start); 617 for ( ; ; ) { 618 error = snapshot_write_next(snapshot, PAGE_SIZE); 619 if (error <= 0) 620 break; 621 error = swap_read_page(handle, data_of(*snapshot), &bio); 622 if (error) 623 break; 624 if (snapshot->sync_read) 625 error = wait_on_bio_chain(&bio); 626 if (error) 627 break; 628 if (!(nr_pages % m)) 629 printk("\b\b\b\b%3d%%", nr_pages / m); 630 nr_pages++; 631 } 632 err2 = wait_on_bio_chain(&bio); 633 do_gettimeofday(&stop); 634 if (!error) 635 error = err2; 636 if (!error) { 637 printk("\b\b\b\bdone\n"); 638 snapshot_write_finalize(snapshot); 639 if (!snapshot_image_loaded(snapshot)) 640 error = -ENODATA; 641 } else 642 printk("\n"); 643 swsusp_show_speed(&start, &stop, nr_to_read, "Read"); 644 return error; 645 } 646 647 /** 648 * swsusp_read - read the hibernation image. 649 * @flags_p: flags passed by the "frozen" kernel in the image header should 650 * be written into this memeory location 651 */ 652 653 int swsusp_read(unsigned int *flags_p) 654 { 655 int error; 656 struct swap_map_handle handle; 657 struct snapshot_handle snapshot; 658 struct swsusp_info *header; 659 660 *flags_p = swsusp_header->flags; 661 662 memset(&snapshot, 0, sizeof(struct snapshot_handle)); 663 error = snapshot_write_next(&snapshot, PAGE_SIZE); 664 if (error < PAGE_SIZE) 665 return error < 0 ? error : -EFAULT; 666 header = (struct swsusp_info *)data_of(snapshot); 667 error = get_swap_reader(&handle, swsusp_header->image); 668 if (!error) 669 error = swap_read_page(&handle, header, NULL); 670 if (!error) 671 error = load_image(&handle, &snapshot, header->pages - 1); 672 release_swap_reader(&handle); 673 674 if (!error) 675 pr_debug("PM: Image successfully loaded\n"); 676 else 677 pr_debug("PM: Error %d resuming\n", error); 678 return error; 679 } 680 681 /** 682 * swsusp_check - Check for swsusp signature in the resume device 683 */ 684 685 int swsusp_check(void) 686 { 687 int error; 688 689 resume_bdev = open_by_devnum(swsusp_resume_device, FMODE_READ); 690 if (!IS_ERR(resume_bdev)) { 691 set_blocksize(resume_bdev, PAGE_SIZE); 692 memset(swsusp_header, 0, PAGE_SIZE); 693 error = bio_read_page(swsusp_resume_block, 694 swsusp_header, NULL); 695 if (error) 696 goto put; 697 698 if (!memcmp(SWSUSP_SIG, swsusp_header->sig, 10)) { 699 memcpy(swsusp_header->sig, swsusp_header->orig_sig, 10); 700 /* Reset swap signature now */ 701 error = bio_write_page(swsusp_resume_block, 702 swsusp_header, NULL); 703 } else { 704 error = -EINVAL; 705 } 706 707 put: 708 if (error) 709 blkdev_put(resume_bdev, FMODE_READ); 710 else 711 pr_debug("PM: Signature found, resuming\n"); 712 } else { 713 error = PTR_ERR(resume_bdev); 714 } 715 716 if (error) 717 pr_debug("PM: Error %d checking image file\n", error); 718 719 return error; 720 } 721 722 /** 723 * swsusp_close - close swap device. 724 */ 725 726 void swsusp_close(fmode_t mode) 727 { 728 if (IS_ERR(resume_bdev)) { 729 pr_debug("PM: Image device not initialised\n"); 730 return; 731 } 732 733 blkdev_put(resume_bdev, mode); 734 } 735 736 static int swsusp_header_init(void) 737 { 738 swsusp_header = (struct swsusp_header*) __get_free_page(GFP_KERNEL); 739 if (!swsusp_header) 740 panic("Could not allocate memory for swsusp_header\n"); 741 return 0; 742 } 743 744 core_initcall(swsusp_header_init); 745