swap.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635
  1. /*
  2. * linux/kernel/power/swap.c
  3. *
  4. * This file provides functions for reading the suspend image from
  5. * and writing it to a swap partition.
  6. *
  7. * Copyright (C) 1998,2001-2005 Pavel Machek <pavel@suse.cz>
  8. * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
  9. *
  10. * This file is released under the GPLv2.
  11. *
  12. */
  13. #include <linux/module.h>
  14. #include <linux/smp_lock.h>
  15. #include <linux/file.h>
  16. #include <linux/utsname.h>
  17. #include <linux/version.h>
  18. #include <linux/delay.h>
  19. #include <linux/bitops.h>
  20. #include <linux/genhd.h>
  21. #include <linux/device.h>
  22. #include <linux/buffer_head.h>
  23. #include <linux/bio.h>
  24. #include <linux/swap.h>
  25. #include <linux/swapops.h>
  26. #include <linux/pm.h>
  27. #include "power.h"
  28. extern char resume_file[];
  29. #define SWSUSP_SIG "S1SUSPEND"
  30. static struct swsusp_header {
  31. char reserved[PAGE_SIZE - 20 - sizeof(swp_entry_t)];
  32. swp_entry_t image;
  33. char orig_sig[10];
  34. char sig[10];
  35. } __attribute__((packed, aligned(PAGE_SIZE))) swsusp_header;
  36. /*
  37. * Saving part...
  38. */
  39. static unsigned short root_swap = 0xffff;
  40. static int mark_swapfiles(swp_entry_t start)
  41. {
  42. int error;
  43. rw_swap_page_sync(READ, swp_entry(root_swap, 0),
  44. virt_to_page((unsigned long)&swsusp_header), NULL);
  45. if (!memcmp("SWAP-SPACE",swsusp_header.sig, 10) ||
  46. !memcmp("SWAPSPACE2",swsusp_header.sig, 10)) {
  47. memcpy(swsusp_header.orig_sig,swsusp_header.sig, 10);
  48. memcpy(swsusp_header.sig,SWSUSP_SIG, 10);
  49. swsusp_header.image = start;
  50. error = rw_swap_page_sync(WRITE, swp_entry(root_swap, 0),
  51. virt_to_page((unsigned long)&swsusp_header),
  52. NULL);
  53. } else {
  54. pr_debug("swsusp: Partition is not swap space.\n");
  55. error = -ENODEV;
  56. }
  57. return error;
  58. }
  59. /**
  60. * swsusp_swap_check - check if the resume device is a swap device
  61. * and get its index (if so)
  62. */
  63. static int swsusp_swap_check(void) /* This is called before saving image */
  64. {
  65. int res = swap_type_of(swsusp_resume_device);
  66. if (res >= 0) {
  67. root_swap = res;
  68. return 0;
  69. }
  70. return res;
  71. }
  72. /**
  73. * write_page - Write one page to given swap location.
  74. * @buf: Address we're writing.
  75. * @offset: Offset of the swap page we're writing to.
  76. * @bio_chain: Link the next write BIO here
  77. */
  78. static int write_page(void *buf, unsigned long offset, struct bio **bio_chain)
  79. {
  80. swp_entry_t entry;
  81. int error = -ENOSPC;
  82. if (offset) {
  83. struct page *page = virt_to_page(buf);
  84. if (bio_chain) {
  85. /*
  86. * Whether or not we successfully allocated a copy page,
  87. * we take a ref on the page here. It gets undone in
  88. * wait_on_bio_chain().
  89. */
  90. struct page *page_copy;
  91. page_copy = alloc_page(GFP_ATOMIC);
  92. if (page_copy == NULL) {
  93. WARN_ON_ONCE(1);
  94. bio_chain = NULL; /* Go synchronous */
  95. get_page(page);
  96. } else {
  97. memcpy(page_address(page_copy),
  98. page_address(page), PAGE_SIZE);
  99. page = page_copy;
  100. }
  101. }
  102. entry = swp_entry(root_swap, offset);
  103. error = rw_swap_page_sync(WRITE, entry, page, bio_chain);
  104. }
  105. return error;
  106. }
  107. /*
  108. * The swap map is a data structure used for keeping track of each page
  109. * written to a swap partition. It consists of many swap_map_page
  110. * structures that contain each an array of MAP_PAGE_SIZE swap entries.
  111. * These structures are stored on the swap and linked together with the
  112. * help of the .next_swap member.
  113. *
  114. * The swap map is created during suspend. The swap map pages are
  115. * allocated and populated one at a time, so we only need one memory
  116. * page to set up the entire structure.
  117. *
  118. * During resume we also only need to use one swap_map_page structure
  119. * at a time.
  120. */
  121. #define MAP_PAGE_ENTRIES (PAGE_SIZE / sizeof(long) - 1)
  122. struct swap_map_page {
  123. unsigned long entries[MAP_PAGE_ENTRIES];
  124. unsigned long next_swap;
  125. };
  126. /**
  127. * The swap_map_handle structure is used for handling swap in
  128. * a file-alike way
  129. */
  130. struct swap_map_handle {
  131. struct swap_map_page *cur;
  132. unsigned long cur_swap;
  133. struct bitmap_page *bitmap;
  134. unsigned int k;
  135. };
  136. static void release_swap_writer(struct swap_map_handle *handle)
  137. {
  138. if (handle->cur)
  139. free_page((unsigned long)handle->cur);
  140. handle->cur = NULL;
  141. if (handle->bitmap)
  142. free_bitmap(handle->bitmap);
  143. handle->bitmap = NULL;
  144. }
  145. static void show_speed(struct timeval *start, struct timeval *stop,
  146. unsigned nr_pages, char *msg)
  147. {
  148. s64 elapsed_centisecs64;
  149. int centisecs;
  150. int k;
  151. int kps;
  152. elapsed_centisecs64 = timeval_to_ns(stop) - timeval_to_ns(start);
  153. do_div(elapsed_centisecs64, NSEC_PER_SEC / 100);
  154. centisecs = elapsed_centisecs64;
  155. if (centisecs == 0)
  156. centisecs = 1; /* avoid div-by-zero */
  157. k = nr_pages * (PAGE_SIZE / 1024);
  158. kps = (k * 100) / centisecs;
  159. printk("%s %d kbytes in %d.%02d seconds (%d.%02d MB/s)\n", msg, k,
  160. centisecs / 100, centisecs % 100,
  161. kps / 1000, (kps % 1000) / 10);
  162. }
  163. static int get_swap_writer(struct swap_map_handle *handle)
  164. {
  165. handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_KERNEL);
  166. if (!handle->cur)
  167. return -ENOMEM;
  168. handle->bitmap = alloc_bitmap(count_swap_pages(root_swap, 0));
  169. if (!handle->bitmap) {
  170. release_swap_writer(handle);
  171. return -ENOMEM;
  172. }
  173. handle->cur_swap = alloc_swap_page(root_swap, handle->bitmap);
  174. if (!handle->cur_swap) {
  175. release_swap_writer(handle);
  176. return -ENOSPC;
  177. }
  178. handle->k = 0;
  179. return 0;
  180. }
  181. static int wait_on_bio_chain(struct bio **bio_chain)
  182. {
  183. struct bio *bio;
  184. struct bio *next_bio;
  185. int ret = 0;
  186. if (bio_chain == NULL)
  187. return 0;
  188. bio = *bio_chain;
  189. while (bio) {
  190. struct page *page;
  191. next_bio = bio->bi_private;
  192. page = bio->bi_io_vec[0].bv_page;
  193. wait_on_page_locked(page);
  194. if (!PageUptodate(page) || PageError(page))
  195. ret = -EIO;
  196. put_page(page);
  197. bio_put(bio);
  198. bio = next_bio;
  199. }
  200. *bio_chain = NULL;
  201. return ret;
  202. }
  203. static int swap_write_page(struct swap_map_handle *handle, void *buf,
  204. struct bio **bio_chain)
  205. {
  206. int error = 0;
  207. unsigned long offset;
  208. if (!handle->cur)
  209. return -EINVAL;
  210. offset = alloc_swap_page(root_swap, handle->bitmap);
  211. error = write_page(buf, offset, bio_chain);
  212. if (error)
  213. return error;
  214. handle->cur->entries[handle->k++] = offset;
  215. if (handle->k >= MAP_PAGE_ENTRIES) {
  216. error = wait_on_bio_chain(bio_chain);
  217. if (error)
  218. goto out;
  219. offset = alloc_swap_page(root_swap, handle->bitmap);
  220. if (!offset)
  221. return -ENOSPC;
  222. handle->cur->next_swap = offset;
  223. error = write_page(handle->cur, handle->cur_swap, NULL);
  224. if (error)
  225. goto out;
  226. memset(handle->cur, 0, PAGE_SIZE);
  227. handle->cur_swap = offset;
  228. handle->k = 0;
  229. }
  230. out:
  231. return error;
  232. }
  233. static int flush_swap_writer(struct swap_map_handle *handle)
  234. {
  235. if (handle->cur && handle->cur_swap)
  236. return write_page(handle->cur, handle->cur_swap, NULL);
  237. else
  238. return -EINVAL;
  239. }
  240. /**
  241. * save_image - save the suspend image data
  242. */
  243. static int save_image(struct swap_map_handle *handle,
  244. struct snapshot_handle *snapshot,
  245. unsigned int nr_to_write)
  246. {
  247. unsigned int m;
  248. int ret;
  249. int error = 0;
  250. int nr_pages;
  251. int err2;
  252. struct bio *bio;
  253. struct timeval start;
  254. struct timeval stop;
  255. printk("Saving image data pages (%u pages) ... ", nr_to_write);
  256. m = nr_to_write / 100;
  257. if (!m)
  258. m = 1;
  259. nr_pages = 0;
  260. bio = NULL;
  261. do_gettimeofday(&start);
  262. do {
  263. ret = snapshot_read_next(snapshot, PAGE_SIZE);
  264. if (ret > 0) {
  265. error = swap_write_page(handle, data_of(*snapshot),
  266. &bio);
  267. if (error)
  268. break;
  269. if (!(nr_pages % m))
  270. printk("\b\b\b\b%3d%%", nr_pages / m);
  271. nr_pages++;
  272. }
  273. } while (ret > 0);
  274. err2 = wait_on_bio_chain(&bio);
  275. do_gettimeofday(&stop);
  276. if (!error)
  277. error = err2;
  278. if (!error)
  279. printk("\b\b\b\bdone\n");
  280. show_speed(&start, &stop, nr_to_write, "Wrote");
  281. return error;
  282. }
  283. /**
  284. * enough_swap - Make sure we have enough swap to save the image.
  285. *
  286. * Returns TRUE or FALSE after checking the total amount of swap
  287. * space avaiable from the resume partition.
  288. */
  289. static int enough_swap(unsigned int nr_pages)
  290. {
  291. unsigned int free_swap = count_swap_pages(root_swap, 1);
  292. pr_debug("swsusp: free swap pages: %u\n", free_swap);
  293. return free_swap > (nr_pages + PAGES_FOR_IO +
  294. (nr_pages + PBES_PER_PAGE - 1) / PBES_PER_PAGE);
  295. }
  296. /**
  297. * swsusp_write - Write entire image and metadata.
  298. *
  299. * It is important _NOT_ to umount filesystems at this point. We want
  300. * them synced (in case something goes wrong) but we DO not want to mark
  301. * filesystem clean: it is not. (And it does not matter, if we resume
  302. * correctly, we'll mark system clean, anyway.)
  303. */
  304. int swsusp_write(void)
  305. {
  306. struct swap_map_handle handle;
  307. struct snapshot_handle snapshot;
  308. struct swsusp_info *header;
  309. int error;
  310. if ((error = swsusp_swap_check())) {
  311. printk(KERN_ERR "swsusp: Cannot find swap device, try swapon -a.\n");
  312. return error;
  313. }
  314. memset(&snapshot, 0, sizeof(struct snapshot_handle));
  315. error = snapshot_read_next(&snapshot, PAGE_SIZE);
  316. if (error < PAGE_SIZE)
  317. return error < 0 ? error : -EFAULT;
  318. header = (struct swsusp_info *)data_of(snapshot);
  319. if (!enough_swap(header->pages)) {
  320. printk(KERN_ERR "swsusp: Not enough free swap\n");
  321. return -ENOSPC;
  322. }
  323. error = get_swap_writer(&handle);
  324. if (!error) {
  325. unsigned long start = handle.cur_swap;
  326. error = swap_write_page(&handle, header, NULL);
  327. if (!error)
  328. error = save_image(&handle, &snapshot,
  329. header->pages - 1);
  330. if (!error) {
  331. flush_swap_writer(&handle);
  332. printk("S");
  333. error = mark_swapfiles(swp_entry(root_swap, start));
  334. printk("|\n");
  335. }
  336. }
  337. if (error)
  338. free_all_swap_pages(root_swap, handle.bitmap);
  339. release_swap_writer(&handle);
  340. return error;
  341. }
  342. /*
  343. * Using bio to read from swap.
  344. * This code requires a bit more work than just using buffer heads
  345. * but, it is the recommended way for 2.5/2.6.
  346. * The following are to signal the beginning and end of I/O. Bios
  347. * finish asynchronously, while we want them to happen synchronously.
  348. * A simple atomic_t, and a wait loop take care of this problem.
  349. */
  350. static atomic_t io_done = ATOMIC_INIT(0);
  351. static int end_io(struct bio *bio, unsigned int num, int err)
  352. {
  353. if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) {
  354. printk(KERN_ERR "I/O error reading swsusp image.\n");
  355. return -EIO;
  356. }
  357. atomic_set(&io_done, 0);
  358. return 0;
  359. }
  360. static struct block_device *resume_bdev;
  361. /**
  362. * submit - submit BIO request.
  363. * @rw: READ or WRITE.
  364. * @off physical offset of page.
  365. * @page: page we're reading or writing.
  366. *
  367. * Straight from the textbook - allocate and initialize the bio.
  368. * If we're writing, make sure the page is marked as dirty.
  369. * Then submit it and wait.
  370. */
  371. static int submit(int rw, pgoff_t page_off, void *page)
  372. {
  373. int error = 0;
  374. struct bio *bio;
  375. bio = bio_alloc(GFP_ATOMIC, 1);
  376. if (!bio)
  377. return -ENOMEM;
  378. bio->bi_sector = page_off * (PAGE_SIZE >> 9);
  379. bio->bi_bdev = resume_bdev;
  380. bio->bi_end_io = end_io;
  381. if (bio_add_page(bio, virt_to_page(page), PAGE_SIZE, 0) < PAGE_SIZE) {
  382. printk("swsusp: ERROR: adding page to bio at %ld\n",page_off);
  383. error = -EFAULT;
  384. goto Done;
  385. }
  386. atomic_set(&io_done, 1);
  387. submit_bio(rw | (1 << BIO_RW_SYNC), bio);
  388. while (atomic_read(&io_done))
  389. yield();
  390. if (rw == READ)
  391. bio_set_pages_dirty(bio);
  392. Done:
  393. bio_put(bio);
  394. return error;
  395. }
  396. static int bio_read_page(pgoff_t page_off, void *page)
  397. {
  398. return submit(READ, page_off, page);
  399. }
  400. static int bio_write_page(pgoff_t page_off, void *page)
  401. {
  402. return submit(WRITE, page_off, page);
  403. }
  404. /**
  405. * The following functions allow us to read data using a swap map
  406. * in a file-alike way
  407. */
  408. static void release_swap_reader(struct swap_map_handle *handle)
  409. {
  410. if (handle->cur)
  411. free_page((unsigned long)handle->cur);
  412. handle->cur = NULL;
  413. }
  414. static int get_swap_reader(struct swap_map_handle *handle,
  415. swp_entry_t start)
  416. {
  417. int error;
  418. if (!swp_offset(start))
  419. return -EINVAL;
  420. handle->cur = (struct swap_map_page *)get_zeroed_page(GFP_ATOMIC);
  421. if (!handle->cur)
  422. return -ENOMEM;
  423. error = bio_read_page(swp_offset(start), handle->cur);
  424. if (error) {
  425. release_swap_reader(handle);
  426. return error;
  427. }
  428. handle->k = 0;
  429. return 0;
  430. }
  431. static int swap_read_page(struct swap_map_handle *handle, void *buf)
  432. {
  433. unsigned long offset;
  434. int error;
  435. if (!handle->cur)
  436. return -EINVAL;
  437. offset = handle->cur->entries[handle->k];
  438. if (!offset)
  439. return -EFAULT;
  440. error = bio_read_page(offset, buf);
  441. if (error)
  442. return error;
  443. if (++handle->k >= MAP_PAGE_ENTRIES) {
  444. handle->k = 0;
  445. offset = handle->cur->next_swap;
  446. if (!offset)
  447. release_swap_reader(handle);
  448. else
  449. error = bio_read_page(offset, handle->cur);
  450. }
  451. return error;
  452. }
  453. /**
  454. * load_image - load the image using the swap map handle
  455. * @handle and the snapshot handle @snapshot
  456. * (assume there are @nr_pages pages to load)
  457. */
  458. static int load_image(struct swap_map_handle *handle,
  459. struct snapshot_handle *snapshot,
  460. unsigned int nr_pages)
  461. {
  462. unsigned int m;
  463. int ret;
  464. int error = 0;
  465. struct timeval start;
  466. struct timeval stop;
  467. printk("Loading image data pages (%u pages) ... ", nr_pages);
  468. m = nr_pages / 100;
  469. if (!m)
  470. m = 1;
  471. nr_pages = 0;
  472. do_gettimeofday(&start);
  473. do {
  474. ret = snapshot_write_next(snapshot, PAGE_SIZE);
  475. if (ret > 0) {
  476. error = swap_read_page(handle, data_of(*snapshot));
  477. if (error)
  478. break;
  479. if (!(nr_pages % m))
  480. printk("\b\b\b\b%3d%%", nr_pages / m);
  481. nr_pages++;
  482. }
  483. } while (ret > 0);
  484. do_gettimeofday(&stop);
  485. if (!error) {
  486. printk("\b\b\b\bdone\n");
  487. if (!snapshot_image_loaded(snapshot))
  488. error = -ENODATA;
  489. }
  490. show_speed(&start, &stop, nr_pages, "Read");
  491. return error;
  492. }
  493. int swsusp_read(void)
  494. {
  495. int error;
  496. struct swap_map_handle handle;
  497. struct snapshot_handle snapshot;
  498. struct swsusp_info *header;
  499. if (IS_ERR(resume_bdev)) {
  500. pr_debug("swsusp: block device not initialised\n");
  501. return PTR_ERR(resume_bdev);
  502. }
  503. memset(&snapshot, 0, sizeof(struct snapshot_handle));
  504. error = snapshot_write_next(&snapshot, PAGE_SIZE);
  505. if (error < PAGE_SIZE)
  506. return error < 0 ? error : -EFAULT;
  507. header = (struct swsusp_info *)data_of(snapshot);
  508. error = get_swap_reader(&handle, swsusp_header.image);
  509. if (!error)
  510. error = swap_read_page(&handle, header);
  511. if (!error)
  512. error = load_image(&handle, &snapshot, header->pages - 1);
  513. release_swap_reader(&handle);
  514. blkdev_put(resume_bdev);
  515. if (!error)
  516. pr_debug("swsusp: Reading resume file was successful\n");
  517. else
  518. pr_debug("swsusp: Error %d resuming\n", error);
  519. return error;
  520. }
  521. /**
  522. * swsusp_check - Check for swsusp signature in the resume device
  523. */
  524. int swsusp_check(void)
  525. {
  526. int error;
  527. resume_bdev = open_by_devnum(swsusp_resume_device, FMODE_READ);
  528. if (!IS_ERR(resume_bdev)) {
  529. set_blocksize(resume_bdev, PAGE_SIZE);
  530. memset(&swsusp_header, 0, sizeof(swsusp_header));
  531. if ((error = bio_read_page(0, &swsusp_header)))
  532. return error;
  533. if (!memcmp(SWSUSP_SIG, swsusp_header.sig, 10)) {
  534. memcpy(swsusp_header.sig, swsusp_header.orig_sig, 10);
  535. /* Reset swap signature now */
  536. error = bio_write_page(0, &swsusp_header);
  537. } else {
  538. return -EINVAL;
  539. }
  540. if (error)
  541. blkdev_put(resume_bdev);
  542. else
  543. pr_debug("swsusp: Signature found, resuming\n");
  544. } else {
  545. error = PTR_ERR(resume_bdev);
  546. }
  547. if (error)
  548. pr_debug("swsusp: Error %d check for resume file\n", error);
  549. return error;
  550. }
  551. /**
  552. * swsusp_close - close swap device.
  553. */
  554. void swsusp_close(void)
  555. {
  556. if (IS_ERR(resume_bdev)) {
  557. pr_debug("swsusp: block device not initialised\n");
  558. return;
  559. }
  560. blkdev_put(resume_bdev);
  561. }