2005-04-16 22:20:36 +00:00
|
|
|
/*
|
|
|
|
* linux/kernel/power/swsusp.c
|
|
|
|
*
|
2005-10-30 22:59:58 +00:00
|
|
|
* This file provides code to write suspend image to swap and read it back.
|
2005-04-16 22:20:36 +00:00
|
|
|
*
|
|
|
|
* Copyright (C) 1998-2001 Gabor Kuti <seasons@fornax.hu>
|
2005-10-30 22:59:56 +00:00
|
|
|
* Copyright (C) 1998,2001-2005 Pavel Machek <pavel@suse.cz>
|
2005-04-16 22:20:36 +00:00
|
|
|
*
|
|
|
|
* This file is released under the GPLv2.
|
|
|
|
*
|
|
|
|
* I'd like to thank the following people for their work:
|
2005-06-25 21:55:12 +00:00
|
|
|
*
|
2005-04-16 22:20:36 +00:00
|
|
|
* Pavel Machek <pavel@ucw.cz>:
|
|
|
|
* Modifications, defectiveness pointing, being with me at the very beginning,
|
|
|
|
* suspend to swap space, stop all tasks. Port to 2.4.18-ac and 2.5.17.
|
|
|
|
*
|
2005-06-25 21:55:12 +00:00
|
|
|
* Steve Doddi <dirk@loth.demon.co.uk>:
|
2005-04-16 22:20:36 +00:00
|
|
|
* Support the possibility of hardware state restoring.
|
|
|
|
*
|
|
|
|
* Raph <grey.havens@earthling.net>:
|
|
|
|
* Support for preserving states of network devices and virtual console
|
|
|
|
* (including X and svgatextmode)
|
|
|
|
*
|
|
|
|
* Kurt Garloff <garloff@suse.de>:
|
|
|
|
* Straightened the critical function in order to prevent compilers from
|
|
|
|
* playing tricks with local variables.
|
|
|
|
*
|
|
|
|
* Andreas Mohr <a.mohr@mailto.de>
|
|
|
|
*
|
|
|
|
* Alex Badea <vampire@go.ro>:
|
|
|
|
* Fixed runaway init
|
|
|
|
*
|
2006-01-06 08:13:05 +00:00
|
|
|
* Rafael J. Wysocki <rjw@sisk.pl>
|
2006-03-23 11:00:00 +00:00
|
|
|
* Reworked the freeing of memory and the handling of swap
|
2006-01-06 08:13:05 +00:00
|
|
|
*
|
2005-04-16 22:20:36 +00:00
|
|
|
* More state savers are welcome. Especially for the scsi layer...
|
|
|
|
*
|
|
|
|
* For TODOs,FIXMEs also look in Documentation/power/swsusp.txt
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/mm.h>
|
|
|
|
#include <linux/suspend.h>
|
|
|
|
#include <linux/spinlock.h>
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/major.h>
|
|
|
|
#include <linux/swap.h>
|
|
|
|
#include <linux/pm.h>
|
|
|
|
#include <linux/swapops.h>
|
|
|
|
#include <linux/bootmem.h>
|
|
|
|
#include <linux/syscalls.h>
|
|
|
|
#include <linux/highmem.h>
|
|
|
|
|
|
|
|
#include "power.h"
|
|
|
|
|
2006-01-06 08:15:56 +00:00
|
|
|
/*
|
2006-02-01 11:05:07 +00:00
|
|
|
* Preferred image size in bytes (tunable via /sys/power/image_size).
|
2006-01-06 08:15:56 +00:00
|
|
|
* When it is set to N, swsusp will do its best to ensure the image
|
2006-02-01 11:05:07 +00:00
|
|
|
* size will not exceed N bytes, but if that is impossible, it will
|
2006-01-06 08:15:56 +00:00
|
|
|
* try to create the smallest image possible.
|
|
|
|
*/
|
2006-02-01 11:05:07 +00:00
|
|
|
unsigned long image_size = 500 * 1024 * 1024;
|
2006-01-06 08:15:56 +00:00
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
int in_suspend __nosavedata = 0;
|
|
|
|
|
2006-06-26 01:41:00 +00:00
|
|
|
#ifdef CONFIG_HIGHMEM
|
|
|
|
unsigned int count_highmem_pages(void);
|
|
|
|
int save_highmem(void);
|
|
|
|
int restore_highmem(void);
|
|
|
|
#else
|
|
|
|
static inline int save_highmem(void) { return 0; }
|
|
|
|
static inline int restore_highmem(void) { return 0; }
|
|
|
|
static inline unsigned int count_highmem_pages(void) { return 0; }
|
|
|
|
#endif
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
/**
|
2006-03-23 10:59:59 +00:00
|
|
|
* The following functions are used for tracing the allocated
|
|
|
|
* swap pages, so that they can be freed in case of an error.
|
2006-01-06 08:13:05 +00:00
|
|
|
*
|
2006-03-23 10:59:59 +00:00
|
|
|
* The functions operate on a linked bitmap structure defined
|
2006-03-23 11:00:00 +00:00
|
|
|
* in power.h
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
2006-01-06 08:13:05 +00:00
|
|
|
|
2006-03-23 11:00:00 +00:00
|
|
|
void free_bitmap(struct bitmap_page *bitmap)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2006-03-23 10:59:59 +00:00
|
|
|
struct bitmap_page *bp;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
while (bitmap) {
|
|
|
|
bp = bitmap->next;
|
|
|
|
free_page((unsigned long)bitmap);
|
|
|
|
bitmap = bp;
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-03-23 11:00:00 +00:00
|
|
|
struct bitmap_page *alloc_bitmap(unsigned int nr_bits)
|
2006-01-06 08:13:05 +00:00
|
|
|
{
|
2006-03-23 10:59:59 +00:00
|
|
|
struct bitmap_page *bitmap, *bp;
|
|
|
|
unsigned int n;
|
2006-01-06 08:13:05 +00:00
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
if (!nr_bits)
|
2006-01-06 08:13:05 +00:00
|
|
|
return NULL;
|
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
bitmap = (struct bitmap_page *)get_zeroed_page(GFP_KERNEL);
|
|
|
|
bp = bitmap;
|
|
|
|
for (n = BITMAP_PAGE_BITS; n < nr_bits; n += BITMAP_PAGE_BITS) {
|
|
|
|
bp->next = (struct bitmap_page *)get_zeroed_page(GFP_KERNEL);
|
|
|
|
bp = bp->next;
|
|
|
|
if (!bp) {
|
|
|
|
free_bitmap(bitmap);
|
2006-01-06 08:13:05 +00:00
|
|
|
return NULL;
|
|
|
|
}
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
2006-03-23 10:59:59 +00:00
|
|
|
return bitmap;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
static int bitmap_set(struct bitmap_page *bitmap, unsigned long bit)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2006-03-23 10:59:59 +00:00
|
|
|
unsigned int n;
|
|
|
|
|
|
|
|
n = BITMAP_PAGE_BITS;
|
|
|
|
while (bitmap && n <= bit) {
|
|
|
|
n += BITMAP_PAGE_BITS;
|
|
|
|
bitmap = bitmap->next;
|
|
|
|
}
|
|
|
|
if (!bitmap)
|
|
|
|
return -EINVAL;
|
|
|
|
n -= BITMAP_PAGE_BITS;
|
|
|
|
bit -= n;
|
|
|
|
n = 0;
|
|
|
|
while (bit >= BITS_PER_CHUNK) {
|
|
|
|
bit -= BITS_PER_CHUNK;
|
|
|
|
n++;
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
2006-03-23 10:59:59 +00:00
|
|
|
bitmap->chunks[n] |= (1UL << bit);
|
|
|
|
return 0;
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2006-03-23 11:00:00 +00:00
|
|
|
unsigned long alloc_swap_page(int swap, struct bitmap_page *bitmap)
|
2006-01-06 08:13:05 +00:00
|
|
|
{
|
2006-03-23 10:59:59 +00:00
|
|
|
unsigned long offset;
|
|
|
|
|
|
|
|
offset = swp_offset(get_swap_page_of_type(swap));
|
|
|
|
if (offset) {
|
|
|
|
if (bitmap_set(bitmap, offset)) {
|
|
|
|
swap_free(swp_entry(swap, offset));
|
|
|
|
offset = 0;
|
|
|
|
}
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
2006-03-23 10:59:59 +00:00
|
|
|
return offset;
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2006-03-23 11:00:00 +00:00
|
|
|
void free_all_swap_pages(int swap, struct bitmap_page *bitmap)
|
2006-01-06 08:13:05 +00:00
|
|
|
{
|
2006-03-23 10:59:59 +00:00
|
|
|
unsigned int bit, n;
|
|
|
|
unsigned long test;
|
2006-01-06 08:13:05 +00:00
|
|
|
|
2006-03-23 10:59:59 +00:00
|
|
|
bit = 0;
|
|
|
|
while (bitmap) {
|
|
|
|
for (n = 0; n < BITMAP_PAGE_CHUNKS; n++)
|
|
|
|
for (test = 1UL; test; test <<= 1) {
|
|
|
|
if (bitmap->chunks[n] & test)
|
|
|
|
swap_free(swp_entry(swap, bit));
|
|
|
|
bit++;
|
|
|
|
}
|
|
|
|
bitmap = bitmap->next;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
2006-01-06 08:13:05 +00:00
|
|
|
}
|
|
|
|
|
2006-01-06 08:13:46 +00:00
|
|
|
/**
|
|
|
|
* swsusp_shrink_memory - Try to free as much memory as needed
|
|
|
|
*
|
|
|
|
* ... but do not OOM-kill anyone
|
|
|
|
*
|
|
|
|
* Notice: all userland should be stopped before it is called, or
|
|
|
|
* livelock is possible.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#define SHRINK_BITE 10000
|
2006-06-23 09:03:18 +00:00
|
|
|
static inline unsigned long __shrink_memory(long tmp)
|
|
|
|
{
|
|
|
|
if (tmp > SHRINK_BITE)
|
|
|
|
tmp = SHRINK_BITE;
|
|
|
|
return shrink_all_memory(tmp);
|
|
|
|
}
|
2006-01-06 08:13:46 +00:00
|
|
|
|
|
|
|
int swsusp_shrink_memory(void)
|
|
|
|
{
|
2006-01-06 08:15:22 +00:00
|
|
|
long size, tmp;
|
2006-01-06 08:13:46 +00:00
|
|
|
struct zone *zone;
|
|
|
|
unsigned long pages = 0;
|
|
|
|
unsigned int i = 0;
|
|
|
|
char *p = "-\\|/";
|
|
|
|
|
|
|
|
printk("Shrinking memory... ");
|
|
|
|
do {
|
2006-06-26 01:41:00 +00:00
|
|
|
size = 2 * count_highmem_pages();
|
2006-09-26 06:32:54 +00:00
|
|
|
size += size / 50 + count_data_pages() + PAGES_FOR_IO;
|
2006-01-06 08:15:22 +00:00
|
|
|
tmp = size;
|
2006-01-06 08:13:46 +00:00
|
|
|
for_each_zone (zone)
|
2006-06-23 09:04:46 +00:00
|
|
|
if (!is_highmem(zone) && populated_zone(zone)) {
|
2006-01-06 08:13:46 +00:00
|
|
|
tmp -= zone->free_pages;
|
2006-06-23 09:04:46 +00:00
|
|
|
tmp += zone->lowmem_reserve[ZONE_NORMAL];
|
2006-09-26 06:32:54 +00:00
|
|
|
tmp += snapshot_additional_pages(zone);
|
2006-06-23 09:04:46 +00:00
|
|
|
}
|
2006-01-06 08:13:46 +00:00
|
|
|
if (tmp > 0) {
|
2006-06-23 09:03:18 +00:00
|
|
|
tmp = __shrink_memory(tmp);
|
2006-01-06 08:13:46 +00:00
|
|
|
if (!tmp)
|
|
|
|
return -ENOMEM;
|
|
|
|
pages += tmp;
|
2006-02-01 11:05:07 +00:00
|
|
|
} else if (size > image_size / PAGE_SIZE) {
|
2006-06-23 09:03:18 +00:00
|
|
|
tmp = __shrink_memory(size - (image_size / PAGE_SIZE));
|
2006-01-06 08:15:22 +00:00
|
|
|
pages += tmp;
|
2006-01-06 08:13:46 +00:00
|
|
|
}
|
|
|
|
printk("\b%c", p[i++%4]);
|
|
|
|
} while (tmp > 0);
|
|
|
|
printk("\bdone (%lu pages freed)\n", pages);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
int swsusp_suspend(void)
|
|
|
|
{
|
|
|
|
int error;
|
2005-11-09 05:34:41 +00:00
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
if ((error = arch_prepare_suspend()))
|
|
|
|
return error;
|
|
|
|
local_irq_disable();
|
|
|
|
/* At this point, device_suspend() has been called, but *not*
|
|
|
|
* device_power_down(). We *must* device_power_down() now.
|
|
|
|
* Otherwise, drivers for some devices (e.g. interrupt controllers)
|
|
|
|
* become desynchronized with the actual state of the hardware
|
|
|
|
* at resume time, and evil weirdness ensues.
|
|
|
|
*/
|
|
|
|
if ((error = device_power_down(PMSG_FREEZE))) {
|
2005-09-03 22:57:05 +00:00
|
|
|
printk(KERN_ERR "Some devices failed to power down, aborting suspend\n");
|
2005-11-09 05:34:41 +00:00
|
|
|
goto Enable_irqs;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
2005-07-08 00:56:44 +00:00
|
|
|
|
2006-06-26 01:41:00 +00:00
|
|
|
if ((error = save_highmem())) {
|
2005-11-09 05:34:41 +00:00
|
|
|
printk(KERN_ERR "swsusp: Not enough free pages for highmem\n");
|
|
|
|
goto Restore_highmem;
|
2005-07-08 00:56:44 +00:00
|
|
|
}
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
save_processor_state();
|
|
|
|
if ((error = swsusp_arch_suspend()))
|
2005-09-03 22:57:05 +00:00
|
|
|
printk(KERN_ERR "Error %d suspending\n", error);
|
2005-04-16 22:20:36 +00:00
|
|
|
/* Restore control flow magically appears here */
|
|
|
|
restore_processor_state();
|
2005-11-09 05:34:41 +00:00
|
|
|
Restore_highmem:
|
2006-06-26 01:41:00 +00:00
|
|
|
restore_highmem();
|
2006-08-15 06:11:08 +00:00
|
|
|
/* NOTE: device_power_up() is just a resume() for devices
|
|
|
|
* that suspended with irqs off ... no overall powerup.
|
|
|
|
*/
|
2005-04-16 22:20:36 +00:00
|
|
|
device_power_up();
|
2005-11-09 05:34:41 +00:00
|
|
|
Enable_irqs:
|
2005-04-16 22:20:36 +00:00
|
|
|
local_irq_enable();
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
|
|
|
int swsusp_resume(void)
|
|
|
|
{
|
|
|
|
int error;
|
2006-08-15 06:11:08 +00:00
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
local_irq_disable();
|
2006-08-15 06:11:08 +00:00
|
|
|
/* NOTE: device_power_down() is just a suspend() with irqs off;
|
|
|
|
* it has no special "power things down" semantics
|
|
|
|
*/
|
|
|
|
if (device_power_down(PMSG_PRETHAW))
|
2005-04-16 22:20:36 +00:00
|
|
|
printk(KERN_ERR "Some devices failed to power down, very bad\n");
|
|
|
|
/* We'll ignore saved state, but this gets preempt count (etc) right */
|
|
|
|
save_processor_state();
|
|
|
|
error = swsusp_arch_resume();
|
|
|
|
/* Code below is only ever reached in case of failure. Otherwise
|
|
|
|
* execution continues at place where swsusp_arch_suspend was called
|
|
|
|
*/
|
|
|
|
BUG_ON(!error);
|
2005-10-30 22:59:58 +00:00
|
|
|
/* The only reason why swsusp_arch_resume() can fail is memory being
|
|
|
|
* very tight, so we have to free it as soon as we can to avoid
|
|
|
|
* subsequent failures
|
|
|
|
*/
|
|
|
|
swsusp_free();
|
2005-04-16 22:20:36 +00:00
|
|
|
restore_processor_state();
|
2006-06-26 01:41:00 +00:00
|
|
|
restore_highmem();
|
2005-09-06 22:16:27 +00:00
|
|
|
touch_softlockup_watchdog();
|
2005-04-16 22:20:36 +00:00
|
|
|
device_power_up();
|
|
|
|
local_irq_enable();
|
|
|
|
return error;
|
|
|
|
}
|