/*
 *  linux/mm/swapfile.c
 *
 *  Copyright (C) 1991, 1992, 1993, 1994  Linus Torvalds
 *  Swap reorganised 29.12.95, Stephen Tweedie
 */
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/mman.h>
#include <linux/slab.h>
#include <linux/kernel_stat.h>
#include <linux/swap.h>
#include <linux/vmalloc.h>
#include <linux/pagemap.h>
#include <linux/namei.h>
#include <linux/shmem_fs.h>
#include <linux/blkdev.h>
#include <linux/random.h>
#include <linux/writeback.h>
#include <linux/proc_fs.h>
#include <linux/seq_file.h>
#include <linux/init.h>
#include <linux/ksm.h>
#include <linux/rmap.h>
#include <linux/security.h>
#include <linux/backing-dev.h>
#include <linux/mutex.h>
#include <linux/capability.h>
#include <linux/syscalls.h>
#include <linux/memcontrol.h>
#include <linux/poll.h>
#include <linux/oom.h>
#include <linux/frontswap.h>
#include <linux/swapfile.h>
#include <linux/export.h>

#include <asm/pgtable.h>
#include <asm/tlbflush.h>
#include <linux/swapops.h>
#include <linux/page_cgroup.h>

static bool swap_count_continued(struct swap_info_struct *, pgoff_t,
				 unsigned char);
static void free_swap_count_continuations(struct swap_info_struct *);
static sector_t map_swap_entry(swp_entry_t, struct block_device**);

DEFINE_SPINLOCK(swap_lock);
static unsigned int nr_swapfiles;
atomic_long_t nr_swap_pages;
/* protected with swap_lock. reading in vm_swap_full() doesn't need lock */
long total_swap_pages;
static int least_priority;
static atomic_t highest_priority_index = ATOMIC_INIT(-1);

static const char Bad_file[] = "Bad swap file entry ";
static const char Unused_file[] = "Unused swap file entry ";
static const char Bad_offset[] = "Bad swap offset entry ";
static const char Unused_offset[] = "Unused swap offset entry ";
struct swap_list_t swap_list = {-1, -1};

struct swap_info_struct *swap_info[MAX_SWAPFILES];

static DEFINE_MUTEX(swapon_mutex);

static DECLARE_WAIT_QUEUE_HEAD(proc_poll_wait);
/* Activity counter to indicate that a swapon or swapoff has occurred */
static atomic_t proc_poll_event = ATOMIC_INIT(0);
static inline unsigned char swap_count(unsigned char ent)
{
	return ent & ~SWAP_HAS_CACHE;	/* may include SWAP_HAS_CONT flag */
}
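/*
 * Quick reference for the swap_map byte used throughout this file (the
 * authoritative definitions live in <linux/swap.h>): the low bits hold
 * the map count, SWAP_HAS_CACHE marks the extra swapcache reference,
 * and COUNT_CONTINUED says the count overflows into continuation pages
 * (see swap_count_continued()).
 */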
/* returns 1 if swap entry is freed */
static int
__try_to_reclaim_swap(struct swap_info_struct *si, unsigned long offset)
{
	swp_entry_t entry = swp_entry(si->type, offset);
	struct page *page;
	int ret = 0;
	page = find_get_page(swap_address_space(entry), entry.val);
	if (!page)
		return 0;
	/*
	 * This function is called from scan_swap_map() and it's called
	 * by vmscan.c when reclaiming pages. So, we hold a lock on a page here.
	 * We have to use trylock to avoid deadlock. This is a special
	 * case and you should use try_to_free_swap() with explicit lock_page()
	 * in usual operations.
	 */
	if (trylock_page(page)) {
		ret = try_to_free_swap(page);
		unlock_page(page);
	}
	page_cache_release(page);
	return ret;
}

/*
 * swapon tells the device that all the old swap contents can be discarded,
 * to allow the swap device to optimize its wear-levelling.
 */
static int discard_swap(struct swap_info_struct *si)
{
	struct swap_extent *se;
	sector_t start_block;
	sector_t nr_blocks;
	int err = 0;
	/* Do not discard the swap header page! */
	se = &si->first_swap_extent;
	start_block = (se->start_block + 1) << (PAGE_SHIFT - 9);
	nr_blocks = ((sector_t)se->nr_pages - 1) << (PAGE_SHIFT - 9);
	if (nr_blocks) {
		err = blkdev_issue_discard(si->bdev, start_block,
				nr_blocks, GFP_KERNEL, 0);
		if (err)
			return err;
		cond_resched();
	}

	list_for_each_entry(se, &si->first_swap_extent.list, list) {
		start_block = se->start_block << (PAGE_SHIFT - 9);
		nr_blocks = (sector_t)se->nr_pages << (PAGE_SHIFT - 9);

		err = blkdev_issue_discard(si->bdev, start_block,
				nr_blocks, GFP_KERNEL, 0);
		if (err)
			break;

		cond_resched();
	}
	return err;		/* That will often be -EOPNOTSUPP */
}
/*
 * swap allocation tells the device that a cluster of swap can now be
 * discarded, to allow the swap device to optimize its wear-levelling.
 */
static void discard_swap_cluster(struct swap_info_struct *si,
				 pgoff_t start_page, pgoff_t nr_pages)
{
	struct swap_extent *se = si->curr_swap_extent;
	int found_extent = 0;

	while (nr_pages) {
		struct list_head *lh;

		if (se->start_page <= start_page &&
		    start_page < se->start_page + se->nr_pages) {
			pgoff_t offset = start_page - se->start_page;
			sector_t start_block = se->start_block + offset;
			sector_t nr_blocks = se->nr_pages - offset;

			if (nr_blocks > nr_pages)
				nr_blocks = nr_pages;
			start_page += nr_blocks;
			nr_pages -= nr_blocks;

			if (!found_extent++)
				si->curr_swap_extent = se;

			start_block <<= PAGE_SHIFT - 9;
			nr_blocks <<= PAGE_SHIFT - 9;
			if (blkdev_issue_discard(si->bdev, start_block,
				    nr_blocks, GFP_NOIO, 0))
				break;
		}

		lh = se->list.next;
		se = list_entry(lh, struct swap_extent, list);
	}
}
#define SWAPFILE_CLUSTER	256
#define LATENCY_LIMIT		256
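/*
 * Orientation note for the accessors below: swap_cluster_info->data is
 * deliberately overloaded.  For a cluster on the free (or discard) list
 * it holds the index of the next cluster, threading a singly linked
 * list through cluster_info[]; for an in-use cluster it holds the count
 * of allocated entries.  The flags field records which meaning applies.
 */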
static inline void cluster_set_flag(struct swap_cluster_info *info,
	unsigned int flag)
{
	info->flags = flag;
}

static inline unsigned int cluster_count(struct swap_cluster_info *info)
{
	return info->data;
}

static inline void cluster_set_count(struct swap_cluster_info *info,
				     unsigned int c)
{
	info->data = c;
}

static inline void cluster_set_count_flag(struct swap_cluster_info *info,
					  unsigned int c, unsigned int f)
{
	info->flags = f;
	info->data = c;
}

static inline unsigned int cluster_next(struct swap_cluster_info *info)
{
	return info->data;
}

static inline void cluster_set_next(struct swap_cluster_info *info,
				    unsigned int n)
{
	info->data = n;
}

static inline void cluster_set_next_flag(struct swap_cluster_info *info,
					 unsigned int n, unsigned int f)
{
	info->flags = f;
	info->data = n;
}

static inline bool cluster_is_free(struct swap_cluster_info *info)
{
	return info->flags & CLUSTER_FLAG_FREE;
}

static inline bool cluster_is_null(struct swap_cluster_info *info)
{
	return info->flags & CLUSTER_FLAG_NEXT_NULL;
}

static inline void cluster_set_null(struct swap_cluster_info *info)
{
	info->flags = CLUSTER_FLAG_NEXT_NULL;
	info->data = 0;
}
/* Add a cluster to the discard list and schedule the discard work */
static void swap_cluster_schedule_discard(struct swap_info_struct *si,
		unsigned int idx)
{
	/*
	 * If scan_swap_map() can't find a free cluster, it will check
	 * si->swap_map directly. To make sure the discarding cluster isn't
	 * taken by scan_swap_map(), mark the swap entries bad (occupied).
	 * They will be cleared after the discard.
	 */
	memset(si->swap_map + idx * SWAPFILE_CLUSTER,
			SWAP_MAP_BAD, SWAPFILE_CLUSTER);

	if (cluster_is_null(&si->discard_cluster_head)) {
		cluster_set_next_flag(&si->discard_cluster_head, idx, 0);
		cluster_set_next_flag(&si->discard_cluster_tail, idx, 0);
	} else {
		unsigned int tail = cluster_next(&si->discard_cluster_tail);
		cluster_set_next(&si->cluster_info[tail], idx);
		cluster_set_next_flag(&si->discard_cluster_tail, idx, 0);
	}

	schedule_work(&si->discard_work);
}

/*
 * Actually do the discard. After a cluster discard is finished, the cluster
 * will be added to the free cluster list. The caller should hold si->lock.
 */
static void swap_do_scheduled_discard(struct swap_info_struct *si)
{
	struct swap_cluster_info *info;
	unsigned int idx;

	info = si->cluster_info;

	while (!cluster_is_null(&si->discard_cluster_head)) {
		idx = cluster_next(&si->discard_cluster_head);

		cluster_set_next_flag(&si->discard_cluster_head,
						cluster_next(&info[idx]), 0);
		if (cluster_next(&si->discard_cluster_tail) == idx) {
			cluster_set_null(&si->discard_cluster_head);
			cluster_set_null(&si->discard_cluster_tail);
		}
		spin_unlock(&si->lock);

		discard_swap_cluster(si, idx * SWAPFILE_CLUSTER,
				SWAPFILE_CLUSTER);

		spin_lock(&si->lock);
		cluster_set_flag(&info[idx], CLUSTER_FLAG_FREE);
		if (cluster_is_null(&si->free_cluster_head)) {
			cluster_set_next_flag(&si->free_cluster_head,
						idx, 0);
			cluster_set_next_flag(&si->free_cluster_tail,
						idx, 0);
		} else {
			unsigned int tail;

			tail = cluster_next(&si->free_cluster_tail);
			cluster_set_next(&info[tail], idx);
			cluster_set_next_flag(&si->free_cluster_tail,
						idx, 0);
		}
		memset(si->swap_map + idx * SWAPFILE_CLUSTER,
				0, SWAPFILE_CLUSTER);
	}
}

static void swap_discard_work(struct work_struct *work)
{
	struct swap_info_struct *si;

	si = container_of(work, struct swap_info_struct, discard_work);

	spin_lock(&si->lock);
	swap_do_scheduled_discard(si);
	spin_unlock(&si->lock);
}
/*
 * The cluster corresponding to page_nr will be used. The cluster will be
 * removed from the free cluster list and its usage counter will be increased.
 */
static void inc_cluster_info_page(struct swap_info_struct *p,
	struct swap_cluster_info *cluster_info, unsigned long page_nr)
{
	unsigned long idx = page_nr / SWAPFILE_CLUSTER;

	if (!cluster_info)
		return;
	if (cluster_is_free(&cluster_info[idx])) {
		VM_BUG_ON(cluster_next(&p->free_cluster_head) != idx);
		cluster_set_next_flag(&p->free_cluster_head,
			cluster_next(&cluster_info[idx]), 0);
		if (cluster_next(&p->free_cluster_tail) == idx) {
			cluster_set_null(&p->free_cluster_tail);
			cluster_set_null(&p->free_cluster_head);
		}
		cluster_set_count_flag(&cluster_info[idx], 0, 0);
	}

	VM_BUG_ON(cluster_count(&cluster_info[idx]) >= SWAPFILE_CLUSTER);
	cluster_set_count(&cluster_info[idx],
		cluster_count(&cluster_info[idx]) + 1);
}

/*
 * The cluster corresponding to page_nr drops one usage. If the usage
 * counter becomes 0, which means no page in the cluster is in use, we can
 * optionally discard the cluster and add it to the free cluster list.
 */
static void dec_cluster_info_page(struct swap_info_struct *p,
	struct swap_cluster_info *cluster_info, unsigned long page_nr)
{
	unsigned long idx = page_nr / SWAPFILE_CLUSTER;

	if (!cluster_info)
		return;

	VM_BUG_ON(cluster_count(&cluster_info[idx]) == 0);
	cluster_set_count(&cluster_info[idx],
		cluster_count(&cluster_info[idx]) - 1);

	if (cluster_count(&cluster_info[idx]) == 0) {
		/*
		 * If the swap is discardable, prepare to discard the cluster
		 * instead of freeing it immediately. The cluster will be
		 * freed after the discard.
		 */
		if ((p->flags & (SWP_WRITEOK | SWP_PAGE_DISCARD)) ==
				 (SWP_WRITEOK | SWP_PAGE_DISCARD)) {
			swap_cluster_schedule_discard(p, idx);
			return;
		}

		cluster_set_flag(&cluster_info[idx], CLUSTER_FLAG_FREE);
		if (cluster_is_null(&p->free_cluster_head)) {
			cluster_set_next_flag(&p->free_cluster_head,
						idx, 0);
			cluster_set_next_flag(&p->free_cluster_tail,
						idx, 0);
		} else {
			unsigned int tail = cluster_next(&p->free_cluster_tail);
			cluster_set_next(&cluster_info[tail], idx);
			cluster_set_next_flag(&p->free_cluster_tail,
						idx, 0);
		}
	}
}

/*
 * It's possible that scan_swap_map() uses a free cluster in the middle of the
 * free cluster list. Avoid such abuse to prevent list corruption.
 */
static bool
scan_swap_map_ssd_cluster_conflict(struct swap_info_struct *si,
	unsigned long offset)
{
	struct percpu_cluster *percpu_cluster;
	bool conflict;
	offset /= SWAPFILE_CLUSTER;
	conflict = !cluster_is_null(&si->free_cluster_head) &&
		offset != cluster_next(&si->free_cluster_head) &&
		cluster_is_free(&si->cluster_info[offset]);

	if (!conflict)
		return false;

	percpu_cluster = this_cpu_ptr(si->percpu_cluster);
	cluster_set_null(&percpu_cluster->index);
	return true;
}

/*
 * Try to get a swap entry from current cpu's swap entry pool (a cluster). This
 * might involve allocating a new cluster for current CPU too.
 */
static void scan_swap_map_try_ssd_cluster(struct swap_info_struct *si,
	unsigned long *offset, unsigned long *scan_base)
{
	struct percpu_cluster *cluster;
	bool found_free;
	unsigned long tmp;

new_cluster:
	cluster = this_cpu_ptr(si->percpu_cluster);
	if (cluster_is_null(&cluster->index)) {
		if (!cluster_is_null(&si->free_cluster_head)) {
			cluster->index = si->free_cluster_head;
			cluster->next = cluster_next(&cluster->index) *
					SWAPFILE_CLUSTER;
		} else if (!cluster_is_null(&si->discard_cluster_head)) {
			/*
			 * we don't have a free cluster but have some clusters
			 * being discarded; do the discard now and reclaim them
			 */
			swap_do_scheduled_discard(si);
			*scan_base = *offset = si->cluster_next;
			goto new_cluster;
		} else
			return;
	}

	found_free = false;

	/*
	 * Other CPUs can use our cluster if they can't find a free cluster;
	 * check if there is still a free entry in the cluster
	 */
	tmp = cluster->next;
	while (tmp < si->max && tmp < (cluster_next(&cluster->index) + 1) *
	       SWAPFILE_CLUSTER) {
		if (!si->swap_map[tmp]) {
			found_free = true;
			break;
		}
		tmp++;
	}
	if (!found_free) {
		cluster_set_null(&cluster->index);
		goto new_cluster;
	}
	cluster->next = tmp + 1;
	*offset = tmp;
	*scan_base = tmp;
}
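/*
 * In short, the per-cpu protocol above: each CPU caches one cluster in
 * si->percpu_cluster and hands out offsets from cluster->next; when the
 * cached cluster is exhausted it is refilled from the free list, after
 * draining the discard list if that is all that remains.
 */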
static unsigned long scan_swap_map(struct swap_info_struct *si,
				   unsigned char usage)
{
	unsigned long offset;
	unsigned long scan_base;
	unsigned long last_in_cluster = 0;
	int latency_ration = LATENCY_LIMIT;

	/*
	 * We try to cluster swap pages by allocating them sequentially
	 * in swap.  Once we've allocated SWAPFILE_CLUSTER pages this
	 * way, however, we resort to first-free allocation, starting
	 * a new cluster.  This prevents us from scattering swap pages
	 * all over the entire swap partition, so that we reduce
	 * overall disk seek times between swap pages.  -- sct
	 * But we do now try to find an empty cluster.  -Andrea
	 * And we let swap pages go all over an SSD partition.  Hugh
	 */
	si->flags += SWP_SCANNING;
	scan_base = offset = si->cluster_next;

	/* SSD algorithm */
	if (si->cluster_info) {
		scan_swap_map_try_ssd_cluster(si, &offset, &scan_base);
		goto checks;
	}
	if (unlikely(!si->cluster_nr--)) {
		if (si->pages - si->inuse_pages < SWAPFILE_CLUSTER) {
			si->cluster_nr = SWAPFILE_CLUSTER - 1;
			goto checks;
		}

		spin_unlock(&si->lock);

		/*
		 * If seek is expensive, start searching for new cluster from
		 * start of partition, to minimize the span of allocated swap.
		 * But if seek is cheap, search from our current position, so
		 * that swap is allocated from all over the partition: if the
		 * Flash Translation Layer only remaps within limited zones,
		 * we don't want to wear out the first zone too quickly.
		 */
		if (!(si->flags & SWP_SOLIDSTATE))
			scan_base = offset = si->lowest_bit;
		last_in_cluster = offset + SWAPFILE_CLUSTER - 1;

		/* Locate the first empty (unaligned) cluster */
		for (; last_in_cluster <= si->highest_bit; offset++) {
			if (si->swap_map[offset])
				last_in_cluster = offset + SWAPFILE_CLUSTER;
			else if (offset == last_in_cluster) {
				spin_lock(&si->lock);
				offset -= SWAPFILE_CLUSTER - 1;
				si->cluster_next = offset;
				si->cluster_nr = SWAPFILE_CLUSTER - 1;
				goto checks;
			}
			if (unlikely(--latency_ration < 0)) {
				cond_resched();
				latency_ration = LATENCY_LIMIT;
			}
		}

		offset = si->lowest_bit;
		last_in_cluster = offset + SWAPFILE_CLUSTER - 1;

		/* Locate the first empty (unaligned) cluster */
		for (; last_in_cluster < scan_base; offset++) {
			if (si->swap_map[offset])
				last_in_cluster = offset + SWAPFILE_CLUSTER;
			else if (offset == last_in_cluster) {
				spin_lock(&si->lock);
				offset -= SWAPFILE_CLUSTER - 1;
				si->cluster_next = offset;
				si->cluster_nr = SWAPFILE_CLUSTER - 1;
				goto checks;
			}
			if (unlikely(--latency_ration < 0)) {
				cond_resched();
				latency_ration = LATENCY_LIMIT;
			}
		}

		offset = scan_base;
		spin_lock(&si->lock);
		si->cluster_nr = SWAPFILE_CLUSTER - 1;
	}

checks:
	if (si->cluster_info) {
		while (scan_swap_map_ssd_cluster_conflict(si, offset))
			scan_swap_map_try_ssd_cluster(si, &offset, &scan_base);
	}
	if (!(si->flags & SWP_WRITEOK))
		goto no_page;
	if (!si->highest_bit)
		goto no_page;
	if (offset > si->highest_bit)
		scan_base = offset = si->lowest_bit;

	/* reuse swap entry of cache-only swap if not busy. */
	if (vm_swap_full() && si->swap_map[offset] == SWAP_HAS_CACHE) {
		int swap_was_freed;
		spin_unlock(&si->lock);
		swap_was_freed = __try_to_reclaim_swap(si, offset);
		spin_lock(&si->lock);
		/* entry was freed successfully, try to use this again */
		if (swap_was_freed)
			goto checks;
		goto scan; /* check next one */
	}

	if (si->swap_map[offset])
		goto scan;

	if (offset == si->lowest_bit)
		si->lowest_bit++;
	if (offset == si->highest_bit)
		si->highest_bit--;
	si->inuse_pages++;
	if (si->inuse_pages == si->pages) {
		si->lowest_bit = si->max;
		si->highest_bit = 0;
	}
	si->swap_map[offset] = usage;
	inc_cluster_info_page(si, si->cluster_info, offset);
	si->cluster_next = offset + 1;
	si->flags -= SWP_SCANNING;

	return offset;

scan:
	spin_unlock(&si->lock);
	while (++offset <= si->highest_bit) {
		if (!si->swap_map[offset]) {
			spin_lock(&si->lock);
			goto checks;
		}
		if (vm_swap_full() && si->swap_map[offset] == SWAP_HAS_CACHE) {
			spin_lock(&si->lock);
			goto checks;
		}
		if (unlikely(--latency_ration < 0)) {
			cond_resched();
			latency_ration = LATENCY_LIMIT;
		}
	}
	offset = si->lowest_bit;
	while (offset < scan_base) {
		if (!si->swap_map[offset]) {
			spin_lock(&si->lock);
			goto checks;
		}
		if (vm_swap_full() && si->swap_map[offset] == SWAP_HAS_CACHE) {
			spin_lock(&si->lock);
			goto checks;
		}
		if (unlikely(--latency_ration < 0)) {
			cond_resched();
			latency_ration = LATENCY_LIMIT;
		}
		offset++;
	}
	spin_lock(&si->lock);

no_page:
	si->flags -= SWP_SCANNING;
	return 0;
}

swp_entry_t get_swap_page(void)
{
	struct swap_info_struct *si;
	pgoff_t offset;
	int type, next;
	int wrapped = 0;
	int hp_index;

	spin_lock(&swap_lock);
	if (atomic_long_read(&nr_swap_pages) <= 0)
		goto noswap;
	atomic_long_dec(&nr_swap_pages);

	for (type = swap_list.next; type >= 0 && wrapped < 2; type = next) {
		hp_index = atomic_xchg(&highest_priority_index, -1);
		/*
		 * highest_priority_index records the current highest priority
		 * swap type which just freed swap entries. If its priority is
		 * higher than that of the swap_list.next swap type, we use it.
		 * It isn't protected by swap_lock, so it can be an invalid
		 * value if the corresponding swap type has been swapped off.
		 * We double check the flags here. It's even possible the swap
		 * type was swapped off and on again and its priority changed.
		 * In such a rare case, a low priority swap type might be used,
		 * but eventually high priority swap will be used after several
		 * rounds of swap.
		 */
		if (hp_index != -1 && hp_index != type &&
		    swap_info[type]->prio < swap_info[hp_index]->prio &&
		    (swap_info[hp_index]->flags & SWP_WRITEOK)) {
			type = hp_index;
			swap_list.next = type;
		}
		si = swap_info[type];
		next = si->next;
		if (next < 0 ||
		    (!wrapped && si->prio != swap_info[next]->prio)) {
			next = swap_list.head;
			wrapped++;
		}

		spin_lock(&si->lock);
		if (!si->highest_bit) {
			spin_unlock(&si->lock);
			continue;
		}
		if (!(si->flags & SWP_WRITEOK)) {
			spin_unlock(&si->lock);
			continue;
		}

		swap_list.next = next;

		spin_unlock(&swap_lock);
		/* This is called for allocating swap entry for cache */
		offset = scan_swap_map(si, SWAP_HAS_CACHE);
		spin_unlock(&si->lock);
		if (offset)
			return swp_entry(type, offset);
		spin_lock(&swap_lock);
		next = swap_list.next;
	}

	atomic_long_inc(&nr_swap_pages);
noswap:
	spin_unlock(&swap_lock);
	return (swp_entry_t) {0};
}
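/*
 * Usage sketch (hypothetical caller): failure is signalled with an
 * all-zero entry, so callers test entry.val:
 *
 *	swp_entry_t entry = get_swap_page();
 *	if (!entry.val)
 *		goto no_swap;
 */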
/* The only caller of this function is now the suspend routine */
swp_entry_t get_swap_page_of_type(int type)
{
	struct swap_info_struct *si;
	pgoff_t offset;
	si = swap_info[type];
	spin_lock(&si->lock);
	if (si && (si->flags & SWP_WRITEOK)) {
		atomic_long_dec(&nr_swap_pages);
		/* This is called for allocating swap entry, not cache */
		offset = scan_swap_map(si, 1);
		if (offset) {
			spin_unlock(&si->lock);
			return swp_entry(type, offset);
		}
		atomic_long_inc(&nr_swap_pages);
	}
	spin_unlock(&si->lock);
	return (swp_entry_t) {0};
}
static struct swap_info_struct *swap_info_get(swp_entry_t entry)
{
	struct swap_info_struct *p;
	unsigned long offset, type;

	if (!entry.val)
		goto out;
	type = swp_type(entry);
	if (type >= nr_swapfiles)
		goto bad_nofile;
	p = swap_info[type];
	if (!(p->flags & SWP_USED))
		goto bad_device;
	offset = swp_offset(entry);
	if (offset >= p->max)
		goto bad_offset;
	if (!p->swap_map[offset])
		goto bad_free;
	spin_lock(&p->lock);
	return p;

bad_free:
	pr_err("swap_free: %s%08lx\n",
	       Unused_offset, entry.val);
	goto out;
bad_offset:
	pr_err("swap_free: %s%08lx\n",
	       Bad_offset, entry.val);
	goto out;
bad_device:
	pr_err("swap_free: %s%08lx\n",
	       Unused_file, entry.val);
	goto out;
bad_nofile:
	pr_err("swap_free: %s%08lx\n",
	       Bad_file, entry.val);
out:
	return NULL;
}
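/*
 * Note that a non-NULL return from swap_info_get() carries p->lock
 * held; every caller pairs it with spin_unlock(&p->lock).
 */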

/*
 * This swap type just freed a swap entry: check whether it is now the
 * highest priority swap type that frees entries.  get_swap_page() uses
 * highest_priority_index to search for the highest priority swap type.
 * The swap_info_struct.lock can't protect us if there are multiple swap
 * types active, so we use atomic_cmpxchg.
 */
static void set_highest_priority_index(int type)
{
	int old_hp_index, new_hp_index;

	do {
		old_hp_index = atomic_read(&highest_priority_index);
		if (old_hp_index != -1 &&
			swap_info[old_hp_index]->prio >= swap_info[type]->prio)
			break;
		new_hp_index = type;
	} while (atomic_cmpxchg(&highest_priority_index,
		old_hp_index, new_hp_index) != old_hp_index);
}

static unsigned char swap_entry_free(struct swap_info_struct *p,
				     swp_entry_t entry, unsigned char usage)
{
	unsigned long offset = swp_offset(entry);
	unsigned char count;
	unsigned char has_cache;

	count = p->swap_map[offset];
	has_cache = count & SWAP_HAS_CACHE;
	count &= ~SWAP_HAS_CACHE;

	if (usage == SWAP_HAS_CACHE) {
		VM_BUG_ON(!has_cache);
		has_cache = 0;
	} else if (count == SWAP_MAP_SHMEM) {
		/*
		 * Or we could insist on shmem.c using a special
		 * swap_shmem_free() and free_shmem_swap_and_cache()...
		 */
		count = 0;
	} else if ((count & ~COUNT_CONTINUED) <= SWAP_MAP_MAX) {
		if (count == COUNT_CONTINUED) {
			if (swap_count_continued(p, offset, count))
				count = SWAP_MAP_MAX | COUNT_CONTINUED;
			else
				count = SWAP_MAP_MAX;
		} else
			count--;
	}

	if (!count)
		mem_cgroup_uncharge_swap(entry);

	usage = count | has_cache;
	p->swap_map[offset] = usage;

	/* free if no reference */
	if (!usage) {
		dec_cluster_info_page(p, p->cluster_info, offset);
		if (offset < p->lowest_bit)
			p->lowest_bit = offset;
		if (offset > p->highest_bit)
			p->highest_bit = offset;
		set_highest_priority_index(p->type);
		atomic_long_inc(&nr_swap_pages);
		p->inuse_pages--;
		frontswap_invalidate_page(p->type, offset);
		if (p->flags & SWP_BLKDEV) {
			struct gendisk *disk = p->bdev->bd_disk;
			if (disk->fops->swap_slot_free_notify)
				disk->fops->swap_slot_free_notify(p->bdev,
								  offset);
		}
	}

	return usage;
}

/*
 * Caller has made sure that the swap device corresponding to entry
 * is still around or has not been recycled.
 */
void swap_free(swp_entry_t entry)
{
	struct swap_info_struct *p;

	p = swap_info_get(entry);
	if (p) {
		swap_entry_free(p, entry, 1);
		spin_unlock(&p->lock);
	}
}

/*
 * Called after dropping swapcache to decrease refcnt to swap entries.
 */
void swapcache_free(swp_entry_t entry, struct page *page)
{
	struct swap_info_struct *p;
	unsigned char count;

	p = swap_info_get(entry);
	if (p) {
		count = swap_entry_free(p, entry, SWAP_HAS_CACHE);
		if (page)
			mem_cgroup_uncharge_swapcache(page, entry, count != 0);
		spin_unlock(&p->lock);
	}
}

/*
 * How many references to page are currently swapped out?
 * This does not give an exact answer when swap count is continued,
 * but does include the high COUNT_CONTINUED flag to allow for that.
 */
int page_swapcount(struct page *page)
{
	int count = 0;
	struct swap_info_struct *p;
	swp_entry_t entry;
	entry.val = page_private(page);
	p = swap_info_get(entry);
	if (p) {
		count = swap_count(p->swap_map[swp_offset(entry)]);
		spin_unlock(&p->lock);
	}
	return count;
}

/*
 * We can write to an anon page without COW if there are no other references
 * to it.  And as a side-effect, free up its swap: because the old content
 * on disk will never be read, and seeking back there to write new content
 * later would only waste time away from clustering.
 */
int reuse_swap_page(struct page *page)
{
	int count;
	VM_BUG_ON_PAGE(!PageLocked(page), page);
	if (unlikely(PageKsm(page)))
		return 0;
	count = page_mapcount(page);
	if (count <= 1 && PageSwapCache(page)) {
		count += page_swapcount(page);
		if (count == 1 && !PageWriteback(page)) {
			delete_from_swap_cache(page);
			SetPageDirty(page);
		}
	}
	return count <= 1;
}

/*
 * If swap is getting full, or if there are no more mappings of this page,
 * then try_to_free_swap is called to free its swap space.
 */
int try_to_free_swap(struct page *page)
{
	VM_BUG_ON_PAGE(!PageLocked(page), page);

	if (!PageSwapCache(page))
		return 0;
	if (PageWriteback(page))
		return 0;
	if (page_swapcount(page))
		return 0;
	/*
	 * Once hibernation has begun to create its image of memory,
	 * there's a danger that one of the calls to try_to_free_swap()
	 * - most probably a call from __try_to_reclaim_swap() while
	 * hibernation is allocating its own swap pages for the image,
	 * but conceivably even a call from memory reclaim - will free
	 * the swap from a page which has already been recorded in the
	 * image as a clean swapcache page, and then reuse its swap for
	 * another page of the image.  On waking from hibernation, the
	 * original page might be freed under memory pressure, then
	 * later read back in from swap, now with the wrong data.
	 *
	 * Hibernation suspends storage while it is writing the image
	 * to disk so check that here.
	 */
	if (pm_suspended_storage())
		return 0;
	delete_from_swap_cache(page);
	SetPageDirty(page);
	return 1;
}

/*
 * Free the swap entry like above, but also try to
 * free the page cache entry if it is the last user.
 */
int free_swap_and_cache(swp_entry_t entry)
{
	struct swap_info_struct *p;
	struct page *page = NULL;
	if (non_swap_entry(entry))
		return 1;

	p = swap_info_get(entry);
	if (p) {
		if (swap_entry_free(p, entry, 1) == SWAP_HAS_CACHE) {
			page = find_get_page(swap_address_space(entry),
						entry.val);
			if (page && !trylock_page(page)) {
				page_cache_release(page);
				page = NULL;
			}
		}
		spin_unlock(&p->lock);
	}
	if (page) {
		/*
		 * Not mapped elsewhere, or swap space full? Free it!
		 * Also recheck PageSwapCache now page is locked (above).
		 */
		if (PageSwapCache(page) && !PageWriteback(page) &&
				(!page_mapped(page) || vm_swap_full())) {
			delete_from_swap_cache(page);
			SetPageDirty(page);
		}
		unlock_page(page);
		page_cache_release(page);
	}
	return p != NULL;
}
#ifdef CONFIG_HIBERNATION
/*
 * Find the swap type that corresponds to given device (if any).
 *
 * @offset - number of the PAGE_SIZE-sized block of the device, starting
 * from 0, in which the swap header is expected to be located.
 *
 * This is needed for the suspend to disk (aka swsusp).
 */
int swap_type_of(dev_t device, sector_t offset, struct block_device **bdev_p)
{
	struct block_device *bdev = NULL;
	int type;

	if (device)
		bdev = bdget(device);
	spin_lock(&swap_lock);
	for (type = 0; type < nr_swapfiles; type++) {
		struct swap_info_struct *sis = swap_info[type];

		if (!(sis->flags & SWP_WRITEOK))
			continue;

		if (!bdev) {
			if (bdev_p)
				*bdev_p = bdgrab(sis->bdev);

			spin_unlock(&swap_lock);
			return type;
		}
		if (bdev == sis->bdev) {
			struct swap_extent *se = &sis->first_swap_extent;

			if (se->start_block == offset) {
				if (bdev_p)
					*bdev_p = bdgrab(sis->bdev);

				spin_unlock(&swap_lock);
				bdput(bdev);
				return type;
			}
		}
	}
	spin_unlock(&swap_lock);
	if (bdev)
		bdput(bdev);
	return -ENODEV;
}

/*
 * Get the (PAGE_SIZE) block corresponding to given offset on the swapdev
 * corresponding to given index in swap_info (swap type).
 */
sector_t swapdev_block(int type, pgoff_t offset)
{
	struct block_device *bdev;

	if ((unsigned int)type >= nr_swapfiles)
		return 0;
	if (!(swap_info[type]->flags & SWP_WRITEOK))
		return 0;
	return map_swap_entry(swp_entry(type, offset), &bdev);
}

/*
 * Return either the total number of swap pages of given type, or the number
 * of free pages of that type (depending on @free)
 *
 * This is needed for software suspend
 */
unsigned int count_swap_pages(int type, int free)
{
	unsigned int n = 0;
	spin_lock(&swap_lock);
	if ((unsigned int)type < nr_swapfiles) {
		struct swap_info_struct *sis = swap_info[type];
		spin_lock(&sis->lock);
		if (sis->flags & SWP_WRITEOK) {
			n = sis->pages;
			if (free)
				n -= sis->inuse_pages;
		}
		spin_unlock(&sis->lock);
	}
	spin_unlock(&swap_lock);
	return n;
}
#endif /* CONFIG_HIBERNATION */

static inline int maybe_same_pte(pte_t pte, pte_t swp_pte)
{
#ifdef CONFIG_MEM_SOFT_DIRTY
	/*
	 * When a pte keeps the soft dirty bit, the pte generated
	 * from the swap entry does not have it; still it is the
	 * same pte from a logical point of view.
	 */
	pte_t swp_pte_dirty = pte_swp_mksoft_dirty(swp_pte);
	return pte_same(pte, swp_pte) || pte_same(pte, swp_pte_dirty);
#else
	return pte_same(pte, swp_pte);
#endif
}
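/*
 * Concretely (a sketch of the case handled above): a swap pte written
 * at unmap time may carry the soft dirty bit, while the pte built by
 * swp_entry_to_pte() never does, so both forms must be compared.
 */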
/*
 * No need to decide whether this PTE shares the swap entry with others,
 * just let do_wp_page work it out if a write is requested later - to
 * force COW, vm_page_prot omits write permission from any private vma.
 */
static int unuse_pte(struct vm_area_struct *vma, pmd_t *pmd,
		unsigned long addr, swp_entry_t entry, struct page *page)
{
	struct page *swapcache;
	struct mem_cgroup *memcg;
	spinlock_t *ptl;
	pte_t *pte;
	int ret = 1;
	swapcache = page;
	page = ksm_might_need_to_copy(page, vma, addr);
	if (unlikely(!page))
		return -ENOMEM;
	if (mem_cgroup_try_charge_swapin(vma->vm_mm, page,
					 GFP_KERNEL, &memcg)) {
		ret = -ENOMEM;
		goto out_nolock;
	}

	pte = pte_offset_map_lock(vma->vm_mm, pmd, addr, &ptl);
	if (unlikely(!maybe_same_pte(*pte, swp_entry_to_pte(entry)))) {
		mem_cgroup_cancel_charge_swapin(memcg);
		ret = 0;
		goto out;
	}

	dec_mm_counter(vma->vm_mm, MM_SWAPENTS);
	inc_mm_counter(vma->vm_mm, MM_ANONPAGES);
	get_page(page);
	set_pte_at(vma->vm_mm, addr, pte,
		   pte_mkold(mk_pte(page, vma->vm_page_prot)));
	if (page == swapcache)
		page_add_anon_rmap(page, vma, addr);
	else /* ksm created a completely new copy */
		page_add_new_anon_rmap(page, vma, addr);
	mem_cgroup_commit_charge_swapin(page, memcg);
	swap_free(entry);
	/*
	 * Move the page to the active list so it is not
	 * immediately swapped out again after swapon.
	 */
	activate_page(page);
out:
	pte_unmap_unlock(pte, ptl);
out_nolock:
	if (page != swapcache) {
		unlock_page(page);
		put_page(page);
	}
	return ret;
}

static int unuse_pte_range(struct vm_area_struct *vma, pmd_t *pmd,
				unsigned long addr, unsigned long end,
				swp_entry_t entry, struct page *page)
{
	pte_t swp_pte = swp_entry_to_pte(entry);
	pte_t *pte;
	int ret = 0;

	/*
	 * We don't actually need pte lock while scanning for swp_pte: since
	 * we hold page lock and mmap_sem, swp_pte cannot be inserted into the
	 * page table while we're scanning; though it could get zapped, and on
	 * some architectures (e.g. x86_32 with PAE) we might catch a glimpse
	 * of unmatched parts which look like swp_pte, so unuse_pte must
	 * recheck under pte lock.  Scanning without pte lock lets it be
	 * preemptable whenever CONFIG_PREEMPT but not CONFIG_HIGHPTE.
	 */
	pte = pte_offset_map(pmd, addr);
	do {
		/*
		 * swapoff spends a _lot_ of time in this loop!
		 * Test inline before going to call unuse_pte.
		 */
		if (unlikely(maybe_same_pte(*pte, swp_pte))) {
			pte_unmap(pte);
			ret = unuse_pte(vma, pmd, addr, entry, page);
			if (ret)
				goto out;
			pte = pte_offset_map(pmd, addr);
		}
	} while (pte++, addr += PAGE_SIZE, addr != end);
	pte_unmap(pte - 1);
out:
	return ret;
}

static inline int unuse_pmd_range(struct vm_area_struct *vma, pud_t *pud,
				unsigned long addr, unsigned long end,
				swp_entry_t entry, struct page *page)
{
	pmd_t *pmd;
	unsigned long next;
	int ret;

	pmd = pmd_offset(pud, addr);
	do {
		next = pmd_addr_end(addr, end);
		if (pmd_none_or_trans_huge_or_clear_bad(pmd))
			continue;
		ret = unuse_pte_range(vma, pmd, addr, next, entry, page);
		if (ret)
			return ret;
	} while (pmd++, addr = next, addr != end);
	return 0;
}

static inline int unuse_pud_range(struct vm_area_struct *vma, pgd_t *pgd,
				unsigned long addr, unsigned long end,
				swp_entry_t entry, struct page *page)
{
	pud_t *pud;
	unsigned long next;
	int ret;

	pud = pud_offset(pgd, addr);
	do {
		next = pud_addr_end(addr, end);
		if (pud_none_or_clear_bad(pud))
			continue;
		ret = unuse_pmd_range(vma, pud, addr, next, entry, page);
		if (ret)
			return ret;
	} while (pud++, addr = next, addr != end);
	return 0;
}

static int unuse_vma(struct vm_area_struct *vma,
				swp_entry_t entry, struct page *page)
{
	pgd_t *pgd;
	unsigned long addr, end, next;
	int ret;

	if (page_anon_vma(page)) {
		addr = page_address_in_vma(page, vma);
		if (addr == -EFAULT)
			return 0;
		else
			end = addr + PAGE_SIZE;
	} else {
		addr = vma->vm_start;
		end = vma->vm_end;
	}

	pgd = pgd_offset(vma->vm_mm, addr);
	do {
		next = pgd_addr_end(addr, end);
		if (pgd_none_or_clear_bad(pgd))
			continue;
		ret = unuse_pud_range(vma, pgd, addr, next, entry, page);
		if (ret)
			return ret;
	} while (pgd++, addr = next, addr != end);
	return 0;
}

static int unuse_mm(struct mm_struct *mm,
				swp_entry_t entry, struct page *page)
{
	struct vm_area_struct *vma;
	int ret = 0;

	if (!down_read_trylock(&mm->mmap_sem)) {
		/*
		 * Activate page so shrink_inactive_list is unlikely to unmap
		 * its ptes while lock is dropped, so swapoff can make progress.
		 */
		activate_page(page);
		unlock_page(page);
		down_read(&mm->mmap_sem);
		lock_page(page);
	}
	for (vma = mm->mmap; vma; vma = vma->vm_next) {
		if (vma->anon_vma && (ret = unuse_vma(vma, entry, page)))
			break;
	}
	up_read(&mm->mmap_sem);
	return (ret < 0)? ret: 0;
}

/*
1da177e4c
|
1265 1266 1267 |
} /* |
38b5faf4b
|
1268 1269 |
* Scan swap_map (or frontswap_map if frontswap parameter is true) * from current position to next entry still in use. |
1da177e4c
|
1270 1271 |
* Recycle to start on reaching the end, returning 0 when empty. */ |
6eb396dc4
|
1272 |
static unsigned int find_next_to_unuse(struct swap_info_struct *si, |
38b5faf4b
|
1273 |
unsigned int prev, bool frontswap) |
1da177e4c
|
1274 |
{ |
6eb396dc4
|
1275 1276 |
unsigned int max = si->max; unsigned int i = prev; |
8d69aaee8
|
1277 |
unsigned char count; |
1da177e4c
|
1278 1279 |
/* |
5d337b919
|
1280 |
* No need for swap_lock here: we're just looking |
1da177e4c
|
1281 1282 |
* for whether an entry is in use, not modifying it; false * hits are okay, and sys_swapoff() has already prevented new |
5d337b919
|
1283 |
* allocations from this area (while holding swap_lock). |
1da177e4c
|
1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 |
*/ for (;;) { if (++i >= max) { if (!prev) { i = 0; break; } /* * No entries in use at top of swap_map, * loop back to start and recheck there. */ max = prev + 1; prev = 0; i = 1; } |
38b5faf4b
|
1299 1300 1301 1302 1303 1304 |
if (frontswap) { if (frontswap_test(si, i)) break; else continue; } |
edfe23dac
|
1305 |
count = ACCESS_ONCE(si->swap_map[i]); |
355cfa73d
|
1306 |
if (count && swap_count(count) != SWAP_MAP_BAD) |
1da177e4c
|
1307 1308 1309 1310 1311 1312 1313 1314 1315 |
break; } return i; } /* * We completely avoid races by reading each swap page in advance, * and then search for the process using it. All the necessary * page table adjustments can then be made atomically. |
38b5faf4b
|
1316 1317 1318 |
* * if the boolean frontswap is true, only unuse pages_to_unuse pages; * pages_to_unuse==0 means all pages; ignored if frontswap is false |
1da177e4c
|
1319 |
*/ |
38b5faf4b
|
1320 1321 |
int try_to_unuse(unsigned int type, bool frontswap, unsigned long pages_to_unuse) |
1da177e4c
|
1322 |
{ |
efa90a981
|
1323 |
struct swap_info_struct *si = swap_info[type]; |
1da177e4c
|
1324 |
struct mm_struct *start_mm; |
edfe23dac
|
1325 1326 1327 1328 1329 |
volatile unsigned char *swap_map; /* swap_map is accessed without * locking. Mark it as volatile * to prevent compiler doing * something odd. */ |
8d69aaee8
|
1330 |
unsigned char swcount; |
1da177e4c
|
1331 1332 |
struct page *page; swp_entry_t entry; |
6eb396dc4
|
1333 |
unsigned int i = 0; |
1da177e4c
|
1334 |
int retval = 0; |
1da177e4c
|
1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 |
/* * When searching mms for an entry, a good strategy is to * start at the first mm we freed the previous entry from * (though actually we don't notice whether we or coincidence * freed the entry). Initialize this start_mm with a hold. * * A simpler strategy would be to start at the last mm we * freed the previous entry from; but that would take less * advantage of mmlist ordering, which clusters forked mms * together, child after parent. If we race with dup_mmap(), we * prefer to resolve parent before child, lest we miss entries * duplicated after we scanned child: using last mm would invert |
570a335b8
|
1348 |
* that. |
1da177e4c
|
1349 1350 1351 1352 1353 1354 1355 1356 1357 |
*/ start_mm = &init_mm; atomic_inc(&init_mm.mm_users); /* * Keep on scanning until all entries have gone. Usually, * one pass through swap_map is enough, but not necessarily: * there are races when an instance of an entry might be missed. */ |
38b5faf4b
|
1358 |
while ((i = find_next_to_unuse(si, i, frontswap)) != 0) { |
1da177e4c
|
1359 1360 1361 1362 |
if (signal_pending(current)) { retval = -EINTR; break; } |
886bb7e9c
|
1363 |
/* |
1da177e4c
|
1364 1365 |
* Get a page for the entry, using the existing swap * cache page if there is one. Otherwise, get a clean |
886bb7e9c
|
1366 |
* page and read the swap into it. |
1da177e4c
|
1367 1368 1369 |
*/ swap_map = &si->swap_map[i]; entry = swp_entry(type, i); |
02098feaa
|
1370 1371 |
page = read_swap_cache_async(entry, GFP_HIGHUSER_MOVABLE, NULL, 0); |
1da177e4c
|
1372 1373 1374 1375 1376 1377 1378 |
if (!page) { /* * Either swap_duplicate() failed because entry * has been freed independently, and will not be * reused since sys_swapoff() already disabled * allocation from here, or alloc_page() failed. */ |
edfe23dac
|
1379 1380 1381 1382 1383 1384 1385 1386 1387 |
swcount = *swap_map; /* * We don't hold lock here, so the swap entry could be * SWAP_MAP_BAD (when the cluster is discarding). * Instead of fail out, We can just skip the swap * entry because swapoff will wait for discarding * finish anyway. */ if (!swcount || swcount == SWAP_MAP_BAD) |
1da177e4c
|
1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 |
continue; retval = -ENOMEM; break; } /* * Don't hold on to start_mm if it looks like exiting. */ if (atomic_read(&start_mm->mm_users) == 1) { mmput(start_mm); start_mm = &init_mm; atomic_inc(&init_mm.mm_users); } /* * Wait for and lock page. When do_swap_page races with * try_to_unuse, do_swap_page can handle the fault much * faster than try_to_unuse can locate the entry. This * apparently redundant "wait_on_page_locked" lets try_to_unuse * defer to do_swap_page in such a case - in some tests, * do_swap_page and try_to_unuse repeatedly compete. */ wait_on_page_locked(page); wait_on_page_writeback(page); lock_page(page); wait_on_page_writeback(page); /* * Remove all references to entry. |
1da177e4c
|
1417 |
*/ |
1da177e4c
|
1418 |
swcount = *swap_map; |
aaa468653
|
1419 1420 1421 1422 1423 1424 |
if (swap_count(swcount) == SWAP_MAP_SHMEM) { retval = shmem_unuse(entry, page); /* page has already been unlocked and released */ if (retval < 0) break; continue; |
1da177e4c
|
1425 |
} |
aaa468653
|
1426 1427 |
if (swap_count(swcount) && start_mm != &init_mm) retval = unuse_mm(start_mm, entry, page); |
355cfa73d
|
1428 |
if (swap_count(*swap_map)) { |
1da177e4c
|
1429 1430 1431 1432 1433 1434 1435 1436 1437 |
int set_start_mm = (*swap_map >= swcount); struct list_head *p = &start_mm->mmlist; struct mm_struct *new_start_mm = start_mm; struct mm_struct *prev_mm = start_mm; struct mm_struct *mm; atomic_inc(&new_start_mm->mm_users); atomic_inc(&prev_mm->mm_users); spin_lock(&mmlist_lock); |
aaa468653
|
1438 |
while (swap_count(*swap_map) && !retval && |
1da177e4c
|
1439 1440 |
(p = p->next) != &start_mm->mmlist) { mm = list_entry(p, struct mm_struct, mmlist); |
70af7c5c6
|
1441 |
if (!atomic_inc_not_zero(&mm->mm_users)) |
1da177e4c
|
1442 |
continue; |
1da177e4c
|
1443 1444 1445 1446 1447 1448 1449 |
spin_unlock(&mmlist_lock); mmput(prev_mm); prev_mm = mm; cond_resched(); swcount = *swap_map; |
355cfa73d
|
1450 |
if (!swap_count(swcount)) /* any usage ? */ |
1da177e4c
|
1451 |
; |
aaa468653
|
1452 |
else if (mm == &init_mm) |
1da177e4c
|
1453 |
set_start_mm = 1; |
aaa468653
|
1454 |
else |
1da177e4c
|
1455 |
retval = unuse_mm(mm, entry, page); |
355cfa73d
|
1456 |
|
32c5fc10e
|
1457 |
if (set_start_mm && *swap_map < swcount) { |
1da177e4c
|
1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 |
mmput(new_start_mm); atomic_inc(&mm->mm_users); new_start_mm = mm; set_start_mm = 0; } spin_lock(&mmlist_lock); } spin_unlock(&mmlist_lock); mmput(prev_mm); mmput(start_mm); start_mm = new_start_mm; } if (retval) { unlock_page(page); page_cache_release(page); break; } /* |
1da177e4c
|
1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 |
* If a reference remains (rare), we would like to leave * the page in the swap cache; but try_to_unmap could * then re-duplicate the entry once we drop page lock, * so we might loop indefinitely; also, that page could * not be swapped out to other storage meanwhile. So: * delete from cache even if there's another reference, * after ensuring that the data has been saved to disk - * since if the reference remains (rarer), it will be * read from disk into another page. Splitting into two * pages would be incorrect if swap supported "shared * private" pages, but they are handled by tmpfs files. |
5ad646880
|
1488 1489 1490 1491 1492 1493 |
* * Given how unuse_vma() targets one particular offset * in an anon_vma, once the anon_vma has been determined, * this splitting happens to be just what is needed to * handle where KSM pages have been swapped out: re-reading * is unnecessarily slow, but we can fix that later on. |
1da177e4c
|
1494 |
*/ |
355cfa73d
|
1495 1496 |
if (swap_count(*swap_map) && PageDirty(page) && PageSwapCache(page)) { |
1da177e4c
|
1497 1498 1499 1500 1501 1502 1503 1504 |
struct writeback_control wbc = { .sync_mode = WB_SYNC_NONE, }; swap_writepage(page, &wbc); lock_page(page); wait_on_page_writeback(page); } |
68bdc8d64
|
1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 |
/* * It is conceivable that a racing task removed this page from * swap cache just before we acquired the page lock at the top, * or while we dropped it in unuse_mm(). The page might even * be back in swap cache on another swap area: that we must not * delete, since it may not have been written out to swap yet. */ if (PageSwapCache(page) && likely(page_private(page) == entry.val)) |
2e0e26c76
|
1515 |
delete_from_swap_cache(page); |
1da177e4c
|
1516 1517 1518 1519 |
/* * So we could skip searching mms once swap count went * to 1, we did not mark any present ptes as dirty: must |
2706a1b89
|
1520 |
* mark page dirty so shrink_page_list will preserve it. |
1da177e4c
|
1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 |
*/ SetPageDirty(page); unlock_page(page); page_cache_release(page); /* * Make sure that we aren't completely killing * interactive performance. */ cond_resched(); |
38b5faf4b
|
1531 1532 1533 1534 |
if (frontswap && pages_to_unuse > 0) { if (!--pages_to_unuse) break; } |
1da177e4c
|
1535 1536 1537 |
} mmput(start_mm); |
1da177e4c
|
1538 1539 1540 1541 |
return retval; } /* |
5d337b919
|
1542 1543 1544 |
* After a successful try_to_unuse, if no swap is now in use, we know * we can empty the mmlist. swap_lock must be held on entry and exit. * Note that mmlist_lock nests inside swap_lock, and an mm must be |
1da177e4c
|
1545 1546 1547 1548 1549 |
* added to the mmlist just after page_duplicate - before would be racy. */ static void drain_mmlist(void) { struct list_head *p, *next; |
efa90a981
|
1550 |
unsigned int type; |
1da177e4c
|
1551 |
|
efa90a981
|
1552 1553 |
for (type = 0; type < nr_swapfiles; type++) if (swap_info[type]->inuse_pages) |
1da177e4c
|
1554 1555 1556 1557 1558 1559 1560 1561 1562 |
return; spin_lock(&mmlist_lock); list_for_each_safe(p, next, &init_mm.mmlist) list_del_init(p); spin_unlock(&mmlist_lock); } /* * Use this swapdev's extent info to locate the (PAGE_SIZE) block which |
d4906e1aa
|
1563 1564 1565 |
* corresponds to page offset for the specified swap entry. * Note that the type of this function is sector_t, but it returns page offset * into the bdev, not sector offset. |
1da177e4c
|
1566 |
*/ |
d4906e1aa
|
1567 |
static sector_t map_swap_entry(swp_entry_t entry, struct block_device **bdev) |
1da177e4c
|
1568 |
{ |
f29ad6a99
|
1569 1570 1571 1572 |
struct swap_info_struct *sis; struct swap_extent *start_se; struct swap_extent *se; pgoff_t offset; |
efa90a981
|
1573 |
sis = swap_info[swp_type(entry)]; |
f29ad6a99
|
1574 1575 1576 1577 1578 |
*bdev = sis->bdev; offset = swp_offset(entry); start_se = sis->curr_swap_extent; se = start_se; |
1da177e4c
|
1579 1580 1581 1582 1583 1584 1585 1586 |
for ( ; ; ) { struct list_head *lh; if (se->start_page <= offset && offset < (se->start_page + se->nr_pages)) { return se->start_block + (offset - se->start_page); } |
11d31886d
|
1587 |
lh = se->list.next; |
1da177e4c
|
1588 1589 1590 1591 1592 1593 1594 |
se = list_entry(lh, struct swap_extent, list); sis->curr_swap_extent = se; BUG_ON(se == start_se); /* It *must* be present */ } } /* |
d4906e1aa
|
1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 |
* Returns the page offset into bdev for the specified page's swap entry. */ sector_t map_swap_page(struct page *page, struct block_device **bdev) { swp_entry_t entry; entry.val = page_private(page); return map_swap_entry(entry, bdev); } /* |
1da177e4c
|
1605 1606 1607 1608 |
* Free all of a swapdev's extent information */ static void destroy_swap_extents(struct swap_info_struct *sis) { |
9625a5f28
|
1609 |
while (!list_empty(&sis->first_swap_extent.list)) { |
1da177e4c
|
1610 |
struct swap_extent *se; |
9625a5f28
|
1611 |
se = list_entry(sis->first_swap_extent.list.next, |
1da177e4c
|
1612 1613 1614 1615 |
struct swap_extent, list); list_del(&se->list); kfree(se); } |
62c230bc1
|
1616 1617 1618 1619 1620 1621 1622 1623 |
if (sis->flags & SWP_FILE) { struct file *swap_file = sis->swap_file; struct address_space *mapping = swap_file->f_mapping; sis->flags &= ~SWP_FILE; mapping->a_ops->swap_deactivate(swap_file); } |
1da177e4c
|
1624 1625 1626 1627 |
} /* * Add a block range (and the corresponding page range) into this swapdev's |
11d31886d
|
1628 |
* extent list. The extent list is kept sorted in page order. |
1da177e4c
|
1629 |
* |
11d31886d
|
1630 |
* This function rather assumes that it is called in ascending page order. |
1da177e4c
|
1631 |
*/ |
a509bc1a9
|
1632 |
int |
1da177e4c
|
1633 1634 1635 1636 1637 1638 |
add_swap_extent(struct swap_info_struct *sis, unsigned long start_page, unsigned long nr_pages, sector_t start_block) { struct swap_extent *se; struct swap_extent *new_se; struct list_head *lh; |
9625a5f28
|
1639 1640 1641 1642 1643 1644 1645 1646 1647 |
if (start_page == 0) { se = &sis->first_swap_extent; sis->curr_swap_extent = se; se->start_page = 0; se->nr_pages = nr_pages; se->start_block = start_block; return 1; } else { lh = sis->first_swap_extent.list.prev; /* Highest extent */ |
1da177e4c
|
1648 |
se = list_entry(lh, struct swap_extent, list); |
11d31886d
|
1649 1650 |
BUG_ON(se->start_page + se->nr_pages != start_page); if (se->start_block + se->nr_pages == start_block) { |
1da177e4c
|
1651 1652 1653 1654 |
/* Merge it */ se->nr_pages += nr_pages; return 0; } |
1da177e4c
|
1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 |
} /* * No merge. Insert a new extent, preserving ordering. */ new_se = kmalloc(sizeof(*se), GFP_KERNEL); if (new_se == NULL) return -ENOMEM; new_se->start_page = start_page; new_se->nr_pages = nr_pages; new_se->start_block = start_block; |
9625a5f28
|
1666 |
list_add_tail(&new_se->list, &sis->first_swap_extent.list); |
53092a740
|
1667 |
return 1; |
1da177e4c
|
1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 |
} /* * A `swap extent' is a simple thing which maps a contiguous range of pages * onto a contiguous range of disk blocks. An ordered list of swap extents * is built at swapon time and is then used at swap_writepage/swap_readpage * time for locating where on disk a page belongs. * * If the swapfile is an S_ISBLK block device, a single extent is installed. * This is done so that the main operating code can treat S_ISBLK and S_ISREG * swap files identically. * * Whether the swapdev is an S_ISREG file or an S_ISBLK blockdev, the swap * extent list operates in PAGE_SIZE disk blocks. Both S_ISREG and S_ISBLK * swapfiles are handled *identically* after swapon time. * * For S_ISREG swapfiles, setup_swap_extents() will walk all the file's blocks * and will parse them into an ordered extent list, in PAGE_SIZE chunks. If * some stray blocks are found which do not fall within the PAGE_SIZE alignment * requirements, they are simply tossed out - we will never use those blocks * for swapping. * |
b0d9bcd4b
|
1690 |
* For S_ISREG swapfiles we set S_SWAPFILE across the life of the swapon. This |
1da177e4c
|
1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 |
* prevents root from shooting her foot off by ftruncating an in-use swapfile, * which will scribble on the fs. * * The amount of disk space which a single swap extent represents varies. * Typically it is in the 1-4 megabyte range. So we can have hundreds of * extents in the list. To avoid much list walking, we cache the previous * search location in `curr_swap_extent', and start new searches from there. * This is extremely effective. The average number of iterations in * map_swap_page() has been measured at about 0.3 per page. - akpm. */ |
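To make the extent machinery concrete, here is a minimal stand-alone model of the lookup that map_swap_entry() performs, with a plain array standing in for the kernel's linked extent list; the struct layout and the numbers below are invented for illustration only.

#include <stdio.h>

struct extent {
	unsigned long start_page;	/* first swap page offset covered */
	unsigned long nr_pages;		/* length of the run */
	unsigned long start_block;	/* first PAGE_SIZE block on disk */
};

/* Same containment test map_swap_entry() applies to each list node. */
static long lookup(const struct extent *ext, int n, unsigned long offset)
{
	for (int i = 0; i < n; i++)
		if (ext[i].start_page <= offset &&
		    offset < ext[i].start_page + ext[i].nr_pages)
			return ext[i].start_block + (offset - ext[i].start_page);
	return -1;	/* a valid swap offset is always covered */
}

int main(void)
{
	/* two discontiguous disk runs backing swap offsets 0..1023 */
	const struct extent map[] = {
		{ .start_page = 0,   .nr_pages = 512, .start_block = 10000 },
		{ .start_page = 512, .nr_pages = 512, .start_block = 40000 },
	};
	printf("offset 700 -> block %ld\n", lookup(map, 2, 700)); /* 40188 */
	return 0;
}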
53092a740
|
1701 |
static int setup_swap_extents(struct swap_info_struct *sis, sector_t *span) |
1da177e4c
|
1702 |
{ |
62c230bc1
|
1703 1704 1705 |
struct file *swap_file = sis->swap_file; struct address_space *mapping = swap_file->f_mapping; struct inode *inode = mapping->host; |
1da177e4c
|
1706 |
int ret; |
1da177e4c
|
1707 1708 |
if (S_ISBLK(inode->i_mode)) { ret = add_swap_extent(sis, 0, sis->max, 0); |
53092a740
|
1709 |
*span = sis->pages; |
a509bc1a9
|
1710 |
return ret; |
1da177e4c
|
1711 |
} |
62c230bc1
|
1712 |
if (mapping->a_ops->swap_activate) { |
a509bc1a9
|
1713 |
ret = mapping->a_ops->swap_activate(sis, swap_file, span); |
62c230bc1
|
1714 1715 1716 1717 1718 |
if (!ret) { sis->flags |= SWP_FILE; ret = add_swap_extent(sis, 0, sis->max, 0); *span = sis->pages; } |
a509bc1a9
|
1719 |
return ret; |
62c230bc1
|
1720 |
} |
a509bc1a9
|
1721 |
return generic_swapfile_activate(sis, swap_file, span); |
1da177e4c
|
1722 |
} |
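The merge rule in add_swap_extent() above can also be sketched in isolation: a range whose disk run continues the previous extent is folded into it, anything else starts a new extent. This is a user-space approximation with invented numbers, not the kernel's list-based structures.

#include <stdio.h>

struct extent { unsigned long start_page, nr_pages, start_block; };

/* Append a page range; merge when it extends the last extent's disk run.
 * The caller is assumed to add ranges in ascending page order. */
static int add_extent(struct extent *tab, int *n, unsigned long start_page,
		      unsigned long nr_pages, unsigned long start_block)
{
	if (*n) {
		struct extent *last = &tab[*n - 1];
		if (last->start_block + last->nr_pages == start_block) {
			last->nr_pages += nr_pages;	/* merge */
			return 0;
		}
	}
	tab[(*n)++] = (struct extent){ start_page, nr_pages, start_block };
	return 1;
}

int main(void)
{
	struct extent tab[8];
	int n = 0;

	add_extent(tab, &n, 0, 100, 5000);
	add_extent(tab, &n, 100, 50, 5100);	/* contiguous on disk: merged */
	add_extent(tab, &n, 150, 50, 9000);	/* disk gap: new extent */
	printf("%d extents, first covers %lu pages\n", n, tab[0].nr_pages);
	return 0;
}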
cf0cac0a0
|
1723 |
static void _enable_swap_info(struct swap_info_struct *p, int prio, |
2a8f94493
|
1724 1725 |
unsigned char *swap_map, struct swap_cluster_info *cluster_info) |
40531542e
|
1726 1727 |
{ int i, prev; |
40531542e
|
1728 1729 1730 1731 1732 |
if (prio >= 0) p->prio = prio; else p->prio = --least_priority; p->swap_map = swap_map; |
2a8f94493
|
1733 |
p->cluster_info = cluster_info; |
40531542e
|
1734 |
p->flags |= SWP_WRITEOK; |
ec8acf20a
|
1735 |
atomic_long_add(p->pages, &nr_swap_pages); |
40531542e
|
1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 |
total_swap_pages += p->pages; /* insert swap space into swap_list: */ prev = -1; for (i = swap_list.head; i >= 0; i = swap_info[i]->next) { if (p->prio >= swap_info[i]->prio) break; prev = i; } p->next = i; if (prev < 0) swap_list.head = swap_list.next = p->type; else swap_info[prev]->next = p->type; |
cf0cac0a0
|
1750 1751 1752 1753 |
} static void enable_swap_info(struct swap_info_struct *p, int prio, unsigned char *swap_map, |
2a8f94493
|
1754 |
struct swap_cluster_info *cluster_info, |
cf0cac0a0
|
1755 1756 |
unsigned long *frontswap_map) { |
4f89849da
|
1757 |
frontswap_init(p->type, frontswap_map); |
cf0cac0a0
|
1758 |
spin_lock(&swap_lock); |
ec8acf20a
|
1759 |
spin_lock(&p->lock); |
2a8f94493
|
1760 |
_enable_swap_info(p, prio, swap_map, cluster_info); |
ec8acf20a
|
1761 |
spin_unlock(&p->lock); |
cf0cac0a0
|
1762 1763 1764 1765 1766 1767 |
spin_unlock(&swap_lock); } static void reinsert_swap_info(struct swap_info_struct *p) { spin_lock(&swap_lock); |
ec8acf20a
|
1768 |
spin_lock(&p->lock); |
2a8f94493
|
1769 |
_enable_swap_info(p, p->prio, p->swap_map, p->cluster_info); |
ec8acf20a
|
1770 |
spin_unlock(&p->lock); |
40531542e
|
1771 1772 |
spin_unlock(&swap_lock); } |
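The swap_list insertion done by _enable_swap_info() above is an ordered insert into a singly linked list of array indices, kept sorted by descending priority so allocation scans higher-priority areas first. A stand-alone sketch with hypothetical slot numbers:

#include <stdio.h>

#define NSLOTS 4
static int prio[NSLOTS];
static int next_slot[NSLOTS];
static int head = -1;

static void insert(int slot)
{
	int i, prev = -1;

	for (i = head; i >= 0; i = next_slot[i]) {
		if (prio[slot] >= prio[i])
			break;		/* insert before first lower prio */
		prev = i;
	}
	next_slot[slot] = i;
	if (prev < 0)
		head = slot;
	else
		next_slot[prev] = slot;
}

int main(void)
{
	prio[0] = -1; insert(0);	/* default negative priority */
	prio[1] = 5;  insert(1);	/* preferred: becomes the head */
	for (int i = head; i >= 0; i = next_slot[i])
		printf("slot %d prio %d\n", i, prio[i]);
	return 0;
}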
c4ea37c26
|
1773 |
SYSCALL_DEFINE1(swapoff, const char __user *, specialfile) |
1da177e4c
|
1774 |
{ |
73c34b6ac
|
1775 |
struct swap_info_struct *p = NULL; |
8d69aaee8
|
1776 |
unsigned char *swap_map; |
2a8f94493
|
1777 |
struct swap_cluster_info *cluster_info; |
4f89849da
|
1778 |
unsigned long *frontswap_map; |
1da177e4c
|
1779 1780 1781 |
struct file *swap_file, *victim; struct address_space *mapping; struct inode *inode; |
91a27b2a7
|
1782 |
struct filename *pathname; |
1da177e4c
|
1783 1784 |
int i, type, prev; int err; |
5b808a230
|
1785 |
unsigned int old_block_size; |
886bb7e9c
|
1786 |
|
1da177e4c
|
1787 1788 |
if (!capable(CAP_SYS_ADMIN)) return -EPERM; |
191c54244
|
1789 |
BUG_ON(!current->mm); |
1da177e4c
|
1790 |
pathname = getname(specialfile); |
1da177e4c
|
1791 |
if (IS_ERR(pathname)) |
f58b59c1d
|
1792 |
return PTR_ERR(pathname); |
1da177e4c
|
1793 |
|
669abf4e5
|
1794 |
victim = file_open_name(pathname, O_RDWR|O_LARGEFILE, 0); |
1da177e4c
|
1795 1796 1797 1798 1799 1800 |
err = PTR_ERR(victim); if (IS_ERR(victim)) goto out; mapping = victim->f_mapping; prev = -1; |
5d337b919
|
1801 |
spin_lock(&swap_lock); |
efa90a981
|
1802 1803 |
for (type = swap_list.head; type >= 0; type = swap_info[type]->next) { p = swap_info[type]; |
22c6f8fdb
|
1804 |
if (p->flags & SWP_WRITEOK) { |
1da177e4c
|
1805 1806 1807 1808 1809 1810 1811 |
if (p->swap_file->f_mapping == mapping) break; } prev = type; } if (type < 0) { err = -EINVAL; |
5d337b919
|
1812 |
spin_unlock(&swap_lock); |
1da177e4c
|
1813 1814 |
goto out_dput; } |
191c54244
|
1815 |
if (!security_vm_enough_memory_mm(current->mm, p->pages)) |
1da177e4c
|
1816 1817 1818 |
vm_unacct_memory(p->pages); else { err = -ENOMEM; |
5d337b919
|
1819 |
spin_unlock(&swap_lock); |
1da177e4c
|
1820 1821 |
goto out_dput; } |
efa90a981
|
1822 |
if (prev < 0) |
1da177e4c
|
1823 |
swap_list.head = p->next; |
efa90a981
|
1824 1825 |
else swap_info[prev]->next = p->next; |
1da177e4c
|
1826 1827 1828 1829 |
if (type == swap_list.next) { /* just pick something that's safe... */ swap_list.next = swap_list.head; } |
ec8acf20a
|
1830 |
spin_lock(&p->lock); |
78ecba081
|
1831 |
if (p->prio < 0) { |
efa90a981
|
1832 1833 |
for (i = p->next; i >= 0; i = swap_info[i]->next) swap_info[i]->prio = p->prio--; |
78ecba081
|
1834 1835 |
least_priority++; } |
ec8acf20a
|
1836 |
atomic_long_sub(p->pages, &nr_swap_pages); |
1da177e4c
|
1837 1838 |
total_swap_pages -= p->pages; p->flags &= ~SWP_WRITEOK; |
ec8acf20a
|
1839 |
spin_unlock(&p->lock); |
5d337b919
|
1840 |
spin_unlock(&swap_lock); |
fb4f88dca
|
1841 |
|
e1e12d2f3
|
1842 |
set_current_oom_origin(); |
38b5faf4b
|
1843 |
err = try_to_unuse(type, false, 0); /* force all pages to be unused */ |
e1e12d2f3
|
1844 |
clear_current_oom_origin(); |
1da177e4c
|
1845 |
|
1da177e4c
|
1846 1847 |
if (err) { /* re-insert swap space back into swap_list */ |
cf0cac0a0
|
1848 |
reinsert_swap_info(p); |
1da177e4c
|
1849 1850 |
goto out_dput; } |
52b7efdbe
|
1851 |
|
815c2c543
|
1852 |
flush_work(&p->discard_work); |
5d337b919
|
1853 |
destroy_swap_extents(p); |
570a335b8
|
1854 1855 |
if (p->flags & SWP_CONTINUED) free_swap_count_continuations(p); |
fc0abb145
|
1856 |
mutex_lock(&swapon_mutex); |
5d337b919
|
1857 |
spin_lock(&swap_lock); |
ec8acf20a
|
1858 |
spin_lock(&p->lock); |
5d337b919
|
1859 |
drain_mmlist(); |
52b7efdbe
|
1860 |
/* wait for anyone still in scan_swap_map */ |
52b7efdbe
|
1861 1862 |
p->highest_bit = 0; /* cuts scans short */ while (p->flags >= SWP_SCANNING) { |
ec8acf20a
|
1863 |
spin_unlock(&p->lock); |
5d337b919
|
1864 |
spin_unlock(&swap_lock); |
13e4b57f6
|
1865 |
schedule_timeout_uninterruptible(1); |
5d337b919
|
1866 |
spin_lock(&swap_lock); |
ec8acf20a
|
1867 |
spin_lock(&p->lock); |
52b7efdbe
|
1868 |
} |
52b7efdbe
|
1869 |
|
1da177e4c
|
1870 |
swap_file = p->swap_file; |
5b808a230
|
1871 |
old_block_size = p->old_block_size; |
1da177e4c
|
1872 1873 1874 1875 |
p->swap_file = NULL; p->max = 0; swap_map = p->swap_map; p->swap_map = NULL; |
2a8f94493
|
1876 1877 |
cluster_info = p->cluster_info; p->cluster_info = NULL; |
4f89849da
|
1878 |
frontswap_map = frontswap_map_get(p); |
ec8acf20a
|
1879 |
spin_unlock(&p->lock); |
5d337b919
|
1880 |
spin_unlock(&swap_lock); |
4f89849da
|
1881 |
frontswap_invalidate_area(type); |
58e97ba6b
|
1882 |
frontswap_map_set(p, NULL); |
fc0abb145
|
1883 |
mutex_unlock(&swapon_mutex); |
ebc2a1a69
|
1884 1885 |
free_percpu(p->percpu_cluster); p->percpu_cluster = NULL; |
1da177e4c
|
1886 |
vfree(swap_map); |
2a8f94493
|
1887 |
vfree(cluster_info); |
4f89849da
|
1888 |
vfree(frontswap_map); |
2de1a7e40
|
1889 |
/* Destroy swap account information */ |
27a7faa07
|
1890 |
swap_cgroup_swapoff(type); |
1da177e4c
|
1891 1892 1893 |
inode = mapping->host; if (S_ISBLK(inode->i_mode)) { struct block_device *bdev = I_BDEV(inode); |
5b808a230
|
1894 |
set_blocksize(bdev, old_block_size); |
e525fd89d
|
1895 |
blkdev_put(bdev, FMODE_READ | FMODE_WRITE | FMODE_EXCL); |
1da177e4c
|
1896 |
} else { |
1b1dcc1b5
|
1897 |
mutex_lock(&inode->i_mutex); |
1da177e4c
|
1898 |
inode->i_flags &= ~S_SWAPFILE; |
1b1dcc1b5
|
1899 |
mutex_unlock(&inode->i_mutex); |
1da177e4c
|
1900 1901 |
} filp_close(swap_file, NULL); |
f893ab41e
|
1902 1903 1904 1905 1906 1907 1908 1909 1910 |
/* * Clear the SWP_USED flag after all resources are freed so that swapon * can reuse this swap_info in alloc_swap_info() safely. It is ok to * not hold p->lock after we cleared its SWP_WRITEOK. */ spin_lock(&swap_lock); p->flags = 0; spin_unlock(&swap_lock); |
1da177e4c
|
1911 |
err = 0; |
66d7dd518
|
1912 1913 |
atomic_inc(&proc_poll_event); wake_up_interruptible(&proc_poll_wait); |
1da177e4c
|
1914 1915 1916 1917 |
out_dput: filp_close(victim, NULL); out: |
f58b59c1d
|
1918 |
putname(pathname); |
1da177e4c
|
1919 1920 1921 1922 |
return err; } #ifdef CONFIG_PROC_FS |
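sys_swapoff() above, like sys_swapon() further down, is reached from user space through thin glibc wrappers. A minimal sketch of driving both; the device path is hypothetical, and this needs CAP_SYS_ADMIN plus an already mkswap'ed target:

#include <stdio.h>
#include <sys/swap.h>

int main(void)
{
	const char *path = "/dev/sdb2";	/* hypothetical swap partition */

	/* ask for priority 10 via the PREFER flag, then remove it again */
	if (swapon(path, SWAP_FLAG_PREFER | (10 << SWAP_FLAG_PRIO_SHIFT)))
		perror("swapon");
	else if (swapoff(path))
		perror("swapoff");
	return 0;
}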
66d7dd518
|
1923 1924 |
static unsigned swaps_poll(struct file *file, poll_table *wait) { |
f15146380
|
1925 |
struct seq_file *seq = file->private_data; |
66d7dd518
|
1926 1927 |
poll_wait(file, &proc_poll_wait, wait); |
f15146380
|
1928 1929 |
if (seq->poll_event != atomic_read(&proc_poll_event)) { seq->poll_event = atomic_read(&proc_poll_event); |
66d7dd518
|
1930 1931 1932 1933 1934 |
return POLLIN | POLLRDNORM | POLLERR | POLLPRI; } return POLLIN | POLLRDNORM; } |
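From user space, swaps_poll() is what lets a monitor block until the swap configuration changes rather than re-reading /proc/swaps in a loop. A minimal consumer might look like this sketch; the POLLERR | POLLPRI bits are the ones swaps_poll() raises once proc_poll_event has advanced:

#include <fcntl.h>
#include <poll.h>
#include <stdio.h>
#include <unistd.h>

int main(void)
{
	int fd = open("/proc/swaps", O_RDONLY);

	if (fd < 0) {
		perror("open");
		return 1;
	}
	struct pollfd pfd = { .fd = fd, .events = POLLERR | POLLPRI };
	if (poll(&pfd, 1, -1) == 1 && (pfd.revents & (POLLERR | POLLPRI)))
		printf("swap configuration changed\n");
	close(fd);
	return 0;
}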
1da177e4c
|
1935 1936 1937 |
/* iterator */ static void *swap_start(struct seq_file *swap, loff_t *pos) { |
efa90a981
|
1938 1939 |
struct swap_info_struct *si; int type; |
1da177e4c
|
1940 |
loff_t l = *pos; |
fc0abb145
|
1941 |
mutex_lock(&swapon_mutex); |
1da177e4c
|
1942 |
|
881e4aabe
|
1943 1944 |
if (!l) return SEQ_START_TOKEN; |
efa90a981
|
1945 1946 1947 1948 |
for (type = 0; type < nr_swapfiles; type++) { smp_rmb(); /* read nr_swapfiles before swap_info[type] */ si = swap_info[type]; if (!(si->flags & SWP_USED) || !si->swap_map) |
1da177e4c
|
1949 |
continue; |
881e4aabe
|
1950 |
if (!--l) |
efa90a981
|
1951 |
return si; |
1da177e4c
|
1952 1953 1954 1955 1956 1957 1958 |
} return NULL; } static void *swap_next(struct seq_file *swap, void *v, loff_t *pos) { |
efa90a981
|
1959 1960 |
struct swap_info_struct *si = v; int type; |
1da177e4c
|
1961 |
|
881e4aabe
|
1962 |
if (v == SEQ_START_TOKEN) |
efa90a981
|
1963 1964 1965 |
type = 0; else type = si->type + 1; |
881e4aabe
|
1966 |
|
efa90a981
|
1967 1968 1969 1970 |
for (; type < nr_swapfiles; type++) { smp_rmb(); /* read nr_swapfiles before swap_info[type] */ si = swap_info[type]; if (!(si->flags & SWP_USED) || !si->swap_map) |
1da177e4c
|
1971 1972 |
continue; ++*pos; |
efa90a981
|
1973 |
return si; |
1da177e4c
|
1974 1975 1976 1977 1978 1979 1980 |
} return NULL; } static void swap_stop(struct seq_file *swap, void *v) { |
fc0abb145
|
1981 |
mutex_unlock(&swapon_mutex); |
1da177e4c
|
1982 1983 1984 1985 |
} static int swap_show(struct seq_file *swap, void *v) { |
efa90a981
|
1986 |
struct swap_info_struct *si = v; |
1da177e4c
|
1987 1988 |
struct file *file; int len; |
efa90a981
|
1989 |
if (si == SEQ_START_TOKEN) { |
881e4aabe
|
1990 1991 1992 1993 |
seq_puts(swap,"Filename\t\t\t\tType\t\tSize\tUsed\tPriority "); return 0; } |
1da177e4c
|
1994 |
|
efa90a981
|
1995 |
file = si->swap_file; |
c32c2f63a
|
1996 1997 |
len = seq_path(swap, &file->f_path, " \t\n\\"); |
6eb396dc4
|
1998 1999 |
seq_printf(swap, "%*s%s\t%u\t%u\t%d ", |
886bb7e9c
|
2000 |
len < 40 ? 40 - len : 1, " ", |
496ad9aa8
|
2001 |
S_ISBLK(file_inode(file)->i_mode) ? |
1da177e4c
|
2002 |
"partition" : "file\t", |
efa90a981
|
2003 2004 2005 |
si->pages << (PAGE_SHIFT - 10), si->inuse_pages << (PAGE_SHIFT - 10), si->prio); |
1da177e4c
|
2006 2007 |
return 0; } |
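For reference, the seq_file handlers above render one row per active swap area. Illustrative output only; the paths, sizes and priorities below are made up:

Filename                                Type            Size    Used    Priority
/dev/sda2                               partition       4194300 12288   -1
/swapfile                               file            1048572 0       -2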
15ad7cdcf
|
2008 |
static const struct seq_operations swaps_op = { |
1da177e4c
|
2009 2010 2011 2012 2013 2014 2015 2016 |
.start = swap_start, .next = swap_next, .stop = swap_stop, .show = swap_show }; static int swaps_open(struct inode *inode, struct file *file) { |
f15146380
|
2017 |
struct seq_file *seq; |
66d7dd518
|
2018 |
int ret; |
66d7dd518
|
2019 |
ret = seq_open(file, &swaps_op); |
f15146380
|
2020 |
if (ret) |
66d7dd518
|
2021 |
return ret; |
66d7dd518
|
2022 |
|
f15146380
|
2023 2024 2025 |
seq = file->private_data; seq->poll_event = atomic_read(&proc_poll_event); return 0; |
1da177e4c
|
2026 |
} |
15ad7cdcf
|
2027 |
static const struct file_operations proc_swaps_operations = { |
1da177e4c
|
2028 2029 2030 2031 |
.open = swaps_open, .read = seq_read, .llseek = seq_lseek, .release = seq_release, |
66d7dd518
|
2032 |
.poll = swaps_poll, |
1da177e4c
|
2033 2034 2035 2036 |
}; static int __init procswaps_init(void) { |
3d71f86f4
|
2037 |
proc_create("swaps", 0, NULL, &proc_swaps_operations); |
1da177e4c
|
2038 2039 2040 2041 |
return 0; } __initcall(procswaps_init); #endif /* CONFIG_PROC_FS */ |
1796316a8
|
2042 2043 2044 2045 2046 2047 2048 2049 |
#ifdef MAX_SWAPFILES_CHECK static int __init max_swapfiles_check(void) { MAX_SWAPFILES_CHECK(); return 0; } late_initcall(max_swapfiles_check); #endif |
53cbb2435
|
2050 |
static struct swap_info_struct *alloc_swap_info(void) |
1da177e4c
|
2051 |
{ |
73c34b6ac
|
2052 |
struct swap_info_struct *p; |
1da177e4c
|
2053 |
unsigned int type; |
efa90a981
|
2054 2055 2056 |
p = kzalloc(sizeof(*p), GFP_KERNEL); if (!p) |
53cbb2435
|
2057 |
return ERR_PTR(-ENOMEM); |
efa90a981
|
2058 |
|
5d337b919
|
2059 |
spin_lock(&swap_lock); |
efa90a981
|
2060 2061 |
for (type = 0; type < nr_swapfiles; type++) { if (!(swap_info[type]->flags & SWP_USED)) |
1da177e4c
|
2062 |
break; |
efa90a981
|
2063 |
} |
0697212a4
|
2064 |
if (type >= MAX_SWAPFILES) { |
5d337b919
|
2065 |
spin_unlock(&swap_lock); |
efa90a981
|
2066 |
kfree(p); |
730c0581c
|
2067 |
return ERR_PTR(-EPERM); |
1da177e4c
|
2068 |
} |
efa90a981
|
2069 2070 2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084 2085 2086 |
if (type >= nr_swapfiles) { p->type = type; swap_info[type] = p; /* * Write swap_info[type] before nr_swapfiles, in case a * racing procfs swap_start() or swap_next() is reading them. * (We never shrink nr_swapfiles, we never free this entry.) */ smp_wmb(); nr_swapfiles++; } else { kfree(p); p = swap_info[type]; /* * Do not memset this entry: a racing procfs swap_next() * would be relying on p->type to remain valid. */ } |
9625a5f28
|
2087 |
INIT_LIST_HEAD(&p->first_swap_extent.list); |
1da177e4c
|
2088 |
p->flags = SWP_USED; |
1da177e4c
|
2089 |
p->next = -1; |
5d337b919
|
2090 |
spin_unlock(&swap_lock); |
ec8acf20a
|
2091 |
spin_lock_init(&p->lock); |
efa90a981
|
2092 |
|
53cbb2435
|
2093 |
return p; |
53cbb2435
|
2094 |
} |
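The smp_wmb() in alloc_swap_info() pairs with the smp_rmb() in swap_start() and swap_next(): the freshly written swap_info[type] pointer has to become visible before the incremented nr_swapfiles does. The same publish pattern can be modelled in user space with C11 release/acquire in place of the kernel barriers; a single-threaded sketch, just to show the ordering discipline:

#include <stdatomic.h>
#include <stdio.h>

#define MAX_SLOTS 8
static int slots[MAX_SLOTS];
static atomic_int nr_slots;		/* plays the role of nr_swapfiles */

static void publish(int value)		/* writer side, cf. alloc_swap_info() */
{
	int n = atomic_load_explicit(&nr_slots, memory_order_relaxed);

	slots[n] = value;		/* write the entry first ... */
	atomic_store_explicit(&nr_slots, n + 1,
			      memory_order_release);	/* ... then the count */
}

static void scan(void)			/* reader side, cf. swap_start() */
{
	int n = atomic_load_explicit(&nr_slots, memory_order_acquire);

	for (int i = 0; i < n; i++)	/* entries 0..n-1 are fully visible */
		printf("slot %d = %d\n", i, slots[i]);
}

int main(void)
{
	publish(42);
	publish(7);
	scan();
	return 0;
}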
4d0e1e107
|
2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105 |
static int claim_swapfile(struct swap_info_struct *p, struct inode *inode) { int error; if (S_ISBLK(inode->i_mode)) { p->bdev = bdgrab(I_BDEV(inode)); error = blkdev_get(p->bdev, FMODE_READ | FMODE_WRITE | FMODE_EXCL, sys_swapon); if (error < 0) { p->bdev = NULL; |
87ade72a7
|
2106 |
return -EINVAL; |
4d0e1e107
|
2107 2108 2109 2110 |
} p->old_block_size = block_size(p->bdev); error = set_blocksize(p->bdev, PAGE_SIZE); if (error < 0) |
87ade72a7
|
2111 |
return error; |
4d0e1e107
|
2112 2113 2114 2115 |
p->flags |= SWP_BLKDEV; } else if (S_ISREG(inode->i_mode)) { p->bdev = inode->i_sb->s_bdev; mutex_lock(&inode->i_mutex); |
87ade72a7
|
2116 2117 2118 2119 |
if (IS_SWAPFILE(inode)) return -EBUSY; } else return -EINVAL; |
4d0e1e107
|
2120 2121 |
return 0; |
4d0e1e107
|
2122 |
} |
ca8bd38bf
|
2123 2124 2125 2126 2127 2128 2129 |
static unsigned long read_swap_header(struct swap_info_struct *p, union swap_header *swap_header, struct inode *inode) { int i; unsigned long maxpages; unsigned long swapfilepages; |
d6bbbd29b
|
2130 |
unsigned long last_page; |
ca8bd38bf
|
2131 2132 |
if (memcmp("SWAPSPACE2", swap_header->magic.magic, 10)) { |
465c47fd8
|
2133 2134 |
pr_err("Unable to find swap-space signature "); |
387190253
|
2135 |
return 0; |
ca8bd38bf
|
2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 |
} /* swap partition endianness hack... */ if (swab32(swap_header->info.version) == 1) { swab32s(&swap_header->info.version); swab32s(&swap_header->info.last_page); swab32s(&swap_header->info.nr_badpages); for (i = 0; i < swap_header->info.nr_badpages; i++) swab32s(&swap_header->info.badpages[i]); } /* Check the swap header's sub-version */ if (swap_header->info.version != 1) { |
465c47fd8
|
2148 2149 2150 |
pr_warn("Unable to handle swap header version %d ", swap_header->info.version); |
387190253
|
2151 |
return 0; |
ca8bd38bf
|
2152 2153 2154 2155 2156 2157 2158 2159 |
} p->lowest_bit = 1; p->cluster_next = 1; p->cluster_nr = 0; /* * Find out how many pages are allowed for a single swap |
9b15b817f
|
2160 |
* device. There are two limiting factors: 1) the number |
a2c16d6cb
|
2161 2162 |
* of bits for the swap offset in the swp_entry_t type, and * 2) the number of bits in the swap pte as defined by the |
9b15b817f
|
2163 |
* different architectures. In order to find the |
a2c16d6cb
|
2164 |
* largest possible bit mask, a swap entry with swap type 0 |
ca8bd38bf
|
2165 |
* and swap offset ~0UL is created, encoded to a swap pte, |
a2c16d6cb
|
2166 |
* decoded to a swp_entry_t again, and finally the swap |
ca8bd38bf
|
2167 2168 2169 |
* offset is extracted. This will mask all the bits from * the initial ~0UL mask that can't be encoded in either * the swp_entry_t or the architecture definition of a |
9b15b817f
|
2170 |
* swap pte. |
ca8bd38bf
|
2171 2172 |
*/ maxpages = swp_offset(pte_to_swp_entry( |
9b15b817f
|
2173 |
swp_entry_to_pte(swp_entry(0, ~0UL)))) + 1; |
d6bbbd29b
|
2174 2175 |
last_page = swap_header->info.last_page; if (last_page > maxpages) { |
465c47fd8
|
2176 2177 |
pr_warn("Truncating oversized swap area, only using %luk out of %luk ", |
d6bbbd29b
|
2178 2179 2180 2181 2182 |
maxpages << (PAGE_SHIFT - 10), last_page << (PAGE_SHIFT - 10)); } if (maxpages > last_page) { maxpages = last_page + 1; |
ca8bd38bf
|
2183 2184 2185 2186 2187 2188 2189 |
/* p->max is an unsigned int: don't overflow it */ if ((unsigned int)maxpages == 0) maxpages = UINT_MAX; } p->highest_bit = maxpages - 1; if (!maxpages) |
387190253
|
2190 |
return 0; |
ca8bd38bf
|
2191 2192 |
swapfilepages = i_size_read(inode) >> PAGE_SHIFT; if (swapfilepages && maxpages > swapfilepages) { |
465c47fd8
|
2193 2194 |
pr_warn("Swap area shorter than signature indicates "); |
387190253
|
2195 |
return 0; |
ca8bd38bf
|
2196 2197 |
} if (swap_header->info.nr_badpages && S_ISREG(inode->i_mode)) |
387190253
|
2198 |
return 0; |
ca8bd38bf
|
2199 |
if (swap_header->info.nr_badpages > MAX_SWAP_BADPAGES) |
387190253
|
2200 |
return 0; |
ca8bd38bf
|
2201 2202 |
return maxpages; |
ca8bd38bf
|
2203 |
} |
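The maxpages computation in read_swap_header() is a round-trip: encode the largest conceivable offset into a swap pte, decode it again, and whatever bits survive both representations define the limit. A toy model, with an invented 50-bit pte offset field standing in for the architecture-specific encoding:

#include <stdio.h>

#define PTE_OFFSET_BITS 50UL	/* hypothetical architecture limit */

static unsigned long to_pte(unsigned long offset)
{
	return offset & ((1UL << PTE_OFFSET_BITS) - 1);	/* truncates */
}

static unsigned long from_pte(unsigned long pte)
{
	return pte & ((1UL << PTE_OFFSET_BITS) - 1);
}

int main(void)
{
	/* every bit neither representation can hold is masked off ~0UL */
	unsigned long maxpages = from_pte(to_pte(~0UL)) + 1;

	printf("max offset + 1 = 0x%lx\n", maxpages);	/* 1UL << 50 */
	return 0;
}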
915d4d7bc
|
2204 2205 2206 |
static int setup_swap_map_and_extents(struct swap_info_struct *p, union swap_header *swap_header, unsigned char *swap_map, |
2a8f94493
|
2207 |
struct swap_cluster_info *cluster_info, |
915d4d7bc
|
2208 2209 2210 2211 |
unsigned long maxpages, sector_t *span) { int i; |
915d4d7bc
|
2212 2213 |
unsigned int nr_good_pages; int nr_extents; |
2a8f94493
|
2214 2215 |
unsigned long nr_clusters = DIV_ROUND_UP(maxpages, SWAPFILE_CLUSTER); unsigned long idx = p->cluster_next / SWAPFILE_CLUSTER; |
915d4d7bc
|
2216 2217 |
nr_good_pages = maxpages - 1; /* omit header page */ |
2a8f94493
|
2218 2219 |
cluster_set_null(&p->free_cluster_head); cluster_set_null(&p->free_cluster_tail); |
815c2c543
|
2220 2221 |
cluster_set_null(&p->discard_cluster_head); cluster_set_null(&p->discard_cluster_tail); |
2a8f94493
|
2222 |
|
915d4d7bc
|
2223 2224 |
for (i = 0; i < swap_header->info.nr_badpages; i++) { unsigned int page_nr = swap_header->info.badpages[i]; |
bdb8e3f68
|
2225 2226 |
if (page_nr == 0 || page_nr > swap_header->info.last_page) return -EINVAL; |
915d4d7bc
|
2227 2228 2229 |
if (page_nr < maxpages) { swap_map[page_nr] = SWAP_MAP_BAD; nr_good_pages--; |
2a8f94493
|
2230 2231 2232 2233 2234 |
/* * Haven't marked the cluster free yet, no list * operation involved */ inc_cluster_info_page(p, cluster_info, page_nr); |
915d4d7bc
|
2235 2236 |
} } |
2a8f94493
|
2237 2238 2239 |
/* Haven't marked the cluster free yet, no list operation involved */ for (i = maxpages; i < round_up(maxpages, SWAPFILE_CLUSTER); i++) inc_cluster_info_page(p, cluster_info, i); |
915d4d7bc
|
2240 2241 |
if (nr_good_pages) { swap_map[0] = SWAP_MAP_BAD; |
2a8f94493
|
2242 2243 2244 2245 2246 |
/* * Haven't marked the cluster free yet, no list * operation involved */ inc_cluster_info_page(p, cluster_info, 0); |
915d4d7bc
|
2247 2248 2249 |
p->max = maxpages; p->pages = nr_good_pages; nr_extents = setup_swap_extents(p, span); |
bdb8e3f68
|
2250 2251 |
if (nr_extents < 0) return nr_extents; |
915d4d7bc
|
2252 2253 2254 |
nr_good_pages = p->pages; } if (!nr_good_pages) { |
465c47fd8
|
2255 2256 |
pr_warn("Empty swap-file "); |
bdb8e3f68
|
2257 |
return -EINVAL; |
915d4d7bc
|
2258 |
} |
2a8f94493
|
2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 |
if (!cluster_info) return nr_extents; for (i = 0; i < nr_clusters; i++) { if (!cluster_count(&cluster_info[idx])) { cluster_set_flag(&cluster_info[idx], CLUSTER_FLAG_FREE); if (cluster_is_null(&p->free_cluster_head)) { cluster_set_next_flag(&p->free_cluster_head, idx, 0); cluster_set_next_flag(&p->free_cluster_tail, idx, 0); } else { unsigned int tail; tail = cluster_next(&p->free_cluster_tail); cluster_set_next(&cluster_info[tail], idx); cluster_set_next_flag(&p->free_cluster_tail, idx, 0); } } idx++; if (idx == nr_clusters) idx = 0; } |
915d4d7bc
|
2283 |
return nr_extents; |
915d4d7bc
|
2284 |
} |
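The free-cluster scan at the end of setup_swap_map_and_extents() chains every cluster whose usage count stayed zero into a tail-linked free list. Reduced to its essentials, with plain arrays instead of swap_cluster_info and hypothetical counts:

#include <stdio.h>

#define NR_CLUSTERS 5
static int count[NR_CLUSTERS] = { 1, 0, 0, 3, 0 };	/* 0 == wholly free */
static int next_free[NR_CLUSTERS];
static int free_head = -1, free_tail = -1;

int main(void)
{
	for (int idx = 0; idx < NR_CLUSTERS; idx++) {
		if (count[idx])
			continue;	/* cluster has bad or in-use pages */
		next_free[idx] = -1;
		if (free_head < 0) {
			free_head = free_tail = idx;
		} else {
			next_free[free_tail] = idx;	/* link at the tail */
			free_tail = idx;
		}
	}
	for (int i = free_head; i >= 0; i = next_free[i])
		printf("free cluster %d\n", i);		/* 1, 2, 4 */
	return 0;
}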
dcf6b7ddd
|
2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 |
/* * Helper to sys_swapon determining if a given swap * backing device queue supports DISCARD operations. */ static bool swap_discardable(struct swap_info_struct *si) { struct request_queue *q = bdev_get_queue(si->bdev); if (!q || !blk_queue_discard(q)) return false; return true; } |
53cbb2435
|
2298 2299 2300 |
SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags) { struct swap_info_struct *p; |
91a27b2a7
|
2301 |
struct filename *name; |
53cbb2435
|
2302 2303 |
struct file *swap_file = NULL; struct address_space *mapping; |
40531542e
|
2304 2305 |
int i; int prio; |
53cbb2435
|
2306 2307 |
int error; union swap_header *swap_header; |
915d4d7bc
|
2308 |
int nr_extents; |
53cbb2435
|
2309 2310 |
sector_t span; unsigned long maxpages; |
53cbb2435
|
2311 |
unsigned char *swap_map = NULL; |
2a8f94493
|
2312 |
struct swap_cluster_info *cluster_info = NULL; |
38b5faf4b
|
2313 |
unsigned long *frontswap_map = NULL; |
53cbb2435
|
2314 2315 |
struct page *page = NULL; struct inode *inode = NULL; |
53cbb2435
|
2316 |
|
d15cab975
|
2317 2318 |
if (swap_flags & ~SWAP_FLAGS_VALID) return -EINVAL; |
53cbb2435
|
2319 2320 2321 2322 |
if (!capable(CAP_SYS_ADMIN)) return -EPERM; p = alloc_swap_info(); |
2542e5134
|
2323 2324 |
if (IS_ERR(p)) return PTR_ERR(p); |
53cbb2435
|
2325 |
|
815c2c543
|
2326 |
INIT_WORK(&p->discard_work, swap_discard_work); |
1da177e4c
|
2327 |
name = getname(specialfile); |
1da177e4c
|
2328 |
if (IS_ERR(name)) { |
7de7fb6b3
|
2329 |
error = PTR_ERR(name); |
1da177e4c
|
2330 |
name = NULL; |
bd69010b0
|
2331 |
goto bad_swap; |
1da177e4c
|
2332 |
} |
669abf4e5
|
2333 |
swap_file = file_open_name(name, O_RDWR|O_LARGEFILE, 0); |
1da177e4c
|
2334 |
if (IS_ERR(swap_file)) { |
7de7fb6b3
|
2335 |
error = PTR_ERR(swap_file); |
1da177e4c
|
2336 |
swap_file = NULL; |
bd69010b0
|
2337 |
goto bad_swap; |
1da177e4c
|
2338 2339 2340 2341 |
} p->swap_file = swap_file; mapping = swap_file->f_mapping; |
1da177e4c
|
2342 |
|
1da177e4c
|
2343 |
for (i = 0; i < nr_swapfiles; i++) { |
efa90a981
|
2344 |
struct swap_info_struct *q = swap_info[i]; |
1da177e4c
|
2345 |
|
e8e6c2ec4
|
2346 |
if (q == p || !q->swap_file) |
1da177e4c
|
2347 |
continue; |
7de7fb6b3
|
2348 2349 |
if (mapping == q->swap_file->f_mapping) { error = -EBUSY; |
1da177e4c
|
2350 |
goto bad_swap; |
7de7fb6b3
|
2351 |
} |
1da177e4c
|
2352 |
} |
2130781e2
|
2353 2354 |
inode = mapping->host; /* If S_ISREG(inode->i_mode), claim_swapfile() will do mutex_lock(&inode->i_mutex) */ |
4d0e1e107
|
2355 2356 |
error = claim_swapfile(p, inode); if (unlikely(error)) |
1da177e4c
|
2357 |
goto bad_swap; |
1da177e4c
|
2358 |
|
1da177e4c
|
2359 2360 2361 2362 2363 2364 2365 |
/* * Read the swap header. */ if (!mapping->a_ops->readpage) { error = -EINVAL; goto bad_swap; } |
090d2b185
|
2366 |
page = read_mapping_page(mapping, 0, swap_file); |
1da177e4c
|
2367 2368 2369 2370 |
if (IS_ERR(page)) { error = PTR_ERR(page); goto bad_swap; } |
81e339712
|
2371 |
swap_header = kmap(page); |
1da177e4c
|
2372 |
|
ca8bd38bf
|
2373 2374 |
maxpages = read_swap_header(p, swap_header, inode); if (unlikely(!maxpages)) { |
1da177e4c
|
2375 2376 2377 |
error = -EINVAL; goto bad_swap; } |
886bb7e9c
|
2378 |
|
81e339712
|
2379 |
/* OK, set up the swap map and apply the bad block list */ |
803d0c835
|
2380 |
swap_map = vzalloc(maxpages); |
81e339712
|
2381 2382 2383 2384 |
if (!swap_map) { error = -ENOMEM; goto bad_swap; } |
2a8f94493
|
2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 |
if (p->bdev && blk_queue_nonrot(bdev_get_queue(p->bdev))) { p->flags |= SWP_SOLIDSTATE; /* * select a random position to start with to help wear leveling * SSD */ p->cluster_next = 1 + (prandom_u32() % p->highest_bit); cluster_info = vzalloc(DIV_ROUND_UP(maxpages, SWAPFILE_CLUSTER) * sizeof(*cluster_info)); if (!cluster_info) { error = -ENOMEM; goto bad_swap; } |
ebc2a1a69
|
2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 |
p->percpu_cluster = alloc_percpu(struct percpu_cluster); if (!p->percpu_cluster) { error = -ENOMEM; goto bad_swap; } for_each_possible_cpu(i) { struct percpu_cluster *cluster; cluster = per_cpu_ptr(p->percpu_cluster, i); cluster_set_null(&cluster->index); } |
2a8f94493
|
2409 |
} |
1da177e4c
|
2410 |
|
1421ef3cd
|
2411 2412 2413 |
error = swap_cgroup_swapon(p->type, maxpages); if (error) goto bad_swap; |
915d4d7bc
|
2414 |
nr_extents = setup_swap_map_and_extents(p, swap_header, swap_map, |
2a8f94493
|
2415 |
cluster_info, maxpages, &span); |
915d4d7bc
|
2416 2417 |
if (unlikely(nr_extents < 0)) { error = nr_extents; |
1da177e4c
|
2418 2419 |
goto bad_swap; } |
38b5faf4b
|
2420 2421 |
/* frontswap enabled? set up bit-per-page map for frontswap */ if (frontswap_enabled) |
7b57976da
|
2422 |
frontswap_map = vzalloc(BITS_TO_LONGS(maxpages) * sizeof(long)); |
1da177e4c
|
2423 |
|
2a8f94493
|
2424 2425 2426 2427 2428 2429 2430 2431 2432 |
if (p->bdev && (swap_flags & SWAP_FLAG_DISCARD) && swap_discardable(p)) { /* * When discard is enabled for swap with no particular * policy flagged, we set all swap discard flags here in * order to sustain backward compatibility with older * swapon(8) releases. */ p->flags |= (SWP_DISCARDABLE | SWP_AREA_DISCARD | SWP_PAGE_DISCARD); |
dcf6b7ddd
|
2433 |
|
2a8f94493
|
2434 2435 2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451 |
/* * By flagging sys_swapon, a sysadmin can tell us to * either do single-time area discards only, or to just * perform discards for released swap page-clusters. * Now it's time to adjust the p->flags accordingly. */ if (swap_flags & SWAP_FLAG_DISCARD_ONCE) p->flags &= ~SWP_PAGE_DISCARD; else if (swap_flags & SWAP_FLAG_DISCARD_PAGES) p->flags &= ~SWP_AREA_DISCARD; /* issue a swapon-time discard if it's still required */ if (p->flags & SWP_AREA_DISCARD) { int err = discard_swap(p); if (unlikely(err)) pr_err("swapon: discard_swap(%p): %d\n", p, err); |
dcf6b7ddd
|
2452 |
} |
20137a490
|
2453 |
} |
6a6ba8317
|
2454 |
|
fc0abb145
|
2455 |
mutex_lock(&swapon_mutex); |
40531542e
|
2456 |
prio = -1; |
78ecba081
|
2457 |
if (swap_flags & SWAP_FLAG_PREFER) |
40531542e
|
2458 |
prio = |
78ecba081
|
2459 |
(swap_flags & SWAP_FLAG_PRIO_MASK) >> SWAP_FLAG_PRIO_SHIFT; |
2a8f94493
|
2460 |
enable_swap_info(p, prio, swap_map, cluster_info, frontswap_map); |
c69dbfb84
|
2461 |
|
465c47fd8
|
2462 |
pr_info("Adding %uk swap on %s. " |
dcf6b7ddd
|
2463 2464 |
"Priority:%d extents:%d across:%lluk %s%s%s%s%s ", |
91a27b2a7
|
2465 |
p->pages<<(PAGE_SHIFT-10), name->name, p->prio, |
c69dbfb84
|
2466 2467 |
nr_extents, (unsigned long long)span<<(PAGE_SHIFT-10), (p->flags & SWP_SOLIDSTATE) ? "SS" : "", |
38b5faf4b
|
2468 |
(p->flags & SWP_DISCARDABLE) ? "D" : "", |
dcf6b7ddd
|
2469 2470 |
(p->flags & SWP_AREA_DISCARD) ? "s" : "", (p->flags & SWP_PAGE_DISCARD) ? "c" : "", |
38b5faf4b
|
2471 |
(frontswap_map) ? "FS" : ""); |
c69dbfb84
|
2472 |
|
fc0abb145
|
2473 |
mutex_unlock(&swapon_mutex); |
66d7dd518
|
2474 2475 |
atomic_inc(&proc_poll_event); wake_up_interruptible(&proc_poll_wait); |
9b01c350a
|
2476 2477 |
if (S_ISREG(inode->i_mode)) inode->i_flags |= S_SWAPFILE; |
1da177e4c
|
2478 2479 2480 |
error = 0; goto out; bad_swap: |
ebc2a1a69
|
2481 2482 |
free_percpu(p->percpu_cluster); p->percpu_cluster = NULL; |
bd69010b0
|
2483 |
if (inode && S_ISBLK(inode->i_mode) && p->bdev) { |
f2090d2df
|
2484 2485 |
set_blocksize(p->bdev, p->old_block_size); blkdev_put(p->bdev, FMODE_READ | FMODE_WRITE | FMODE_EXCL); |
1da177e4c
|
2486 |
} |
4cd3bb10f
|
2487 |
destroy_swap_extents(p); |
e8e6c2ec4
|
2488 |
swap_cgroup_swapoff(p->type); |
5d337b919
|
2489 |
spin_lock(&swap_lock); |
1da177e4c
|
2490 |
p->swap_file = NULL; |
1da177e4c
|
2491 |
p->flags = 0; |
5d337b919
|
2492 |
spin_unlock(&swap_lock); |
1da177e4c
|
2493 |
vfree(swap_map); |
2a8f94493
|
2494 |
vfree(cluster_info); |
52c50567d
|
2495 |
if (swap_file) { |
2130781e2
|
2496 |
if (inode && S_ISREG(inode->i_mode)) { |
52c50567d
|
2497 |
mutex_unlock(&inode->i_mutex); |
2130781e2
|
2498 2499 |
inode = NULL; } |
1da177e4c
|
2500 |
filp_close(swap_file, NULL); |
52c50567d
|
2501 |
} |
1da177e4c
|
2502 2503 2504 2505 2506 2507 2508 |
out: if (page && !IS_ERR(page)) { kunmap(page); page_cache_release(page); } if (name) putname(name); |
9b01c350a
|
2509 |
if (inode && S_ISREG(inode->i_mode)) |
1b1dcc1b5
|
2510 |
mutex_unlock(&inode->i_mutex); |
1da177e4c
|
2511 2512 2513 2514 2515 |
return error; } void si_swapinfo(struct sysinfo *val) { |
efa90a981
|
2516 |
unsigned int type; |
1da177e4c
|
2517 |
unsigned long nr_to_be_unused = 0; |
5d337b919
|
2518 |
spin_lock(&swap_lock); |
efa90a981
|
2519 2520 2521 2522 2523 |
for (type = 0; type < nr_swapfiles; type++) { struct swap_info_struct *si = swap_info[type]; if ((si->flags & SWP_USED) && !(si->flags & SWP_WRITEOK)) nr_to_be_unused += si->inuse_pages; |
1da177e4c
|
2524 |
} |
ec8acf20a
|
2525 |
val->freeswap = atomic_long_read(&nr_swap_pages) + nr_to_be_unused; |
1da177e4c
|
2526 |
val->totalswap = total_swap_pages + nr_to_be_unused; |
5d337b919
|
2527 |
spin_unlock(&swap_lock); |
1da177e4c
|
2528 2529 2530 2531 2532 |
} /* * Verify that a swap entry is valid and increment its swap map count. * |
355cfa73d
|
2533 2534 2535 2536 2537 2538 |
* Returns an error code in the following cases: * - success -> 0 * - swp_entry is invalid -> EINVAL * - swp_entry is a migration entry -> EINVAL * - a swap-cache reference is requested but there is already one -> EEXIST * - a swap-cache reference is requested but the entry is not used -> ENOENT |
570a335b8
|
2539 |
* - swap-mapped reference requested but needs continued swap count. -> ENOMEM |
1da177e4c
|
2540 |
*/ |
8d69aaee8
|
2541 |
static int __swap_duplicate(swp_entry_t entry, unsigned char usage) |
1da177e4c
|
2542 |
{ |
73c34b6ac
|
2543 |
struct swap_info_struct *p; |
1da177e4c
|
2544 |
unsigned long offset, type; |
8d69aaee8
|
2545 2546 |
unsigned char count; unsigned char has_cache; |
253d553ba
|
2547 |
int err = -EINVAL; |
1da177e4c
|
2548 |
|
a7420aa54
|
2549 |
if (non_swap_entry(entry)) |
253d553ba
|
2550 |
goto out; |
0697212a4
|
2551 |
|
1da177e4c
|
2552 2553 2554 |
type = swp_type(entry); if (type >= nr_swapfiles) goto bad_file; |
efa90a981
|
2555 |
p = swap_info[type]; |
1da177e4c
|
2556 |
offset = swp_offset(entry); |
ec8acf20a
|
2557 |
spin_lock(&p->lock); |
355cfa73d
|
2558 2559 |
if (unlikely(offset >= p->max)) goto unlock_out; |
253d553ba
|
2560 |
count = p->swap_map[offset]; |
edfe23dac
|
2561 2562 2563 2564 2565 2566 2567 2568 2569 |
/* * swapin_readahead() doesn't check if a swap entry is valid, so the * swap entry could be SWAP_MAP_BAD. Check here with lock held. */ if (unlikely(swap_count(count) == SWAP_MAP_BAD)) { err = -ENOENT; goto unlock_out; } |
253d553ba
|
2570 2571 2572 |
has_cache = count & SWAP_HAS_CACHE; count &= ~SWAP_HAS_CACHE; err = 0; |
355cfa73d
|
2573 |
|
253d553ba
|
2574 |
if (usage == SWAP_HAS_CACHE) { |
355cfa73d
|
2575 2576 |
/* set SWAP_HAS_CACHE if there is no cache and entry is used */ |
253d553ba
|
2577 2578 2579 2580 2581 2582 |
if (!has_cache && count) has_cache = SWAP_HAS_CACHE; else if (has_cache) /* someone else added cache */ err = -EEXIST; else /* no users remaining */ err = -ENOENT; |
355cfa73d
|
2583 2584 |
} else if (count || has_cache) { |
253d553ba
|
2585 |
|
570a335b8
|
2586 2587 2588 |
if ((count & ~COUNT_CONTINUED) < SWAP_MAP_MAX) count += usage; else if ((count & ~COUNT_CONTINUED) > SWAP_MAP_MAX) |
253d553ba
|
2589 |
err = -EINVAL; |
570a335b8
|
2590 2591 2592 2593 |
else if (swap_count_continued(p, offset, count)) count = COUNT_CONTINUED; else err = -ENOMEM; |
355cfa73d
|
2594 |
} else |
253d553ba
|
2595 2596 2597 |
err = -ENOENT; /* unused swap entry */ p->swap_map[offset] = count | has_cache; |
355cfa73d
|
2598 |
unlock_out: |
ec8acf20a
|
2599 |
spin_unlock(&p->lock); |
1da177e4c
|
2600 |
out: |
253d553ba
|
2601 |
return err; |
1da177e4c
|
2602 2603 |
bad_file: |
465c47fd8
|
2604 2605 |
pr_err("swap_dup: %s%08lx ", Bad_file, entry.val); |
1da177e4c
|
2606 2607 |
goto out; } |
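__swap_duplicate() above edits a single swap_map byte that packs the map count and the swap-cache flag together. A small stand-alone illustration of that layout; the SWAP_HAS_CACHE value mirrors the kernel header but is restated here so the snippet compiles on its own:

#include <stdio.h>

#define SWAP_HAS_CACHE	0x40	/* entry also has a swap-cache reference */

int main(void)
{
	unsigned char ent = 2 | SWAP_HAS_CACHE;	/* two pte users + cache */
	unsigned int count = ent & 0xffu & ~SWAP_HAS_CACHE;

	printf("count = %u, cached = %s\n", count,
	       (ent & SWAP_HAS_CACHE) ? "yes" : "no");
	return 0;
}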
253d553ba
|
2608 |
|
355cfa73d
|
2609 |
/* |
aaa468653
|
2610 2611 2612 2613 2614 2615 2616 2617 2618 |
* Help swapoff by noting that swap entry belongs to shmem/tmpfs * (in which case its reference count is never incremented). */ void swap_shmem_alloc(swp_entry_t entry) { __swap_duplicate(entry, SWAP_MAP_SHMEM); } /* |
08259d58e
|
2619 2620 2621 2622 2623 |
* Increase reference count of swap entry by 1. * Returns 0 for success, or -ENOMEM if a swap_count_continuation is required * but could not be atomically allocated. Returns 0, just as if it succeeded, * if __swap_duplicate() fails for another reason (-EINVAL or -ENOENT), which * might occur if a page table entry has got corrupted. |
355cfa73d
|
2624 |
*/ |
570a335b8
|
2625 |
int swap_duplicate(swp_entry_t entry) |
355cfa73d
|
2626 |
{ |
570a335b8
|
2627 2628 2629 2630 2631 |
int err = 0; while (!err && __swap_duplicate(entry, 1) == -ENOMEM) err = add_swap_count_continuation(entry, GFP_ATOMIC); return err; |
355cfa73d
|
2632 |
} |
1da177e4c
|
2633 |
|
cb4b86ba4
|
2634 |
/* |
355cfa73d
|
2635 2636 |
* @entry: swap entry for which we allocate swap cache. * |
73c34b6ac
|
2637 |
* Called when allocating swap cache for an existing swap entry. |
355cfa73d
|
2638 2639 2640 |
* This can return error codes. Returns 0 on success. * -EBUSY means there is already a swap cache. * Note: the return code differs from swap_duplicate(). |
cb4b86ba4
|
2641 2642 2643 |
*/ int swapcache_prepare(swp_entry_t entry) { |
253d553ba
|
2644 |
return __swap_duplicate(entry, SWAP_HAS_CACHE); |
cb4b86ba4
|
2645 |
} |
f981c5950
|
2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 |
struct swap_info_struct *page_swap_info(struct page *page) { swp_entry_t swap = { .val = page_private(page) }; BUG_ON(!PageSwapCache(page)); return swap_info[swp_type(swap)]; } /* * out-of-line __page_file_ methods to avoid include hell. */ struct address_space *__page_file_mapping(struct page *page) { |
309381fea
|
2658 |
VM_BUG_ON_PAGE(!PageSwapCache(page), page); |
f981c5950
|
2659 2660 2661 2662 2663 2664 2665 |
return page_swap_info(page)->swap_file->f_mapping; } EXPORT_SYMBOL_GPL(__page_file_mapping); pgoff_t __page_file_index(struct page *page) { swp_entry_t swap = { .val = page_private(page) }; |
309381fea
|
2666 |
VM_BUG_ON_PAGE(!PageSwapCache(page), page); |
f981c5950
|
2667 2668 2669 |
return swp_offset(swap); } EXPORT_SYMBOL_GPL(__page_file_index); |
1da177e4c
|
2670 |
/* |
570a335b8
|
2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698 2699 2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718 2719 2720 2721 2722 |
* add_swap_count_continuation - called when a swap count is duplicated * beyond SWAP_MAP_MAX, it allocates a new page and links that to the entry's * page of the original vmalloc'ed swap_map, to hold the continuation count * (for that entry and for its neighbouring PAGE_SIZE swap entries). Called * again when count is duplicated beyond SWAP_MAP_MAX * SWAP_CONT_MAX, etc. * * These continuation pages are seldom referenced: the common paths all work * on the original swap_map, only referring to a continuation page when the * low "digit" of a count is incremented or decremented through SWAP_MAP_MAX. * * add_swap_count_continuation(, GFP_ATOMIC) can be called while holding * page table locks; if it fails, add_swap_count_continuation(, GFP_KERNEL) * can be called after dropping locks. */ int add_swap_count_continuation(swp_entry_t entry, gfp_t gfp_mask) { struct swap_info_struct *si; struct page *head; struct page *page; struct page *list_page; pgoff_t offset; unsigned char count; /* * When debugging, it's easier to use __GFP_ZERO here; but it's better * for latency not to zero a page while GFP_ATOMIC and holding locks. */ page = alloc_page(gfp_mask | __GFP_HIGHMEM); si = swap_info_get(entry); if (!si) { /* * An acceptable race has occurred since the failing * __swap_duplicate(): the swap entry has been freed, * perhaps even the whole swap_map cleared for swapoff. */ goto outer; } offset = swp_offset(entry); count = si->swap_map[offset] & ~SWAP_HAS_CACHE; if ((count & ~COUNT_CONTINUED) != SWAP_MAP_MAX) { /* * The higher the swap count, the more likely it is that tasks * will race to add swap count continuation: we need to avoid * over-provisioning. */ goto out; } if (!page) { |
ec8acf20a
|
2723 |
spin_unlock(&si->lock); |
570a335b8
|
2724 2725 2726 2727 2728 |
return -ENOMEM; } /* * We are fortunate that although vmalloc_to_page uses pte_offset_map, |
2de1a7e40
|
2729 2730 |
* no architecture is using highmem pages for kernel page tables: so it * will not corrupt the GFP_ATOMIC caller's atomic page table kmaps. |
570a335b8
|
2731 2732 2733 2734 2735 2736 2737 2738 2739 2740 2741 2742 2743 2744 2745 2746 2747 2748 2749 2750 2751 2752 2753 2754 |
*/ head = vmalloc_to_page(si->swap_map + offset); offset &= ~PAGE_MASK; /* * Page allocation does not initialize the page's lru field, * but it does always reset its private field. */ if (!page_private(head)) { BUG_ON(count & COUNT_CONTINUED); INIT_LIST_HEAD(&head->lru); set_page_private(head, SWP_CONTINUED); si->flags |= SWP_CONTINUED; } list_for_each_entry(list_page, &head->lru, lru) { unsigned char *map; /* * If the previous map said no continuation, but we've found * a continuation page, free our allocation and use this one. */ if (!(count & COUNT_CONTINUED)) goto out; |
9b04c5fec
|
2755 |
map = kmap_atomic(list_page) + offset; |
570a335b8
|
2756 |
count = *map; |
9b04c5fec
|
2757 |
kunmap_atomic(map); |
570a335b8
|
2758 2759 2760 2761 2762 2763 2764 2765 2766 2767 2768 2769 |
/* * If this continuation count now has some space in it, * free our allocation and use this one. */ if ((count & ~COUNT_CONTINUED) != SWAP_CONT_MAX) goto out; } list_add_tail(&page->lru, &head->lru); page = NULL; /* now it's attached, don't free it */ out: |
ec8acf20a
|
2770 |
spin_unlock(&si->lock); |
570a335b8
|
2771 2772 2773 2774 2775 2776 2777 2778 2779 2780 2781 2782 2783 2784 2785 2786 2787 2788 2789 2790 2791 2792 2793 2794 2795 2796 2797 2798 2799 |
outer: if (page) __free_page(page); return 0; } /* * swap_count_continued - when the original swap_map count is incremented * from SWAP_MAP_MAX, check if there is already a continuation page to carry * into, carry if so, or else fail until a new continuation page is allocated; * when the original swap_map count is decremented from 0 with continuation, * borrow from the continuation and report whether it still holds more. * Called while __swap_duplicate() or swap_entry_free() holds swap_lock. */ static bool swap_count_continued(struct swap_info_struct *si, pgoff_t offset, unsigned char count) { struct page *head; struct page *page; unsigned char *map; head = vmalloc_to_page(si->swap_map + offset); if (page_private(head) != SWP_CONTINUED) { BUG_ON(count & COUNT_CONTINUED); return false; /* need to add count continuation */ } offset &= ~PAGE_MASK; page = list_entry(head->lru.next, struct page, lru); |
9b04c5fec
|
2800 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2801 2802 2803 2804 2805 2806 2807 2808 2809 |
if (count == SWAP_MAP_MAX) /* initial increment from swap_map */ goto init_map; /* jump over SWAP_CONT_MAX checks */ if (count == (SWAP_MAP_MAX | COUNT_CONTINUED)) { /* incrementing */ /* * Think of how you add 1 to 999 */ while (*map == (SWAP_CONT_MAX | COUNT_CONTINUED)) { |
9b04c5fec
|
2810 |
kunmap_atomic(map); |
570a335b8
|
2811 2812 |
page = list_entry(page->lru.next, struct page, lru); BUG_ON(page == head); |
9b04c5fec
|
2813 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2814 2815 |
} if (*map == SWAP_CONT_MAX) { |
9b04c5fec
|
2816 |
kunmap_atomic(map); |
570a335b8
|
2817 2818 2819 |
page = list_entry(page->lru.next, struct page, lru); if (page == head) return false; /* add count continuation */ |
9b04c5fec
|
2820 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2821 2822 2823 |
init_map: *map = 0; /* we didn't zero the page */ } *map += 1; |
9b04c5fec
|
2824 |
kunmap_atomic(map); |
570a335b8
|
2825 2826 |
page = list_entry(page->lru.prev, struct page, lru); while (page != head) { |
9b04c5fec
|
2827 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2828 |
*map = COUNT_CONTINUED; |
9b04c5fec
|
2829 |
kunmap_atomic(map); |
570a335b8
|
2830 2831 2832 2833 2834 2835 2836 2837 2838 2839 |
page = list_entry(page->lru.prev, struct page, lru); } return true; /* incremented */ } else { /* decrementing */ /* * Think of how you subtract 1 from 1000 */ BUG_ON(count != COUNT_CONTINUED); while (*map == COUNT_CONTINUED) { |
9b04c5fec
|
2840 |
kunmap_atomic(map); |
570a335b8
|
2841 2842 |
page = list_entry(page->lru.next, struct page, lru); BUG_ON(page == head); |
9b04c5fec
|
2843 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2844 2845 2846 2847 2848 |
} BUG_ON(*map == 0); *map -= 1; if (*map == 0) count = 0; |
9b04c5fec
|
2849 |
kunmap_atomic(map); |
570a335b8
|
2850 2851 |
page = list_entry(page->lru.prev, struct page, lru); while (page != head) { |
9b04c5fec
|
2852 |
map = kmap_atomic(page) + offset; |
570a335b8
|
2853 2854 |
*map = SWAP_CONT_MAX | count; count = COUNT_CONTINUED; |
9b04c5fec
|
2855 |
kunmap_atomic(map); |
570a335b8
|
2856 2857 2858 2859 2860 2861 2862 2863 2864 2865 2866 2867 2868 2869 2870 2871 2872 2873 2874 2875 2876 2877 2878 2879 2880 2881 2882 2883 |
page = list_entry(page->lru.prev, struct page, lru); } return count == COUNT_CONTINUED; } } /* * free_swap_count_continuations - swapoff free all the continuation pages * appended to the swap_map, after swap_map is quiesced, before vfree'ing it. */ static void free_swap_count_continuations(struct swap_info_struct *si) { pgoff_t offset; for (offset = 0; offset < si->max; offset += PAGE_SIZE) { struct page *head; head = vmalloc_to_page(si->swap_map + offset); if (page_private(head)) { struct list_head *this, *next; list_for_each_safe(this, next, &head->lru) { struct page *page; page = list_entry(this, struct page, lru); list_del(this); __free_page(page); } } } } |
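The "add 1 to 999" analogy running through swap_count_continued() is ordinary positional arithmetic: swap_map holds the least significant digit and each continuation page one digit above it, base SWAP_CONT_MAX. A toy rendition in base 3, so the carries into "continuation" digits are visible:

#include <stdio.h>

#define BASE	3	/* stands in for SWAP_CONT_MAX */
#define NDIGITS	4

static int digit[NDIGITS];	/* digit[0] ~ swap_map, rest ~ continuations */

static void increment(void)
{
	for (int i = 0; i < NDIGITS; i++) {
		if (digit[i] < BASE - 1) {
			digit[i]++;	/* room in this "page": done */
			return;
		}
		digit[i] = 0;		/* carry into the next continuation */
	}
}

int main(void)
{
	for (int n = 0; n < 11; n++)
		increment();
	printf("11 == %d%d%d (base %d, most significant digit first)\n",
	       digit[2], digit[1], digit[0], BASE);	/* prints 102 */
	return 0;
}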