Blame view

mm/highmem.c 19.7 KB
b24413180   Greg Kroah-Hartman   License cleanup: ...
1
  // SPDX-License-Identifier: GPL-2.0
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
  /*
   * High memory handling common code and variables.
   *
   * (C) 1999 Andrea Arcangeli, SuSE GmbH, andrea@suse.de
   *          Gerhard Wichert, Siemens AG, Gerhard.Wichert@pdb.siemens.de
   *
   *
   * Redesigned the x86 32-bit VM architecture to deal with
   * 64-bit physical space. With current x86 CPUs this
   * means up to 64 Gigabytes physical RAM.
   *
   * Rewrote high memory support to move the page cache into
   * high memory. Implemented permanent (schedulable) kmaps
   * based on Linus' idea.
   *
   * Copyright (C) 1999 Ingo Molnar <mingo@redhat.com>
   */
  
  #include <linux/mm.h>
b95f1b31b   Paul Gortmaker   mm: Map most file...
21
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
22
23
24
25
26
27
28
29
  #include <linux/swap.h>
  #include <linux/bio.h>
  #include <linux/pagemap.h>
  #include <linux/mempool.h>
  #include <linux/blkdev.h>
  #include <linux/init.h>
  #include <linux/hash.h>
  #include <linux/highmem.h>
eac790059   Jason Wessel   mm,kdb,kgdb: Add ...
30
  #include <linux/kgdb.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
31
  #include <asm/tlbflush.h>
186525bd6   Ingo Molnar   mm, x86/mm: Untan...
32
  #include <linux/vmalloc.h>
a8e23a291   Peter Zijlstra   mm,x86: fix kmap_...
33

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
34
35
36
37
38
39
40
41
42
  /*
   * Virtual_count is not a pure "count".
   *  0 means that it is not mapped, and has not been mapped
   *    since a TLB flush - it is usable.
   *  1 means that there are no users, but it has been mapped
   *    since the last TLB flush - so we can't use it.
   *  n means that there are (n-1) current users of it.
   */
  #ifdef CONFIG_HIGHMEM
260b23674   Al Viro   [PATCH] gfp_t: th...
43

15de36a4c   Max Filippov   mm/highmem: make ...
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
  /*
   * Architecture with aliasing data cache may define the following family of
   * helper functions in its asm/highmem.h to control cache color of virtual
   * addresses where physical memory pages are mapped by kmap.
   */
  #ifndef get_pkmap_color
  
  /*
   * Default cache colour lookup for a page that is about to be kmapped.
   *
   * This generic fallback ignores @page and reports colour 0 for every page.
   * The self-referential #define that follows marks the helper as provided,
   * so a later "#ifndef get_pkmap_color" test will see it as defined.
   */
  static inline unsigned int get_pkmap_color(struct page *page)
  {
  	const unsigned int default_color = 0;

  	return default_color;
  }
  #define get_pkmap_color get_pkmap_color
  
  /*
   * Advance the PKMAP scan cursor and return the new slot index.
   *
   * The cursor is a function-local static, so it persists between calls.
   * It is bumped by one and wrapped with LAST_PKMAP_MASK. @color is not
   * used by this default implementation.
   */
  static inline unsigned int get_next_pkmap_nr(unsigned int color)
  {
  	static unsigned int pkmap_cursor;

  	pkmap_cursor++;
  	pkmap_cursor &= LAST_PKMAP_MASK;

  	return pkmap_cursor;
  }
  
  /*
   * Report whether the scan index @pkmap_nr has wrapped around the end of
   * the PKMAP region, i.e. is back at slot 0. The caller uses a wrap as the
   * trigger for trying to flush all unused PKMAP slots. @color is not used
   * by this default implementation.
   *
   * Returns 1 on wrap-around, 0 otherwise.
   */
  static inline int no_more_pkmaps(unsigned int pkmap_nr, unsigned int color)
  {
  	return !pkmap_nr;
  }
  
  /*
   * Number of PKMAP slots available to mappings of the given colour.
   *
   * The slot search gives up and sleeps, waiting for a kunmap to release a
   * slot, once it has inspected this many entries without finding a free
   * one. This default implementation reports LAST_PKMAP for every @color.
   */
  static inline int get_pkmap_entries_count(unsigned int color)
  {
  	int nr_entries = LAST_PKMAP;

  	return nr_entries;
  }
  
  /*
   * Get head of a wait queue for PKMAP entries of the given color.
   * Wait queues for different mapping colors should be independent to avoid
   * unnecessary wakeups caused by freeing of slots of other colors.
   */
  static inline wait_queue_head_t *get_pkmap_wait_queue_head(unsigned int color)
  {
  	static DECLARE_WAIT_QUEUE_HEAD(pkmap_map_wait);
  
  	return &pkmap_map_wait;
  }
  #endif
ca79b0c21   Arun KS   mm: convert total...
103
104
  /*
   * Atomic page counter, exported for use by modules. Judging by its name
   * it holds the total number of highmem pages; none of the code visible
   * here writes to it - NOTE(review): confirm against the actual updaters.
   */
  atomic_long_t _totalhigh_pages __read_mostly;
  EXPORT_SYMBOL(_totalhigh_pages);
3e4d3af50   Peter Zijlstra   mm: stack based k...
105

9727688db   songqiang   mm/highmem.c: fix...
106
  unsigned int __nr_free_highpages(void)
c1f60a5a4   Christoph Lameter   [PATCH] reduce MA...
107
  {
33499bfe5   Joonsoo Kim   mm/highmem: make ...
108
  	struct zone *zone;
c1f60a5a4   Christoph Lameter   [PATCH] reduce MA...
109
  	unsigned int pages = 0;
33499bfe5   Joonsoo Kim   mm/highmem: make ...
110
111
112
  	for_each_populated_zone(zone) {
  		if (is_highmem(zone))
  			pages += zone_page_state(zone, NR_FREE_PAGES);
2a1e274ac   Mel Gorman   Create the ZONE_M...
113
  	}
c1f60a5a4   Christoph Lameter   [PATCH] reduce MA...
114
115
116
  
  	return pages;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
117
  static int pkmap_count[LAST_PKMAP];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
118
  static  __cacheline_aligned_in_smp DEFINE_SPINLOCK(kmap_lock);
9727688db   songqiang   mm/highmem.c: fix...
119
  pte_t *pkmap_page_table;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
120

3297e7607   Nicolas Pitre   highmem: atomic h...
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
  /*
   * kmap_lock wrappers.
   *
   * Without ARCH_NEEDS_KMAP_HIGH_GET a plain spin_lock()/spin_unlock() pair
   * is enough; the *_any() variants then only evaluate @flags so that the
   * argument stays referenced. This spares most architectures, which have
   * no use for kmap_high_get(), the cost of disabling interrupts.
   *
   * With ARCH_NEEDS_KMAP_HIGH_GET the lock is taken with interrupts
   * disabled: the _irq variants for lock_kmap()/unlock_kmap() and the
   * irqsave/irqrestore variants for the *_any() forms.
   */
  #ifndef ARCH_NEEDS_KMAP_HIGH_GET
  #define lock_kmap()             spin_lock(&kmap_lock)
  #define unlock_kmap()           spin_unlock(&kmap_lock)
  #define lock_kmap_any(flags)    \
  		do { spin_lock(&kmap_lock); (void)(flags); } while (0)
  #define unlock_kmap_any(flags)  \
  		do { spin_unlock(&kmap_lock); (void)(flags); } while (0)
  #else
  #define lock_kmap()             spin_lock_irq(&kmap_lock)
  #define unlock_kmap()           spin_unlock_irq(&kmap_lock)
  #define lock_kmap_any(flags)    spin_lock_irqsave(&kmap_lock, flags)
  #define unlock_kmap_any(flags)  spin_unlock_irqrestore(&kmap_lock, flags)
  #endif
13f876ba7   Thomas Gleixner   highmem: High imp...
139
  struct page *__kmap_to_page(void *vaddr)
5a178119b   Mel Gorman   mm: add support f...
140
141
  {
  	unsigned long addr = (unsigned long)vaddr;
498c22802   Will Deacon   mm: highmem: don'...
142
  	if (addr >= PKMAP_ADDR(0) && addr < PKMAP_ADDR(LAST_PKMAP)) {
4de22c058   Joonsoo Kim   mm, highmem: use ...
143
  		int i = PKMAP_NR(addr);
9727688db   songqiang   mm/highmem.c: fix...
144

5a178119b   Mel Gorman   mm: add support f...
145
146
147
148
149
  		return pte_page(pkmap_page_table[i]);
  	}
  
  	return virt_to_page(addr);
  }
13f876ba7   Thomas Gleixner   highmem: High imp...
150
  EXPORT_SYMBOL(__kmap_to_page);
5a178119b   Mel Gorman   mm: add support f...
151

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
152
153
154
  static void flush_all_zero_pkmaps(void)
  {
  	int i;
5843d9a4d   Nick Piggin   x86, pat: avoid h...
155
  	int need_flush = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
  
  	flush_cache_kmaps();
  
  	for (i = 0; i < LAST_PKMAP; i++) {
  		struct page *page;
  
  		/*
  		 * zero means we don't have anything to do,
  		 * >1 means that it is still in use. Only
  		 * a count of 1 means that it is free but
  		 * needs to be unmapped
  		 */
  		if (pkmap_count[i] != 1)
  			continue;
  		pkmap_count[i] = 0;
  
  		/* sanity check */
75babcace   Eric Sesterhenn   BUG_ON() Conversi...
173
  		BUG_ON(pte_none(pkmap_page_table[i]));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
174
175
176
177
178
179
180
181
182
  
  		/*
  		 * Don't need an atomic fetch-and-clear op here;
  		 * no-one has the page mapped, and cannot get at
  		 * its virtual address (and hence PTE) without first
  		 * getting the kmap_lock (which is held here).
  		 * So no dangers, even with speculative execution.
  		 */
  		page = pte_page(pkmap_page_table[i]);
eb2db439a   Joonsoo Kim   mm, highmem: get ...
183
  		pte_clear(&init_mm, PKMAP_ADDR(i), &pkmap_page_table[i]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
184
185
  
  		set_page_address(page, NULL);
5843d9a4d   Nick Piggin   x86, pat: avoid h...
186
  		need_flush = 1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
187
  	}
5843d9a4d   Nick Piggin   x86, pat: avoid h...
188
189
  	if (need_flush)
  		flush_tlb_kernel_range(PKMAP_ADDR(0), PKMAP_ADDR(LAST_PKMAP));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
190
  }
13f876ba7   Thomas Gleixner   highmem: High imp...
191
  /*
   * Locked wrapper around flush_all_zero_pkmaps(): take kmap_lock, unmap
   * all PKMAP slots that no longer have users, then drop the lock again.
   */
  void __kmap_flush_unused(void)
  {
  	lock_kmap();

  	flush_all_zero_pkmaps();

  	unlock_kmap();
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
197
198
199
200
  static inline unsigned long map_new_virtual(struct page *page)
  {
  	unsigned long vaddr;
  	int count;
15de36a4c   Max Filippov   mm/highmem: make ...
201
202
  	unsigned int last_pkmap_nr;
  	unsigned int color = get_pkmap_color(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
203
204
  
  start:
15de36a4c   Max Filippov   mm/highmem: make ...
205
  	count = get_pkmap_entries_count(color);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
206
207
  	/* Find an empty entry */
  	for (;;) {
15de36a4c   Max Filippov   mm/highmem: make ...
208
209
  		last_pkmap_nr = get_next_pkmap_nr(color);
  		if (no_more_pkmaps(last_pkmap_nr, color)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
210
  			flush_all_zero_pkmaps();
15de36a4c   Max Filippov   mm/highmem: make ...
211
  			count = get_pkmap_entries_count(color);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
212
213
214
215
216
217
218
219
220
221
222
  		}
  		if (!pkmap_count[last_pkmap_nr])
  			break;	/* Found a usable entry */
  		if (--count)
  			continue;
  
  		/*
  		 * Sleep for somebody else to unmap their entries
  		 */
  		{
  			DECLARE_WAITQUEUE(wait, current);
15de36a4c   Max Filippov   mm/highmem: make ...
223
224
  			wait_queue_head_t *pkmap_map_wait =
  				get_pkmap_wait_queue_head(color);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
225
226
  
  			__set_current_state(TASK_UNINTERRUPTIBLE);
15de36a4c   Max Filippov   mm/highmem: make ...
227
  			add_wait_queue(pkmap_map_wait, &wait);
3297e7607   Nicolas Pitre   highmem: atomic h...
228
  			unlock_kmap();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
229
  			schedule();
15de36a4c   Max Filippov   mm/highmem: make ...
230
  			remove_wait_queue(pkmap_map_wait, &wait);
3297e7607   Nicolas Pitre   highmem: atomic h...
231
  			lock_kmap();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
  
  			/* Somebody else might have mapped it while we slept */
  			if (page_address(page))
  				return (unsigned long)page_address(page);
  
  			/* Re-start */
  			goto start;
  		}
  	}
  	vaddr = PKMAP_ADDR(last_pkmap_nr);
  	set_pte_at(&init_mm, vaddr,
  		   &(pkmap_page_table[last_pkmap_nr]), mk_pte(page, kmap_prot));
  
  	pkmap_count[last_pkmap_nr] = 1;
  	set_page_address(page, (void *)vaddr);
  
  	return vaddr;
  }
77f6078aa   Randy Dunlap   mm: highmem kerne...
250
251
252
253
254
255
256
257
  /**
   * kmap_high - map a highmem page into memory
   * @page: &struct page to map
   *
   * Returns the page's virtual memory address.
   *
   * We cannot call this from interrupts, as it may block.
   */
920c7a5d0   Harvey Harrison   mm: remove fastca...
258
  void *kmap_high(struct page *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
259
260
261
262
263
264
  {
  	unsigned long vaddr;
  
  	/*
  	 * For highmem pages, we can't trust "virtual" until
  	 * after we have the lock.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
265
  	 */
3297e7607   Nicolas Pitre   highmem: atomic h...
266
  	lock_kmap();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
267
268
269
270
  	vaddr = (unsigned long)page_address(page);
  	if (!vaddr)
  		vaddr = map_new_virtual(page);
  	pkmap_count[PKMAP_NR(vaddr)]++;
75babcace   Eric Sesterhenn   BUG_ON() Conversi...
271
  	BUG_ON(pkmap_count[PKMAP_NR(vaddr)] < 2);
3297e7607   Nicolas Pitre   highmem: atomic h...
272
  	unlock_kmap();
9727688db   songqiang   mm/highmem.c: fix...
273
  	return (void *) vaddr;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
274
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
275
  EXPORT_SYMBOL(kmap_high);
3297e7607   Nicolas Pitre   highmem: atomic h...
276
277
278
279
280
281
  #ifdef ARCH_NEEDS_KMAP_HIGH_GET
  /**
   * kmap_high_get - pin a highmem page into memory
   * @page: &struct page to pin
   *
   * Takes an additional reference on the page's PKMAP slot if, and only
   * if, the page is currently mapped. No new mapping is ever created.
   *
   * Returns the page's current virtual memory address, or NULL if no
   * mapping exists. A matching call to kunmap_high() is required exactly
   * when a non-NULL address is returned.
   *
   * This can be called from any context.
   */
  void *kmap_high_get(struct page *page)
  {
  	unsigned long kva;
  	unsigned long flags;

  	lock_kmap_any(flags);

  	kva = (unsigned long)page_address(page);
  	if (kva) {
  		int *users = &pkmap_count[PKMAP_NR(kva)];

  		BUG_ON(*users < 1);
  		(*users)++;
  	}

  	unlock_kmap_any(flags);

  	return (void *) kva;
  }
  #endif
77f6078aa   Randy Dunlap   mm: highmem kerne...
301
  /**
4e9dc5df4   Li Haifeng   mm: fix kunmap_hi...
302
   * kunmap_high - unmap a highmem page into memory
77f6078aa   Randy Dunlap   mm: highmem kerne...
303
   * @page: &struct page to unmap
3297e7607   Nicolas Pitre   highmem: atomic h...
304
305
306
   *
   * If ARCH_NEEDS_KMAP_HIGH_GET is not defined then this may be called
   * only from user context.
77f6078aa   Randy Dunlap   mm: highmem kerne...
307
   */
920c7a5d0   Harvey Harrison   mm: remove fastca...
308
  void kunmap_high(struct page *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
309
310
311
  {
  	unsigned long vaddr;
  	unsigned long nr;
3297e7607   Nicolas Pitre   highmem: atomic h...
312
  	unsigned long flags;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
313
  	int need_wakeup;
15de36a4c   Max Filippov   mm/highmem: make ...
314
315
  	unsigned int color = get_pkmap_color(page);
  	wait_queue_head_t *pkmap_map_wait;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
316

3297e7607   Nicolas Pitre   highmem: atomic h...
317
  	lock_kmap_any(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
318
  	vaddr = (unsigned long)page_address(page);
75babcace   Eric Sesterhenn   BUG_ON() Conversi...
319
  	BUG_ON(!vaddr);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
  	nr = PKMAP_NR(vaddr);
  
  	/*
  	 * A count must never go down to zero
  	 * without a TLB flush!
  	 */
  	need_wakeup = 0;
  	switch (--pkmap_count[nr]) {
  	case 0:
  		BUG();
  	case 1:
  		/*
  		 * Avoid an unnecessary wake_up() function call.
  		 * The common case is pkmap_count[] == 1, but
  		 * no waiters.
  		 * The tasks queued in the wait-queue are guarded
  		 * by both the lock in the wait-queue-head and by
  		 * the kmap_lock.  As the kmap_lock is held here,
  		 * no need for the wait-queue-head's lock.  Simply
  		 * test if the queue is empty.
  		 */
15de36a4c   Max Filippov   mm/highmem: make ...
341
342
  		pkmap_map_wait = get_pkmap_wait_queue_head(color);
  		need_wakeup = waitqueue_active(pkmap_map_wait);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
343
  	}
3297e7607   Nicolas Pitre   highmem: atomic h...
344
  	unlock_kmap_any(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
345
346
347
  
  	/* do wake-up, if needed, race-free outside of the spin lock */
  	if (need_wakeup)
15de36a4c   Max Filippov   mm/highmem: make ...
348
  		wake_up(pkmap_map_wait);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
349
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
350
  EXPORT_SYMBOL(kunmap_high);
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
351
352
353
354
355
356
357
358
  
  #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  void zero_user_segments(struct page *page, unsigned start1, unsigned end1,
  		unsigned start2, unsigned end2)
  {
  	unsigned int i;
  
  	BUG_ON(end1 > page_size(page) || end2 > page_size(page));
184cee516   OGAWA Hirofumi   mm/highmem.c: fix...
359
360
361
362
  	if (start1 >= end1)
  		start1 = end1 = 0;
  	if (start2 >= end2)
  		start2 = end2 = 0;
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
363
364
  	for (i = 0; i < compound_nr(page); i++) {
  		void *kaddr = NULL;
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
365
366
367
368
369
  		if (start1 >= PAGE_SIZE) {
  			start1 -= PAGE_SIZE;
  			end1 -= PAGE_SIZE;
  		} else {
  			unsigned this_end = min_t(unsigned, end1, PAGE_SIZE);
184cee516   OGAWA Hirofumi   mm/highmem.c: fix...
370
371
  			if (end1 > start1) {
  				kaddr = kmap_atomic(page + i);
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
372
  				memset(kaddr + start1, 0, this_end - start1);
184cee516   OGAWA Hirofumi   mm/highmem.c: fix...
373
  			}
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
374
375
376
377
378
379
380
381
382
  			end1 -= this_end;
  			start1 = 0;
  		}
  
  		if (start2 >= PAGE_SIZE) {
  			start2 -= PAGE_SIZE;
  			end2 -= PAGE_SIZE;
  		} else {
  			unsigned this_end = min_t(unsigned, end2, PAGE_SIZE);
184cee516   OGAWA Hirofumi   mm/highmem.c: fix...
383
384
385
  			if (end2 > start2) {
  				if (!kaddr)
  					kaddr = kmap_atomic(page + i);
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
386
  				memset(kaddr + start2, 0, this_end - start2);
184cee516   OGAWA Hirofumi   mm/highmem.c: fix...
387
  			}
0060ef3b4   Matthew Wilcox (Oracle)   mm: support THPs ...
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
  			end2 -= this_end;
  			start2 = 0;
  		}
  
  		if (kaddr) {
  			kunmap_atomic(kaddr);
  			flush_dcache_page(page + i);
  		}
  
  		if (!end1 && !end2)
  			break;
  	}
  
  	BUG_ON((start1 | start2 | end1 | end2) != 0);
  }
  EXPORT_SYMBOL(zero_user_segments);
  #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
298fa1ad5   Thomas Gleixner   highmem: Provide ...
405
406
407
408
409
  #endif /* CONFIG_HIGHMEM */
  
  #ifdef CONFIG_KMAP_LOCAL
  
  #include <asm/kmap_size.h>
389755c25   Thomas Gleixner   highmem: Make DEB...
410
  /*
   * Step by which the per-task kmap_local index moves on push and pop.
   *
   * Normally every slot is used. With CONFIG_DEBUG_KMAP_LOCAL the stack
   * depth is doubled and only every second slot is used; the unused slots
   * in between act as guard pages.
   */
  #ifndef CONFIG_DEBUG_KMAP_LOCAL
  # define KM_INCR	1
  #else
  # define KM_INCR	2
  #endif
298fa1ad5   Thomas Gleixner   highmem: Provide ...
419
420
  static inline int kmap_local_idx_push(void)
  {
ea0eafead   Changbin Du   mm: in_irq() cleanup
421
  	WARN_ON_ONCE(in_hardirq() && !irqs_disabled());
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
422
423
424
  	current->kmap_ctrl.idx += KM_INCR;
  	BUG_ON(current->kmap_ctrl.idx >= KM_MAX_IDX);
  	return current->kmap_ctrl.idx - 1;
298fa1ad5   Thomas Gleixner   highmem: Provide ...
425
426
427
428
  }
  
  static inline int kmap_local_idx(void)
  {
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
429
  	return current->kmap_ctrl.idx - 1;
298fa1ad5   Thomas Gleixner   highmem: Provide ...
430
431
432
433
  }
  
  static inline void kmap_local_idx_pop(void)
  {
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
434
435
  	current->kmap_ctrl.idx -= KM_INCR;
  	BUG_ON(current->kmap_ctrl.idx < 0);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
436
437
438
439
440
  }
  
  /*
   * Architecture hook invoked right after a kmap_local PTE has been
   * installed. The fallback does nothing.
   */
  #ifndef arch_kmap_local_post_map
  # define arch_kmap_local_post_map(vaddr, pteval)	do { } while (0)
  #endif
3c1016b53   Thomas Gleixner   mm/highmem: Remov...
441

298fa1ad5   Thomas Gleixner   highmem: Provide ...
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
  /*
   * Architecture hook invoked immediately before a kmap_local PTE is
   * cleared. The fallback does nothing.
   */
  #ifndef arch_kmap_local_pre_unmap
  # define arch_kmap_local_pre_unmap(vaddr)		do { } while (0)
  #endif
  
  /*
   * Architecture hook invoked immediately after a kmap_local PTE has been
   * cleared. The fallback does nothing.
   */
  #ifndef arch_kmap_local_post_unmap
  # define arch_kmap_local_post_unmap(vaddr)		do { } while (0)
  #endif
  
  /*
   * Translate a per-task slot index into a fixmap index when mapping.
   * The fallback ignores @pfn and uses kmap_local_calc_idx().
   */
  #ifndef arch_kmap_local_map_idx
  #define arch_kmap_local_map_idx(idx, pfn)	kmap_local_calc_idx(idx)
  #endif
  
  /*
   * Translate a per-task slot index into a fixmap index when unmapping.
   * The fallback ignores @vaddr and uses kmap_local_calc_idx().
   */
  #ifndef arch_kmap_local_unmap_idx
  #define arch_kmap_local_unmap_idx(idx, vaddr)	kmap_local_calc_idx(idx)
  #endif
  
  #ifndef arch_kmap_local_high_get
  /*
   * Fallback used when the architecture does not provide its own
   * arch_kmap_local_high_get(): there is never an existing mapping to
   * reuse, so NULL is returned for every @page.
   */
  static inline void *arch_kmap_local_high_get(struct page *page)
  {
  	void *existing = NULL;

  	return existing;
  }
  #endif
a1dce7fd2   Thomas Gleixner   mm/highmem: prepa...
464
465
466
467
  /*
   * Install a kmap_local PTE. Architectures may override this; the
   * fallback is a plain set_pte_at().
   */
  #ifndef arch_kmap_local_set_pte
  #define arch_kmap_local_set_pte(mm, vaddr, ptep, ptev)	\
  	set_pte_at(mm, vaddr, ptep, ptev)
  #endif
298fa1ad5   Thomas Gleixner   highmem: Provide ...
468
  /* Unmap a local mapping which was obtained by kmap_high_get() */
2a656cad3   Thomas Gleixner   mm/highmem: Take ...
469
  static inline bool kmap_high_unmap_local(unsigned long vaddr)
298fa1ad5   Thomas Gleixner   highmem: Provide ...
470
471
  {
  #ifdef ARCH_NEEDS_KMAP_HIGH_GET
2a656cad3   Thomas Gleixner   mm/highmem: Take ...
472
  	if (vaddr >= PKMAP_ADDR(0) && vaddr < PKMAP_ADDR(LAST_PKMAP)) {
298fa1ad5   Thomas Gleixner   highmem: Provide ...
473
  		kunmap_high(pte_page(pkmap_page_table[PKMAP_NR(vaddr)]));
2a656cad3   Thomas Gleixner   mm/highmem: Take ...
474
475
  		return true;
  	}
298fa1ad5   Thomas Gleixner   highmem: Provide ...
476
  #endif
2a656cad3   Thomas Gleixner   mm/highmem: Take ...
477
  	return false;
298fa1ad5   Thomas Gleixner   highmem: Provide ...
478
479
480
481
482
483
484
485
  }
  
  /*
   * Convert a per-task slot index into a global index: each CPU owns a
   * window of KM_MAX_IDX consecutive slots, selected by smp_processor_id().
   */
  static inline int kmap_local_calc_idx(int idx)
  {
  	return KM_MAX_IDX * smp_processor_id() + idx;
  }
  
  static pte_t *__kmap_pte;
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
486
  static pte_t *kmap_get_pte(unsigned long vaddr, int idx)
298fa1ad5   Thomas Gleixner   highmem: Provide ...
487
  {
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
488
489
490
491
492
493
  	if (IS_ENABLED(CONFIG_KMAP_LOCAL_NON_LINEAR_PTE_ARRAY))
  		/*
  		 * Set by the arch if __kmap_pte[-idx] does not produce
  		 * the correct entry.
  		 */
  		return virt_to_kpte(vaddr);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
494
495
  	if (!__kmap_pte)
  		__kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN));
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
496
  	return &__kmap_pte[-idx];
298fa1ad5   Thomas Gleixner   highmem: Provide ...
497
498
499
500
  }
  
  /*
   * Map page frame @pfn with protection @prot into the next free
   * kmap_local slot of the current task and return the virtual address.
   *
   * The installed PTE value is also recorded in current->kmap_ctrl so the
   * mapping can be torn down and re-established across context switches.
   * Migration stays disabled until the mapping is removed again.
   */
  void *__kmap_local_pfn_prot(unsigned long pfn, pgprot_t prot)
  {
  	unsigned long kva;
  	pte_t *ptep;
  	pte_t pte;
  	int slot;

  	/*
  	 * With migration disabled the resulting virtual address remains
  	 * stable across preemption.
  	 */
  	migrate_disable();

  	preempt_disable();

  	slot = arch_kmap_local_map_idx(kmap_local_idx_push(), pfn);
  	kva = __fix_to_virt(FIX_KMAP_BEGIN + slot);
  	ptep = kmap_get_pte(kva, slot);

  	/* The slot must not already be in use */
  	BUG_ON(!pte_none(*ptep));

  	pte = pfn_pte(pfn, prot);
  	arch_kmap_local_set_pte(&init_mm, kva, ptep, pte);
  	arch_kmap_local_post_map(kva, pte);

  	/* Remember the PTE value for the sched out/in handling */
  	current->kmap_ctrl.pteval[kmap_local_idx()] = pte;

  	preempt_enable();

  	return (void *)kva;
  }
  EXPORT_SYMBOL_GPL(__kmap_local_pfn_prot);
  
  /*
   * Map @page with protection @prot for task-local use and return its
   * virtual address.
   *
   * Non-highmem pages are returned via page_address() without creating a
   * mapping, unless CONFIG_DEBUG_KMAP_LOCAL_FORCE_MAP is enabled. For all
   * other pages an existing mapping from arch_kmap_local_high_get() is
   * preferred; failing that, a new kmap_local slot is set up.
   */
  void *__kmap_local_page_prot(struct page *page, pgprot_t prot)
  {
  	void *existing;
  	bool must_map;

  	/*
  	 * With debugging enabled (and an architecture that copes with
  	 * alias mappings) always create a real mapping, to broaden the
  	 * usage of the actual kmap_local() machinery.
  	 */
  	must_map = IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL_FORCE_MAP) ||
  		   PageHighMem(page);
  	if (!must_map)
  		return page_address(page);

  	/* Try kmap_high_get() if the architecture has it enabled */
  	existing = arch_kmap_local_high_get(page);
  	if (existing)
  		return existing;

  	return __kmap_local_pfn_prot(page_to_pfn(page), prot);
  }
  EXPORT_SYMBOL(__kmap_local_page_prot);
  
  void kunmap_local_indexed(void *vaddr)
  {
  	unsigned long addr = (unsigned long) vaddr & PAGE_MASK;
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
547
  	pte_t *kmap_pte;
298fa1ad5   Thomas Gleixner   highmem: Provide ...
548
549
550
551
  	int idx;
  
  	if (addr < __fix_to_virt(FIX_KMAP_END) ||
  	    addr > __fix_to_virt(FIX_KMAP_BEGIN)) {
0e91a0c69   Thomas Gleixner   mm/highmem: Provi...
552
553
554
555
556
  		if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL_FORCE_MAP)) {
  			/* This _should_ never happen! See above. */
  			WARN_ON_ONCE(1);
  			return;
  		}
2a656cad3   Thomas Gleixner   mm/highmem: Take ...
557
558
559
560
561
562
563
564
  		/*
  		 * Handle mappings which were obtained by kmap_high_get()
  		 * first as the virtual address of such mappings is below
  		 * PAGE_OFFSET. Warn for all other addresses which are in
  		 * the user space part of the virtual address space.
  		 */
  		if (!kmap_high_unmap_local(addr))
  			WARN_ON_ONCE(addr < PAGE_OFFSET);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
565
566
567
568
569
570
  		return;
  	}
  
  	preempt_disable();
  	idx = arch_kmap_local_unmap_idx(kmap_local_idx(), addr);
  	WARN_ON_ONCE(addr != __fix_to_virt(FIX_KMAP_BEGIN + idx));
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
571
  	kmap_pte = kmap_get_pte(addr, idx);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
572
  	arch_kmap_local_pre_unmap(addr);
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
573
  	pte_clear(&init_mm, addr, kmap_pte);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
574
  	arch_kmap_local_post_unmap(addr);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
575
  	current->kmap_ctrl.pteval[kmap_local_idx()] = __pte(0);
298fa1ad5   Thomas Gleixner   highmem: Provide ...
576
577
  	kmap_local_idx_pop();
  	preempt_enable();
f3ba3c710   Thomas Gleixner   mm/highmem: Provi...
578
  	migrate_enable();
298fa1ad5   Thomas Gleixner   highmem: Provide ...
579
580
  }
  EXPORT_SYMBOL(kunmap_local_indexed);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
581
582
583
584
585
586
587
588
589
590
591
592
593
594
  
  /*
   * Invoked before switch_to(). This is safe even when during or after
   * clearing the maps an interrupt which needs a kmap_local happens because
   * the task::kmap_ctrl.idx is not modified by the unmapping code so a
   * nested kmap_local will use the next unused index and restore the index
   * on unmap. The already cleared kmaps of the outgoing task are irrelevant
   * because the interrupt context does not know about them. The same applies
   * when scheduling back in for an interrupt which happens before the
   * restore is complete.
   */
  void __kmap_local_sched_out(void)
  {
  	struct task_struct *tsk = current;
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
595
  	pte_t *kmap_pte;
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
596
597
598
599
600
601
602
603
604
  	int i;
  
  	/* Clear kmaps */
  	for (i = 0; i < tsk->kmap_ctrl.idx; i++) {
  		pte_t pteval = tsk->kmap_ctrl.pteval[i];
  		unsigned long addr;
  		int idx;
  
  		/* With debug all even slots are unmapped and act as guard */
487cfade1   Ira Weiny   mm/highmem: fix C...
605
  		if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL) && !(i & 0x01)) {
c21d040de   Max Filippov   highmem: fix chec...
606
  			WARN_ON_ONCE(pte_val(pteval) != 0);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
  			continue;
  		}
  		if (WARN_ON_ONCE(pte_none(pteval)))
  			continue;
  
  		/*
  		 * This is a horrible hack for XTENSA to calculate the
  		 * coloured PTE index. Uses the PFN encoded into the pteval
  		 * and the map index calculation because the actual mapped
  		 * virtual address is not stored in task::kmap_ctrl.
  		 * For any sane architecture this is optimized out.
  		 */
  		idx = arch_kmap_local_map_idx(i, pte_pfn(pteval));
  
  		addr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
622
  		kmap_pte = kmap_get_pte(addr, idx);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
623
  		arch_kmap_local_pre_unmap(addr);
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
624
  		pte_clear(&init_mm, addr, kmap_pte);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
625
626
627
628
629
630
631
  		arch_kmap_local_post_unmap(addr);
  	}
  }
  
  void __kmap_local_sched_in(void)
  {
  	struct task_struct *tsk = current;
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
632
  	pte_t *kmap_pte;
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
633
634
635
636
637
638
639
640
641
  	int i;
  
  	/* Restore kmaps */
  	for (i = 0; i < tsk->kmap_ctrl.idx; i++) {
  		pte_t pteval = tsk->kmap_ctrl.pteval[i];
  		unsigned long addr;
  		int idx;
  
  		/* With debug all even slots are unmapped and act as guard */
487cfade1   Ira Weiny   mm/highmem: fix C...
642
  		if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL) && !(i & 0x01)) {
c21d040de   Max Filippov   highmem: fix chec...
643
  			WARN_ON_ONCE(pte_val(pteval) != 0);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
644
645
646
647
648
649
650
651
  			continue;
  		}
  		if (WARN_ON_ONCE(pte_none(pteval)))
  			continue;
  
  		/* See comment in __kmap_local_sched_out() */
  		idx = arch_kmap_local_map_idx(i, pte_pfn(pteval));
  		addr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
4dfddb52a   Ard Biesheuvel   kmap_local: don't...
652
653
  		kmap_pte = kmap_get_pte(addr, idx);
  		set_pte_at(&init_mm, addr, kmap_pte, pteval);
5fbda3ecd   Thomas Gleixner   sched: highmem: S...
654
655
656
657
658
659
660
661
662
  		arch_kmap_local_post_map(addr, pteval);
  	}
  }
  
  /*
   * Sanity check for a task being forked: @tsk is expected to hold no
   * kmap_local mappings. If its index is non-zero, warn once and wipe the
   * whole kmap_ctrl state.
   */
  void kmap_local_fork(struct task_struct *tsk)
  {
  	if (!WARN_ON_ONCE(tsk->kmap_ctrl.idx))
  		return;

  	memset(&tsk->kmap_ctrl, 0, sizeof(tsk->kmap_ctrl));
  }
298fa1ad5   Thomas Gleixner   highmem: Provide ...
663
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
664

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
665
666
667
668
669
670
671
672
673
674
675
676
  #if defined(HASHED_PAGE_VIRTUAL)
  
  #define PA_HASH_ORDER	7
  
  /*
   * Describes one page->virtual association.
   *
   * Entries are linked into a hash bucket's list through @list and are
   * looked up by comparing @page.
   */
  struct page_address_map {
  	struct page *page;	/* the mapped highmem page (lookup key) */
  	void *virtual;		/* virtual address the page is mapped at */
  	struct list_head list;	/* link in page_address_slot::lh */
  };
a354e2c84   Joonsoo Kim   mm, highmem: remo...
677
  static struct page_address_map page_address_maps[LAST_PKMAP];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
678
679
680
681
682
683
684
685
  
  /*
   * Hash table bucket.
   *
   * page_address_htable holds 1 << PA_HASH_ORDER buckets. page_slot()
   * selects a bucket by hashing the struct page pointer, and
   * page_address_init() initialises each bucket's list and lock.
   */
  static struct page_address_slot {
  	struct list_head lh;			/* List of page_address_maps */
  	spinlock_t lock;			/* Protect this bucket's list */
  } ____cacheline_aligned_in_smp page_address_htable[1<<PA_HASH_ORDER];
f99187947   Ian Campbell   mm: make HASHED_P...
686
  static struct page_address_slot *page_slot(const struct page *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
687
688
689
  {
  	return &page_address_htable[hash_ptr(page, PA_HASH_ORDER)];
  }
77f6078aa   Randy Dunlap   mm: highmem kerne...
690
691
692
693
694
695
  /**
   * page_address - get the mapped virtual address of a page
   * @page: &struct page to get the virtual address of
   *
   * Returns the page's virtual address.
   */
f99187947   Ian Campbell   mm: make HASHED_P...
696
  void *page_address(const struct page *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
  {
  	unsigned long flags;
  	void *ret;
  	struct page_address_slot *pas;
  
  	if (!PageHighMem(page))
  		return lowmem_page_address(page);
  
  	pas = page_slot(page);
  	ret = NULL;
  	spin_lock_irqsave(&pas->lock, flags);
  	if (!list_empty(&pas->lh)) {
  		struct page_address_map *pam;
  
  		list_for_each_entry(pam, &pas->lh, list) {
  			if (pam->page == page) {
  				ret = pam->virtual;
  				goto done;
  			}
  		}
  	}
  done:
  	spin_unlock_irqrestore(&pas->lock, flags);
  	return ret;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
722
  EXPORT_SYMBOL(page_address);
77f6078aa   Randy Dunlap   mm: highmem kerne...
723
724
725
726
727
  /**
   * set_page_address - set a page's virtual address
   * @page: &struct page to set
   * @virtual: virtual address to use
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
728
729
730
731
732
733
734
735
736
737
  void set_page_address(struct page *page, void *virtual)
  {
  	unsigned long flags;
  	struct page_address_slot *pas;
  	struct page_address_map *pam;
  
  	BUG_ON(!PageHighMem(page));
  
  	pas = page_slot(page);
  	if (virtual) {		/* Add */
a354e2c84   Joonsoo Kim   mm, highmem: remo...
738
  		pam = &page_address_maps[PKMAP_NR((unsigned long)virtual)];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
739
740
741
742
743
744
745
746
747
748
749
750
  		pam->page = page;
  		pam->virtual = virtual;
  
  		spin_lock_irqsave(&pas->lock, flags);
  		list_add_tail(&pam->list, &pas->lh);
  		spin_unlock_irqrestore(&pas->lock, flags);
  	} else {		/* Remove */
  		spin_lock_irqsave(&pas->lock, flags);
  		list_for_each_entry(pam, &pas->lh, list) {
  			if (pam->page == page) {
  				list_del(&pam->list);
  				spin_unlock_irqrestore(&pas->lock, flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
751
752
753
754
755
756
757
758
  				goto done;
  			}
  		}
  		spin_unlock_irqrestore(&pas->lock, flags);
  	}
  done:
  	return;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
759
760
761
  /*
   * Boot-time initialisation of the page address hash table: give every
   * bucket an empty list and an initialised spinlock.
   */
  void __init page_address_init(void)
  {
  	struct page_address_slot *bucket = page_address_htable;
  	struct page_address_slot *end =
  		page_address_htable + ARRAY_SIZE(page_address_htable);

  	for (; bucket < end; bucket++) {
  		INIT_LIST_HEAD(&bucket->lh);
  		spin_lock_init(&bucket->lock);
  	}
  }
955cc774f   Ira Weiny   mm/highmem.c: cle...
767
  #endif	/* defined(HASHED_PAGE_VIRTUAL) */