Blame view

mm/nommu.c 53.2 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
  /*
   *  linux/mm/nommu.c
   *
   *  Replacement code for mm functions to support CPUs that don't
   *  have any form of memory management unit (thus no virtual memory).
   *
   *  See Documentation/nommu-mmap.txt
   *
8feae1311   David Howells   NOMMU: Make VMAs ...
9
   *  Copyright (c) 2004-2008 David Howells <dhowells@redhat.com>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
12
   *  Copyright (c) 2000-2003 David McCullough <davidm@snapgear.com>
   *  Copyright (c) 2000-2001 D Jeff Dionne <jeff@uClinux.org>
   *  Copyright (c) 2002      Greg Ungerer <gerg@snapgear.com>
29c185e5c   Paul Mundt   nommu: Provide st...
13
   *  Copyright (c) 2007-2010 Paul Mundt <lethal@linux-sh.org>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
14
   */
b95f1b31b   Paul Gortmaker   mm: Map most file...
15
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
16
17
18
19
20
21
22
23
  #include <linux/mm.h>
  #include <linux/mman.h>
  #include <linux/swap.h>
  #include <linux/file.h>
  #include <linux/highmem.h>
  #include <linux/pagemap.h>
  #include <linux/slab.h>
  #include <linux/vmalloc.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
24
25
26
27
28
29
  #include <linux/blkdev.h>
  #include <linux/backing-dev.h>
  #include <linux/mount.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
120a795da   Al Viro   audit mmap
30
  #include <linux/audit.h>
cf4aebc29   Clark Williams   sched: Move sched...
31
  #include <linux/sched/sysctl.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
32
33
34
35
  
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
  #include <asm/tlbflush.h>
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
36
  #include <asm/mmu_context.h>
8feae1311   David Howells   NOMMU: Make VMAs ...
37
  #include "internal.h"
8feae1311   David Howells   NOMMU: Make VMAs ...
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
  /*
   * Debug tracing helpers.
   *
   * kenter() logs entry to the calling function, kleave() logs exit from it
   * and kdebug() logs a free-form message.  With "#if 0" below they all
   * expand to no_printk(); change it to "#if 1" to route them to printk().
   * Each macro appends a terminating "\n" to the caller's format string.
   */
  #if 0
  #define kenter(FMT, ...) \
  	printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	printk(KERN_DEBUG "xxx" FMT"yyy\n", ##__VA_ARGS__)
  #else
  #define kenter(FMT, ...) \
  	no_printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	no_printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	no_printk(KERN_DEBUG FMT"\n", ##__VA_ARGS__)
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
59
60
61
62
63
  
  void *high_memory;
  struct page *mem_map;
  unsigned long max_mapnr;
  unsigned long num_physpages;
4266c97a3   Hugh Dickins   nommu: fix two bu...
64
  unsigned long highest_memmap_pfn;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
65
  struct percpu_counter vm_committed_as;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
66
67
68
  int sysctl_overcommit_memory = OVERCOMMIT_GUESS; /* heuristic overcommit */
  int sysctl_overcommit_ratio = 50; /* default is 50% */
  int sysctl_max_map_count = DEFAULT_MAX_MAP_COUNT;
fc4d5c292   David Howells   nommu: make the i...
69
  int sysctl_nr_trim_pages = CONFIG_NOMMU_INITIAL_TRIM_EXCESS;
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
70
  unsigned long sysctl_user_reserve_kbytes __read_mostly = 1UL << 17; /* 128MB */
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
71
  unsigned long sysctl_admin_reserve_kbytes __read_mostly = 1UL << 13; /* 8MB */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
72
  int heap_stack_gap = 0;
33e5d7697   David Howells   nommu: fix a numb...
73
  atomic_long_t mmap_pages_allocated;
8feae1311   David Howells   NOMMU: Make VMAs ...
74

997071bcb   K. Y. Srinivasan   mm: export a func...
75
76
77
78
79
80
81
82
83
84
85
86
87
88
  /*
   * Report the amount of memory currently committed system-wide, as tracked
   * by the vm_committed_as per-cpu counter.
   *
   * This figure can be used as a metric to drive ballooning decisions when
   * Linux runs as a guest.  On Hyper-V, for example, the host's policy engine
   * balances memory dynamically across competing virtual machines, and the
   * commitment reported by each guest is one of its inputs.
   */
  unsigned long vm_memory_committed(void)
  {
  	unsigned long committed;

  	committed = percpu_counter_read_positive(&vm_committed_as);
  	return committed;
  }
  
  EXPORT_SYMBOL_GPL(vm_memory_committed);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
89
  EXPORT_SYMBOL(mem_map);
6a04de6db   Wu, Bryan   [PATCH] nommu: fi...
90
  EXPORT_SYMBOL(num_physpages);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
91

8feae1311   David Howells   NOMMU: Make VMAs ...
92
93
94
95
  /* list of mapped, potentially shareable regions */
  static struct kmem_cache *vm_region_jar;
  struct rb_root nommu_region_tree = RB_ROOT;
  DECLARE_RWSEM(nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
96

f0f37e2f7   Alexey Dobriyan   const: mark struc...
97
  const struct vm_operations_struct generic_file_vm_ops = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
98
99
100
  };
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
101
102
103
104
105
106
107
108
   * Return the total memory allocated for this pointer, not
   * just what the caller asked for.
   *
   * Doesn't have to be accurate, i.e. may have races.
   */
  unsigned int kobjsize(const void *objp)
  {
  	struct page *page;
4016a1390   Michael Hennerich   mm/nommu.c: retur...
109
110
111
112
  	/*
  	 * If the object we have should not have ksize performed on it,
  	 * return size of 0
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
113
  	if (!objp || !virt_addr_valid(objp))
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
114
115
116
  		return 0;
  
  	page = virt_to_head_page(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
117
118
119
120
121
  
  	/*
  	 * If the allocator sets PageSlab, we know the pointer came from
  	 * kmalloc().
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
122
123
  	if (PageSlab(page))
  		return ksize(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
124
  	/*
ab2e83ead   Paul Mundt   NOMMU: Teach kobj...
125
126
127
128
129
130
131
132
133
134
135
136
137
138
  	 * If it's not a compound page, see if we have a matching VMA
  	 * region. This test is intentionally done in reverse order,
  	 * so if there's no VMA, we still fall through and hand back
  	 * PAGE_SIZE for 0-order pages.
  	 */
  	if (!PageCompound(page)) {
  		struct vm_area_struct *vma;
  
  		vma = find_vma(current->mm, (unsigned long)objp);
  		if (vma)
  			return vma->vm_end - vma->vm_start;
  	}
  
  	/*
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
139
  	 * The ksize() function is only guaranteed to work for pointers
5a1603be5   Paul Mundt   nommu: Correct ko...
140
  	 * returned by kmalloc(). So handle arbitrary pointers here.
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
141
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
142
  	return PAGE_SIZE << compound_order(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
143
  }
28a35716d   Michel Lespinasse   mm: use long type...
144
145
146
147
  long __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		      unsigned long start, unsigned long nr_pages,
  		      unsigned int foll_flags, struct page **pages,
  		      struct vm_area_struct **vmas, int *nonblocking)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
148
  {
910e46da4   Sonic Zhang   [PATCH] Check if ...
149
  	struct vm_area_struct *vma;
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
150
151
152
153
  	unsigned long vm_flags;
  	int i;
  
  	/* calculate required read or write permissions.
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
154
  	 * If FOLL_FORCE is set, we only require the "MAY" flags.
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
155
  	 */
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
156
157
158
159
  	vm_flags  = (foll_flags & FOLL_WRITE) ?
  			(VM_WRITE | VM_MAYWRITE) : (VM_READ | VM_MAYREAD);
  	vm_flags &= (foll_flags & FOLL_FORCE) ?
  			(VM_MAYREAD | VM_MAYWRITE) : (VM_READ | VM_WRITE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
160

9d73777e5   Peter Zijlstra   clarify get_user_...
161
  	for (i = 0; i < nr_pages; i++) {
7561e8ca0   David Howells   NOMMU: Revert 'no...
162
  		vma = find_vma(mm, start);
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
163
164
165
166
  		if (!vma)
  			goto finish_or_fault;
  
  		/* protect what we can, including chardevs */
1c3aff1ce   Hugh Dickins   mm: remove unused...
167
168
  		if ((vma->vm_flags & (VM_IO | VM_PFNMAP)) ||
  		    !(vm_flags & vma->vm_flags))
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
169
  			goto finish_or_fault;
910e46da4   Sonic Zhang   [PATCH] Check if ...
170

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
171
172
173
174
175
176
  		if (pages) {
  			pages[i] = virt_to_page(start);
  			if (pages[i])
  				page_cache_get(pages[i]);
  		}
  		if (vmas)
910e46da4   Sonic Zhang   [PATCH] Check if ...
177
  			vmas[i] = vma;
e1ee65d85   David Howells   NOMMU: Fix __get_...
178
  		start = (start + PAGE_SIZE) & PAGE_MASK;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
179
  	}
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
180
181
182
183
184
  
  	return i;
  
  finish_or_fault:
  	return i ? : -EFAULT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
185
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
186

b291f0003   Nick Piggin   mlock: mlocked pa...
187
188
189
190
191
192
193
  /*
   * get a list of pages in an address range belonging to the specified process
   * and indicate the VMA that covers each page
   * - this is potentially dodgy as we may end up incrementing the page count of a
   *   slab page or a secondary page from a compound page
   * - don't permit access to VMAs that don't support it, such as I/O mappings
   */
28a35716d   Michel Lespinasse   mm: use long type...
194
195
196
197
  long get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		    unsigned long start, unsigned long nr_pages,
  		    int write, int force, struct page **pages,
  		    struct vm_area_struct **vmas)
b291f0003   Nick Piggin   mlock: mlocked pa...
198
199
200
201
  {
  	int flags = 0;
  
  	if (write)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
202
  		flags |= FOLL_WRITE;
b291f0003   Nick Piggin   mlock: mlocked pa...
203
  	if (force)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
204
  		flags |= FOLL_FORCE;
b291f0003   Nick Piggin   mlock: mlocked pa...
205

53a7706d5   Michel Lespinasse   mlock: do not hol...
206
207
  	return __get_user_pages(tsk, mm, start, nr_pages, flags, pages, vmas,
  				NULL);
b291f0003   Nick Piggin   mlock: mlocked pa...
208
  }
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
209
  EXPORT_SYMBOL(get_user_pages);
dfc2f91ac   Paul Mundt   nommu: provide fo...
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
  /**
   * follow_pfn - look up PFN at a user virtual address
   * @vma: memory mapping
   * @address: user virtual address
   * @pfn: location to store found PFN
   *
   * Only mappings flagged VM_IO or VM_PFNMAP are accepted.  For those the
   * PFN is simply @address shifted right by PAGE_SHIFT.
   *
   * Returns zero and the pfn at @pfn on success, -EINVAL otherwise (in which
   * case @pfn is left untouched).
   */
  int follow_pfn(struct vm_area_struct *vma, unsigned long address,
  	unsigned long *pfn)
  {
  	if (vma->vm_flags & (VM_IO | VM_PFNMAP)) {
  		*pfn = address >> PAGE_SHIFT;
  		return 0;
  	}

  	return -EINVAL;
  }
  EXPORT_SYMBOL(follow_pfn);
f1c4069e1   Joonsoo Kim   mm, vmalloc: expo...
230
  LIST_HEAD(vmap_area_list);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
231

b3bdda02a   Christoph Lameter   vmalloc: add cons...
232
  void vfree(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
233
234
235
  {
  	kfree(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
236
  EXPORT_SYMBOL(vfree);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
237

dd0fc66fb   Al Viro   [PATCH] gfp flags...
238
  void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
239
240
  {
  	/*
8518609de   Robert P. J. Day   Explain clearly w...
241
242
  	 *  You can't specify __GFP_HIGHMEM with kmalloc() since kmalloc()
  	 * returns only a logical address.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
243
  	 */
84097518d   Nick Piggin   [PATCH] mm: nommu...
244
  	return kmalloc(size, (gfp_mask | __GFP_COMP) & ~__GFP_HIGHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
245
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
246
  EXPORT_SYMBOL(__vmalloc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
247

f905bc447   Paul Mundt   nommu: add new vm...
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
  void *vmalloc_user(unsigned long size)
  {
  	void *ret;
  
  	ret = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	if (ret) {
  		struct vm_area_struct *vma;
  
  		down_write(&current->mm->mmap_sem);
  		vma = find_vma(current->mm, (unsigned long)ret);
  		if (vma)
  			vma->vm_flags |= VM_USERMAP;
  		up_write(&current->mm->mmap_sem);
  	}
  
  	return ret;
  }
  EXPORT_SYMBOL(vmalloc_user);
b3bdda02a   Christoph Lameter   vmalloc: add cons...
267
  struct page *vmalloc_to_page(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
268
269
270
  {
  	return virt_to_page(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
271
  EXPORT_SYMBOL(vmalloc_to_page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
272

b3bdda02a   Christoph Lameter   vmalloc: add cons...
273
  unsigned long vmalloc_to_pfn(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
274
275
276
  {
  	return page_to_pfn(virt_to_page(addr));
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
277
  EXPORT_SYMBOL(vmalloc_to_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
  
  /*
   * vread - copy @count bytes from @addr into @buf
   *
   * @count is first clamped so that neither @buf + @count nor @addr + @count
   * wraps past the top of the address space, mirroring the check vwrite()
   * applies to its destination.
   *
   * Returns the number of bytes actually copied.
   */
  long vread(char *buf, char *addr, unsigned long count)
  {
  	/* Don't allow overflow */
  	if ((unsigned long) buf + count < count)
  		count = -(unsigned long) buf;
  	if ((unsigned long) addr + count < count)
  		count = -(unsigned long) addr;

  	memcpy(buf, addr, count);
  	return count;
  }
  
  /*
   * vwrite - copy @count bytes from @buf to @addr
   *
   * If @addr + @count would wrap around, @count is reduced to the number of
   * bytes between @addr and the top of the address space.
   *
   * Returns the number of bytes actually copied.
   */
  long vwrite(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dest = (unsigned long) addr;

  	/* Clamp the length rather than let the destination range wrap */
  	if (dest + count < count)
  		count = -dest;

  	memcpy(addr, buf, count);
  	return count;
  }
  
  /*
   *	vmalloc  -  allocate virtually contiguous memory
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *
c1c8897f8   Michael Opdenacker   Spelling fix: "co...
303
   *	For tight control over page level allocator and protection flags
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
304
305
306
307
308
309
   *	use __vmalloc() instead.
   */
  void *vmalloc(unsigned long size)
  {
  	void *mem;

  	/* same request as vzalloc(), but without __GFP_ZERO */
  	mem = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
  	return mem;
  }
f61388822   Andrew Morton   [PATCH] nommu: im...
310
  EXPORT_SYMBOL(vmalloc);
e1ca7788d   Dave Young   mm: add vzalloc()...
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
  /*
   *	vzalloc - allocate virtually contiguous memory with zero fill
   *
   *	@size:		allocation size
   *
   *	Allocate enough memory to cover @size and hand it back zeroed.
   *	The request is forwarded to __vmalloc() with __GFP_ZERO set.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  void *vzalloc(unsigned long size)
  {
  	void *mem;

  	mem = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	return mem;
  }
  EXPORT_SYMBOL(vzalloc);
  
  /**
   * vmalloc_node - allocate memory on a specific node
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
f61388822   Andrew Morton   [PATCH] nommu: im...
341
342
343
344
  void *vmalloc_node(unsigned long size, int node)
  {
  	/* @node is not consulted here: the request goes straight to vmalloc() */
  	return vmalloc(size);
  }
9a14f653d   Paul Mundt   nommu: Fix up vma...
345
  EXPORT_SYMBOL(vmalloc_node);
e1ca7788d   Dave Young   mm: add vzalloc()...
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
  
  /**
   * vzalloc_node - allocate memory on a specific node with zero fill
   * @size:	allocation size
   * @node:	numa node (not consulted by this implementation)
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   * The memory allocated is set to zero.
   *
   * This version simply forwards @size to vzalloc().
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
  void *vzalloc_node(unsigned long size, int node)
  {
  	return vzalloc(size);
  }
  EXPORT_SYMBOL(vzalloc_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
364

1af446edf   Paul Mundt   nommu: Provide vm...
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
  #ifndef PAGE_KERNEL_EXEC
  # define PAGE_KERNEL_EXEC PAGE_KERNEL
  #endif
  
  /**
   *	vmalloc_exec  -  allocate virtually contiguous, executable memory
   *	@size:		allocation size
   *
   *	Kernel-internal function to allocate enough pages to cover @size
   *	from the page level allocator and map them into contiguous and
   *	executable kernel virtual space.
   *
   *	The protection passed down is PAGE_KERNEL_EXEC, which this file
   *	defines as PAGE_KERNEL when nothing else has defined it.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  
  void *vmalloc_exec(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
385
386
  /**
   * vmalloc_32  -  allocate virtually contiguous memory (32bit addressable)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
387
388
389
390
391
392
393
394
395
   *	@size:		allocation size
   *
   *	Allocate enough 32bit PA addressable pages to cover @size from the
   *	page level allocator and map them into contiguous kernel virtual space.
   */
  void *vmalloc_32(unsigned long size)
  {
  	/* unlike vmalloc(), __GFP_HIGHMEM is not requested here */
  	return __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
396
397
398
399
400
401
402
403
  EXPORT_SYMBOL(vmalloc_32);
  
  /**
   * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
   *	@size:		allocation size
   *
   * The resulting memory area is 32bit addressable and zeroed so it can be
   * mapped to userspace without leaking data.
f905bc447   Paul Mundt   nommu: add new vm...
404
405
406
   *
   * VM_USERMAP is set on the corresponding VMA so that subsequent calls to
   * remap_vmalloc_range() are permissible.
b50731732   Paul Mundt   nommu: vmalloc_32...
407
408
409
   */
  void *vmalloc_32_user(unsigned long size)
  {
f905bc447   Paul Mundt   nommu: add new vm...
410
411
412
413
414
  	/*
  	 * We'll have to sort out the ZONE_DMA bits for 64-bit,
  	 * but for now this can simply use vmalloc_user() directly.
  	 */
  	return vmalloc_user(size);
b50731732   Paul Mundt   nommu: vmalloc_32...
415
416
  }
  EXPORT_SYMBOL(vmalloc_32_user);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
417
418
419
420
421
422
  
  /*
   * vmap() has no implementation in this file: any call hits BUG().
   * None of the arguments are examined.
   */
  void *vmap(struct page **pages, unsigned int count, unsigned long flags, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
423
  EXPORT_SYMBOL(vmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
424

b3bdda02a   Christoph Lameter   vmalloc: add cons...
425
  void vunmap(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
426
427
428
  {
  	BUG();
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
429
  EXPORT_SYMBOL(vunmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
430

eb6434d9e   Paul Mundt   nommu: Stub in vm...
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
  /*
   * vm_map_ram() has no implementation in this file: any call hits BUG().
   * None of the arguments are examined.
   */
  void *vm_map_ram(struct page **pages, unsigned int count, int node, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL(vm_map_ram);
  
  /*
   * Counterpart of vm_map_ram(); likewise unimplemented here, so any call
   * hits BUG().
   */
  void vm_unmap_ram(const void *mem, unsigned int count)
  {
  	BUG();
  }
  EXPORT_SYMBOL(vm_unmap_ram);
  
  /*
   * Intentionally empty: this implementation does nothing when asked to
   * unmap aliases.
   */
  void vm_unmap_aliases(void)
  {
  }
  EXPORT_SYMBOL_GPL(vm_unmap_aliases);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
448
  /*
1eeb66a1b   Christoph Hellwig   move die notifier...
449
450
451
452
453
454
   * Implement a stub for vmalloc_sync_all() if the architecture chose not to
   * have one.
   */
  void  __attribute__((weak)) vmalloc_sync_all(void)
  {
  	/* empty weak default; does nothing */
  }
29c185e5c   Paul Mundt   nommu: Provide st...
455
456
457
458
459
460
461
462
463
464
465
466
  /**
   *	alloc_vm_area - allocate a range of kernel address space
   *	@size:		size of the area
   *
   *	Returns:	NULL on failure, vm_struct on success
   *
   *	This function reserves a range of kernel address space, and
   *	allocates pagetables to map that range.  No actual mappings
   *	are created.  If the kernel address space is not shared
   *	between processes, it syncs the pagetable across all
   *	processes.
   */
cd12909cb   David Vrabel   xen: map foreign ...
467
  struct vm_struct *alloc_vm_area(size_t size, pte_t **ptes)
29c185e5c   Paul Mundt   nommu: Provide st...
468
469
470
471
472
473
474
475
476
477
478
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL_GPL(alloc_vm_area);
  
  /*
   * free_vm_area() has no implementation in this file: any call hits BUG().
   * @area is not examined.
   */
  void free_vm_area(struct vm_struct *area)
  {
  	BUG();
  }
  EXPORT_SYMBOL_GPL(free_vm_area);
b50731732   Paul Mundt   nommu: vmalloc_32...
479
480
481
482
483
484
  /*
   * vm_insert_page() is not supported by this implementation: it always
   * returns -EINVAL and touches none of its arguments.
   */
  int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
  		   struct page *page)
  {
  	return -EINVAL;
  }
  EXPORT_SYMBOL(vm_insert_page);
1eeb66a1b   Christoph Hellwig   move die notifier...
485
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
486
487
488
489
490
491
   *  sys_brk() for the most part doesn't need the global kernel
   *  lock, except when an application is doing something nasty
   *  like trying to un-brk an area that has already been mapped
   *  to a regular file.  in this case, the unmapping will need
   *  to invoke file system routines that need the global lock.
   */
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
492
  SYSCALL_DEFINE1(brk, unsigned long, brk)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
  {
  	struct mm_struct *mm = current->mm;
  
  	if (brk < mm->start_brk || brk > mm->context.end_brk)
  		return mm->brk;
  
  	if (mm->brk == brk)
  		return mm->brk;
  
  	/*
  	 * Always allow shrinking brk
  	 */
  	if (brk <= mm->brk) {
  		mm->brk = brk;
  		return brk;
  	}
  
  	/*
  	 * Ok, looks good - let it rip.
  	 */
cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
513
  	flush_icache_range(mm->brk, brk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
514
515
  	return mm->brk = brk;
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
516
517
518
519
  /*
   * initialise the VMA and region record slabs
   */
  void __init mmap_init(void)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
520
  {
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
521
522
523
524
  	int ret;
  
  	ret = percpu_counter_init(&vm_committed_as, 0);
  	VM_BUG_ON(ret);
33e5d7697   David Howells   nommu: fix a numb...
525
  	vm_region_jar = KMEM_CACHE(vm_region, SLAB_PANIC);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
526
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
527

3034097a5   David Howells   [PATCH] NOMMU: Or...
528
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
529
530
   * validate the region tree
   * - the caller must hold the region lock
3034097a5   David Howells   [PATCH] NOMMU: Or...
531
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
532
533
  #ifdef CONFIG_DEBUG_NOMMU_REGIONS
  static noinline void validate_nommu_regions(void)
3034097a5   David Howells   [PATCH] NOMMU: Or...
534
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
535
536
  	struct vm_region *region, *last;
  	struct rb_node *p, *lastp;
3034097a5   David Howells   [PATCH] NOMMU: Or...
537

8feae1311   David Howells   NOMMU: Make VMAs ...
538
539
540
541
542
  	lastp = rb_first(&nommu_region_tree);
  	if (!lastp)
  		return;
  
  	last = rb_entry(lastp, struct vm_region, vm_rb);
33e5d7697   David Howells   nommu: fix a numb...
543
544
  	BUG_ON(unlikely(last->vm_end <= last->vm_start));
  	BUG_ON(unlikely(last->vm_top < last->vm_end));
8feae1311   David Howells   NOMMU: Make VMAs ...
545
546
547
548
  
  	while ((p = rb_next(lastp))) {
  		region = rb_entry(p, struct vm_region, vm_rb);
  		last = rb_entry(lastp, struct vm_region, vm_rb);
33e5d7697   David Howells   nommu: fix a numb...
549
550
551
  		BUG_ON(unlikely(region->vm_end <= region->vm_start));
  		BUG_ON(unlikely(region->vm_top < region->vm_end));
  		BUG_ON(unlikely(region->vm_start < last->vm_top));
3034097a5   David Howells   [PATCH] NOMMU: Or...
552

8feae1311   David Howells   NOMMU: Make VMAs ...
553
554
  		lastp = p;
  	}
3034097a5   David Howells   [PATCH] NOMMU: Or...
555
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
556
  #else
33e5d7697   David Howells   nommu: fix a numb...
557
558
559
  /* no-op variant used when CONFIG_DEBUG_NOMMU_REGIONS is not defined */
  static void validate_nommu_regions(void)
  {
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
560
  #endif
3034097a5   David Howells   [PATCH] NOMMU: Or...
561
562
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
563
   * add a region into the global tree
3034097a5   David Howells   [PATCH] NOMMU: Or...
564
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
565
  static void add_nommu_region(struct vm_region *region)
3034097a5   David Howells   [PATCH] NOMMU: Or...
566
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
567
568
  	struct vm_region *pregion;
  	struct rb_node **p, *parent;
3034097a5   David Howells   [PATCH] NOMMU: Or...
569

8feae1311   David Howells   NOMMU: Make VMAs ...
570
  	validate_nommu_regions();
8feae1311   David Howells   NOMMU: Make VMAs ...
571
572
573
574
575
576
577
578
579
580
581
582
583
  	parent = NULL;
  	p = &nommu_region_tree.rb_node;
  	while (*p) {
  		parent = *p;
  		pregion = rb_entry(parent, struct vm_region, vm_rb);
  		if (region->vm_start < pregion->vm_start)
  			p = &(*p)->rb_left;
  		else if (region->vm_start > pregion->vm_start)
  			p = &(*p)->rb_right;
  		else if (pregion == region)
  			return;
  		else
  			BUG();
3034097a5   David Howells   [PATCH] NOMMU: Or...
584
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
585
586
  	rb_link_node(&region->vm_rb, parent, p);
  	rb_insert_color(&region->vm_rb, &nommu_region_tree);
3034097a5   David Howells   [PATCH] NOMMU: Or...
587

8feae1311   David Howells   NOMMU: Make VMAs ...
588
  	validate_nommu_regions();
3034097a5   David Howells   [PATCH] NOMMU: Or...
589
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
590
591
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
592
   * delete a region from the global tree
930e652a2   David Howells   [PATCH] NOMMU: Ma...
593
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
594
  static void delete_nommu_region(struct vm_region *region)
930e652a2   David Howells   [PATCH] NOMMU: Ma...
595
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
596
  	BUG_ON(!nommu_region_tree.rb_node);
930e652a2   David Howells   [PATCH] NOMMU: Ma...
597

8feae1311   David Howells   NOMMU: Make VMAs ...
598
599
600
  	validate_nommu_regions();
  	rb_erase(&region->vm_rb, &nommu_region_tree);
  	validate_nommu_regions();
57c8f63e8   Greg Ungerer   nommu: stub expan...
601
  }
930e652a2   David Howells   [PATCH] NOMMU: Ma...
602
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
603
   * free a contiguous series of pages
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
604
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
605
  static void free_page_series(unsigned long from, unsigned long to)
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
606
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
607
608
609
610
  	for (; from < to; from += PAGE_SIZE) {
  		struct page *page = virt_to_page(from);
  
  		kdebug("- free %lx", from);
33e5d7697   David Howells   nommu: fix a numb...
611
  		atomic_long_dec(&mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
612
  		if (page_count(page) != 1)
33e5d7697   David Howells   nommu: fix a numb...
613
614
  			kdebug("free page %p: refcount not one: %d",
  			       page, page_count(page));
8feae1311   David Howells   NOMMU: Make VMAs ...
615
  		put_page(page);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
616
  	}
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
617
618
619
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
620
   * release a reference to a region
33e5d7697   David Howells   nommu: fix a numb...
621
   * - the caller must hold the region semaphore for writing, which this releases
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
622
   * - the region may not have been added to the tree yet, in which case vm_top
8feae1311   David Howells   NOMMU: Make VMAs ...
623
   *   will equal vm_start
3034097a5   David Howells   [PATCH] NOMMU: Or...
624
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
625
626
  static void __put_nommu_region(struct vm_region *region)
  	__releases(nommu_region_sem)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
627
  {
1e2ae599d   David Howells   nommu: struct vm_...
628
  	kenter("%p{%d}", region, region->vm_usage);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
629

8feae1311   David Howells   NOMMU: Make VMAs ...
630
  	BUG_ON(!nommu_region_tree.rb_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
631

1e2ae599d   David Howells   nommu: struct vm_...
632
  	if (--region->vm_usage == 0) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
633
  		if (region->vm_top > region->vm_start)
8feae1311   David Howells   NOMMU: Make VMAs ...
634
635
636
637
638
639
640
641
642
643
  			delete_nommu_region(region);
  		up_write(&nommu_region_sem);
  
  		if (region->vm_file)
  			fput(region->vm_file);
  
  		/* IO memory and memory shared directly out of the pagecache
  		 * from ramfs/tmpfs mustn't be released here */
  		if (region->vm_flags & VM_MAPPED_COPY) {
  			kdebug("free series");
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
644
  			free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
645
646
647
648
  		}
  		kmem_cache_free(vm_region_jar, region);
  	} else {
  		up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
649
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
650
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
651

8feae1311   David Howells   NOMMU: Make VMAs ...
652
653
654
655
656
657
658
  /*
   * release a reference to a region
   */
  static void put_nommu_region(struct vm_region *region)
  {
  	down_write(&nommu_region_sem);
  	__put_nommu_region(region);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
659
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
660
  /*
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
   * update protection on a vma
   */
  static void protect_vma(struct vm_area_struct *vma, unsigned long flags)
  {
  #ifdef CONFIG_MPU
  	struct mm_struct *mm = vma->vm_mm;
  	unsigned long addr;

  	/*
  	 * Walk the VMA one page at a time, starting from the page that
  	 * contains vm_start.  The cursor is unsigned so that it is compared
  	 * and advanced as an address, never as a signed quantity.
  	 */
  	for (addr = vma->vm_start & PAGE_MASK; addr < vma->vm_end;
  	     addr += PAGE_SIZE)
  		protect_page(mm, addr, flags);

  	/* apply the per-page settings once the whole range has been walked */
  	update_protections(mm);
  #endif
  	/* without CONFIG_MPU this function compiles to nothing */
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
677
678
679
680
   * add a VMA into a process's mm_struct in the appropriate place in the list
   * and tree and add to the address space's page tree also if not an anonymous
   * page
   * - should be called with mm->mmap_sem held writelocked
3034097a5   David Howells   [PATCH] NOMMU: Or...
681
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
682
  static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
683
  {
6038def0d   Namhyung Kim   mm: nommu: sort m...
684
  	struct vm_area_struct *pvma, *prev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
685
  	struct address_space *mapping;
6038def0d   Namhyung Kim   mm: nommu: sort m...
686
  	struct rb_node **p, *parent, *rb_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
687
688
689
690
691
692
693
  
  	kenter(",%p", vma);
  
  	BUG_ON(!vma->vm_region);
  
  	mm->map_count++;
  	vma->vm_mm = mm;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
694

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
695
  	protect_vma(vma, vma->vm_flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
696
697
698
  	/* add the VMA to the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
918e556ec   David Howells   NOMMU: Lock i_mma...
699
  		mutex_lock(&mapping->i_mmap_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
700
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
701
  		vma_interval_tree_insert(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
702
  		flush_dcache_mmap_unlock(mapping);
918e556ec   David Howells   NOMMU: Lock i_mma...
703
  		mutex_unlock(&mapping->i_mmap_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
704
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
705
  	/* add the VMA to the tree */
6038def0d   Namhyung Kim   mm: nommu: sort m...
706
  	parent = rb_prev = NULL;
8feae1311   David Howells   NOMMU: Make VMAs ...
707
  	p = &mm->mm_rb.rb_node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
708
709
710
  	while (*p) {
  		parent = *p;
  		pvma = rb_entry(parent, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
711
712
713
  		/* sort by: start addr, end addr, VMA struct addr in that order
  		 * (the latter is necessary as we may get identical VMAs) */
  		if (vma->vm_start < pvma->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
714
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
715
716
  		else if (vma->vm_start > pvma->vm_start) {
  			rb_prev = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
717
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
718
  		} else if (vma->vm_end < pvma->vm_end)
8feae1311   David Howells   NOMMU: Make VMAs ...
719
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
720
721
  		else if (vma->vm_end > pvma->vm_end) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
722
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
723
  		} else if (vma < pvma)
8feae1311   David Howells   NOMMU: Make VMAs ...
724
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
725
726
  		else if (vma > pvma) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
727
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
728
  		} else
8feae1311   David Howells   NOMMU: Make VMAs ...
729
  			BUG();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
730
731
732
  	}
  
  	rb_link_node(&vma->vm_rb, parent, p);
8feae1311   David Howells   NOMMU: Make VMAs ...
733
734
735
  	rb_insert_color(&vma->vm_rb, &mm->mm_rb);
  
  	/* add VMA to the VMA list also */
6038def0d   Namhyung Kim   mm: nommu: sort m...
736
737
738
  	prev = NULL;
  	if (rb_prev)
  		prev = rb_entry(rb_prev, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
739

6038def0d   Namhyung Kim   mm: nommu: sort m...
740
  	__vma_link_list(mm, vma, prev, parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
741
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
742
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
743
   * delete a VMA from its owning mm_struct and address space
3034097a5   David Howells   [PATCH] NOMMU: Or...
744
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
745
  static void delete_vma_from_mm(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
746
747
  {
  	struct address_space *mapping;
8feae1311   David Howells   NOMMU: Make VMAs ...
748
749
750
  	struct mm_struct *mm = vma->vm_mm;
  
  	kenter("%p", vma);
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
751
  	protect_vma(vma, 0);
8feae1311   David Howells   NOMMU: Make VMAs ...
752
753
754
  	mm->map_count--;
  	if (mm->mmap_cache == vma)
  		mm->mmap_cache = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
755
756
757
758
  
  	/* remove the VMA from the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
918e556ec   David Howells   NOMMU: Lock i_mma...
759
  		mutex_lock(&mapping->i_mmap_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
760
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
761
  		vma_interval_tree_remove(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
762
  		flush_dcache_mmap_unlock(mapping);
918e556ec   David Howells   NOMMU: Lock i_mma...
763
  		mutex_unlock(&mapping->i_mmap_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
764
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
765
766
  	/* remove from the MM's tree and list */
  	rb_erase(&vma->vm_rb, &mm->mm_rb);
b951bf2c4   Namhyung Kim   mm: nommu: don't ...
767
768
769
770
771
772
773
774
  
  	if (vma->vm_prev)
  		vma->vm_prev->vm_next = vma->vm_next;
  	else
  		mm->mmap = vma->vm_next;
  
  	if (vma->vm_next)
  		vma->vm_next->vm_prev = vma->vm_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
775
776
777
778
779
780
781
782
783
784
  }
  
  /*
   * destroy a VMA record
   * - calls the VMA's ->close() op if it has one, drops the VMA's file
   *   reference (if any) and its region reference, then frees the VMA back
   *   to vm_area_cachep
   * - @mm is not used by this function
   */
  static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
  {
  	struct file *file;

  	kenter("%p", vma);

  	if (vma->vm_ops && vma->vm_ops->close)
  		vma->vm_ops->close(vma);

  	/* read vm_file only after ->close() has run, as before */
  	file = vma->vm_file;
  	if (file)
  		fput(file);

  	put_nommu_region(vma->vm_region);
  	kmem_cache_free(vm_area_cachep, vma);
  }
  
  /*
   * look up the first VMA in which addr resides, NULL if none
   * - should be called with mm->mmap_sem at least held readlocked
   * - a successful list lookup is remembered in mm->mmap_cache
   */
  struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr)
  {
  	/* try the cached VMA first; the pointer is fetched exactly once */
  	struct vm_area_struct *vma = ACCESS_ONCE(mm->mmap_cache);

  	if (vma && vma->vm_start <= addr && addr < vma->vm_end)
  		return vma;

  	/* trawl the list (there may be multiple mappings in which addr
  	 * resides); stop at the first VMA that starts beyond addr, which
  	 * relies on the list being ordered by start address */
  	vma = mm->mmap;
  	while (vma && vma->vm_start <= addr) {
  		if (addr < vma->vm_end) {
  			mm->mmap_cache = vma;
  			return vma;
  		}
  		vma = vma->vm_next;
  	}

  	return NULL;
  }
  EXPORT_SYMBOL(find_vma);
  
  /*
   * find a VMA
   * - we don't extend stack VMAs under NOMMU conditions, so this is just
   *   find_vma() under another name
   */
  struct vm_area_struct *find_extend_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *vma = find_vma(mm, addr);

  	return vma;
  }
  
  /*
   * expand a stack to a given address
   * - not supported under NOMMU conditions: both arguments are ignored and
   *   -ENOMEM is always returned
   */
  int expand_stack(struct vm_area_struct *vma, unsigned long address)
  {
  	return -ENOMEM;
  }
  
  /*
   * look up the first VMA that exactly matches the range [addr, addr + len)
   * - should be called with mm->mmap_sem at least held readlocked
   * - returns the matching VMA (and remembers it in mm->mmap_cache), or NULL
   *   if no VMA starts at addr and ends at addr + len
   */
  static struct vm_area_struct *find_vma_exact(struct mm_struct *mm,
  					     unsigned long addr,
  					     unsigned long len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end = addr + len;

  	/* check the cache first; fetch the pointer exactly once, as
  	 * find_vma() does, since other lookups may update mm->mmap_cache
  	 * while we only hold the semaphore for reading */
  	vma = ACCESS_ONCE(mm->mmap_cache);
  	if (vma && vma->vm_start == addr && vma->vm_end == end)
  		return vma;

  	/* trawl the list (there may be multiple mappings in which addr
  	 * resides) */
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
  		if (vma->vm_start < addr)
  			continue;
  		/* gone past every VMA that could start at addr */
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end == end) {
  			mm->mmap_cache = vma;
  			return vma;
  		}
  	}

  	return NULL;
  }
  
  /*
   * determine whether a mapping should be permitted and, if so, what sort of
   * mapping we're capable of supporting
   */
  static int validate_mmap_request(struct file *file,
  				 unsigned long addr,
  				 unsigned long len,
  				 unsigned long prot,
  				 unsigned long flags,
  				 unsigned long pgoff,
  				 unsigned long *_capabilities)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
879
  	unsigned long capabilities, rlen;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
880
881
882
  	int ret;
  
  	/* do the simple checks first */
06aab5a30   David Howells   NOMMU: Ignore mma...
883
  	if (flags & MAP_FIXED) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
884
885
886
887
888
889
890
891
892
893
  		printk(KERN_DEBUG
  		       "%d: Can't do fixed-address/overlay mmap of RAM
  ",
  		       current->pid);
  		return -EINVAL;
  	}
  
  	if ((flags & MAP_TYPE) != MAP_PRIVATE &&
  	    (flags & MAP_TYPE) != MAP_SHARED)
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
894
  	if (!len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
895
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
896
  	/* Careful about overflows.. */
8feae1311   David Howells   NOMMU: Make VMAs ...
897
898
  	rlen = PAGE_ALIGN(len);
  	if (!rlen || rlen > TASK_SIZE)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
899
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
900
  	/* offset overflow? */
8feae1311   David Howells   NOMMU: Make VMAs ...
901
  	if ((pgoff + (rlen >> PAGE_SHIFT)) < pgoff)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
902
  		return -EOVERFLOW;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
  
  	if (file) {
  		/* validate file mapping requests */
  		struct address_space *mapping;
  
  		/* files must support mmap */
  		if (!file->f_op || !file->f_op->mmap)
  			return -ENODEV;
  
  		/* work out if what we've got could possibly be shared
  		 * - we support chardevs that provide their own "memory"
  		 * - we support files/blockdevs that are memory backed
  		 */
  		mapping = file->f_mapping;
  		if (!mapping)
496ad9aa8   Al Viro   new helper: file_...
918
  			mapping = file_inode(file)->i_mapping;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
919
920
921
922
923
924
925
926
  
  		capabilities = 0;
  		if (mapping && mapping->backing_dev_info)
  			capabilities = mapping->backing_dev_info->capabilities;
  
  		if (!capabilities) {
  			/* no explicit capabilities set, so assume some
  			 * defaults */
496ad9aa8   Al Viro   new helper: file_...
927
  			switch (file_inode(file)->i_mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
  			case S_IFREG:
  			case S_IFBLK:
  				capabilities = BDI_CAP_MAP_COPY;
  				break;
  
  			case S_IFCHR:
  				capabilities =
  					BDI_CAP_MAP_DIRECT |
  					BDI_CAP_READ_MAP |
  					BDI_CAP_WRITE_MAP;
  				break;
  
  			default:
  				return -EINVAL;
  			}
  		}
  
  		/* eliminate any capabilities that we can't support on this
  		 * device */
  		if (!file->f_op->get_unmapped_area)
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		if (!file->f_op->read)
  			capabilities &= ~BDI_CAP_MAP_COPY;
28d7a6ae9   Graff Yang   nommu: check fd r...
951
952
953
  		/* The file shall have been opened with read permission. */
  		if (!(file->f_mode & FMODE_READ))
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
954
955
956
957
958
  		if (flags & MAP_SHARED) {
  			/* do checks for writing, appending and locking */
  			if ((prot & PROT_WRITE) &&
  			    !(file->f_mode & FMODE_WRITE))
  				return -EACCES;
496ad9aa8   Al Viro   new helper: file_...
959
  			if (IS_APPEND(file_inode(file)) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
960
961
  			    (file->f_mode & FMODE_WRITE))
  				return -EACCES;
496ad9aa8   Al Viro   new helper: file_...
962
  			if (locks_verify_locked(file_inode(file)))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
963
964
965
966
  				return -EAGAIN;
  
  			if (!(capabilities & BDI_CAP_MAP_DIRECT))
  				return -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
967
968
969
970
971
972
973
974
975
976
977
978
979
980
  			/* we mustn't privatise shared mappings */
  			capabilities &= ~BDI_CAP_MAP_COPY;
  		}
  		else {
  			/* we're going to read the file into private memory we
  			 * allocate */
  			if (!(capabilities & BDI_CAP_MAP_COPY))
  				return -ENODEV;
  
  			/* we don't permit a private writable mapping to be
  			 * shared with the backing device */
  			if (prot & PROT_WRITE)
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
3c7b20454   Bernd Schmidt   nommu: allow priv...
981
982
983
984
985
986
987
988
989
990
991
992
993
994
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
  			if (((prot & PROT_READ)  && !(capabilities & BDI_CAP_READ_MAP))  ||
  			    ((prot & PROT_WRITE) && !(capabilities & BDI_CAP_WRITE_MAP)) ||
  			    ((prot & PROT_EXEC)  && !(capabilities & BDI_CAP_EXEC_MAP))
  			    ) {
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  				if (flags & MAP_SHARED) {
  					printk(KERN_WARNING
  					       "MAP_SHARED not completely supported on !MMU
  ");
  					return -EINVAL;
  				}
  			}
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
995
996
  		/* handle executable mappings and implied executable
  		 * mappings */
e9536ae72   Josef Sipek   [PATCH] struct pa...
997
  		if (file->f_path.mnt->mnt_flags & MNT_NOEXEC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
  			if (prot & PROT_EXEC)
  				return -EPERM;
  		}
  		else if ((prot & PROT_READ) && !(prot & PROT_EXEC)) {
  			/* handle implication of PROT_EXEC by PROT_READ */
  			if (current->personality & READ_IMPLIES_EXEC) {
  				if (capabilities & BDI_CAP_EXEC_MAP)
  					prot |= PROT_EXEC;
  			}
  		}
  		else if ((prot & PROT_READ) &&
  			 (prot & PROT_EXEC) &&
  			 !(capabilities & BDI_CAP_EXEC_MAP)
  			 ) {
  			/* backing file is not executable, try to copy */
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
  	}
  	else {
  		/* anonymous mappings are always memory backed and can be
  		 * privately mapped
  		 */
  		capabilities = BDI_CAP_MAP_COPY;
  
  		/* handle PROT_EXEC implication by PROT_READ */
  		if ((prot & PROT_READ) &&
  		    (current->personality & READ_IMPLIES_EXEC))
  			prot |= PROT_EXEC;
  	}
  
  	/* allow the security API to have its say */
e5467859f   Al Viro   split ->file_mmap...
1029
1030
1031
  	ret = security_mmap_addr(addr);
  	if (ret < 0)
  		return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
  
  	/* looks okay */
  	*_capabilities = capabilities;
  	return 0;
  }
  
  /*
   * we've determined that we can make the mapping, now translate what we
   * now know into VMA flags
   */
  static unsigned long determine_vm_flags(struct file *file,
  					unsigned long prot,
  					unsigned long flags,
  					unsigned long capabilities)
  {
  	unsigned long vm_flags;
  
  	vm_flags = calc_vm_prot_bits(prot) | calc_vm_flag_bits(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1050
1051
1052
1053
  	/* vm_flags |= mm->def_flags; */
  
  	if (!(capabilities & BDI_CAP_MAP_DIRECT)) {
  		/* attempt to share read-only copies of mapped file chunks */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1054
  		vm_flags |= VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1055
1056
  		if (file && !(prot & PROT_WRITE))
  			vm_flags |= VM_MAYSHARE;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1057
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1058
1059
1060
  		/* overlay a shareable mapping on the backing device or inode
  		 * if possible - used for chardevs, ramfs/tmpfs/shmfs and
  		 * romfs/cramfs */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1061
  		vm_flags |= VM_MAYSHARE | (capabilities & BDI_CAP_VMFLAGS);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1062
  		if (flags & MAP_SHARED)
3c7b20454   Bernd Schmidt   nommu: allow priv...
1063
  			vm_flags |= VM_SHARED;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1064
1065
1066
1067
1068
1069
  	}
  
  	/* refuse to let anyone share private mappings with this process if
  	 * it's being traced - otherwise breakpoints set in it may interfere
  	 * with another untraced process
  	 */
a288eecce   Tejun Heo   ptrace: kill triv...
1070
  	if ((flags & MAP_PRIVATE) && current->ptrace)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1071
1072
1073
1074
1075
1076
  		vm_flags &= ~VM_MAYSHARE;
  
  	return vm_flags;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1077
1078
   * set up a shared mapping on a file (the driver or filesystem provides and
   * pins the storage)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1079
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1080
  static int do_mmap_shared_file(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1081
1082
1083
1084
  {
  	int ret;
  
  	ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1085
1086
  	if (ret == 0) {
  		vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1087
  		return 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1088
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1089
1090
  	if (ret != -ENOSYS)
  		return ret;
3fa30460e   David Howells   nommu: fix an inc...
1091
1092
1093
  	/* getting -ENOSYS indicates that direct mmap isn't possible (as
  	 * opposed to tried but failed) so we can only give a suitable error as
  	 * it's not possible to make a private copy if MAP_SHARED was given */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1094
1095
1096
1097
1098
1099
  	return -ENODEV;
  }
  
  /*
   * set up a private mapping or an anonymous shared mapping
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1100
1101
  static int do_mmap_private(struct vm_area_struct *vma,
  			   struct vm_region *region,
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1102
1103
  			   unsigned long len,
  			   unsigned long capabilities)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1104
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1105
  	struct page *pages;
f67d9b157   Bob Liu   nommu: add page a...
1106
  	unsigned long total, point, n;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1107
  	void *base;
8feae1311   David Howells   NOMMU: Make VMAs ...
1108
  	int ret, order;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1109
1110
1111
1112
1113
  
  	/* invoke the file's mapping function so that it can keep track of
  	 * shared mappings on devices or memory
  	 * - VM_MAYSHARE will be set if it may attempt to share
  	 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1114
  	if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1115
  		ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1116
  		if (ret == 0) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1117
  			/* shouldn't return success if we're not sharing */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1118
1119
  			BUG_ON(!(vma->vm_flags & VM_MAYSHARE));
  			vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1120
  			return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1121
  		}
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1122
1123
  		if (ret != -ENOSYS)
  			return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1124
1125
1126
1127
1128
  
  		/* getting an ENOSYS error indicates that direct mmap isn't
  		 * possible (as opposed to tried but failed) so we'll try to
  		 * make a private copy of the data and map that instead */
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1129

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1130
1131
1132
1133
  	/* allocate some memory to hold the mapping
  	 * - note that this may not return a page-aligned address if the object
  	 *   we're allocating is smaller than a page
  	 */
f67d9b157   Bob Liu   nommu: add page a...
1134
  	order = get_order(len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1135
1136
1137
1138
  	kdebug("alloc order %d for %lx", order, len);
  
  	pages = alloc_pages(GFP_KERNEL, order);
  	if (!pages)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1139
  		goto enomem;
8feae1311   David Howells   NOMMU: Make VMAs ...
1140
  	total = 1 << order;
33e5d7697   David Howells   nommu: fix a numb...
1141
  	atomic_long_add(total, &mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
1142

f67d9b157   Bob Liu   nommu: add page a...
1143
  	point = len >> PAGE_SHIFT;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1144
1145
1146
1147
1148
1149
1150
1151
  
  	/* we allocated a power-of-2 sized page set, so we may want to trim off
  	 * the excess */
  	if (sysctl_nr_trim_pages && total - point >= sysctl_nr_trim_pages) {
  		while (total > point) {
  			order = ilog2(total - point);
  			n = 1 << order;
  			kdebug("shave %lu/%lu @%lu", n, total - point, total);
33e5d7697   David Howells   nommu: fix a numb...
1152
  			atomic_long_sub(n, &mmap_pages_allocated);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1153
1154
1155
1156
  			total -= n;
  			set_page_refcounted(pages + total);
  			__free_pages(pages + total, order);
  		}
8feae1311   David Howells   NOMMU: Make VMAs ...
1157
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1158
1159
  	for (point = 1; point < total; point++)
  		set_page_refcounted(&pages[point]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1160

8feae1311   David Howells   NOMMU: Make VMAs ...
1161
1162
1163
  	base = page_address(pages);
  	region->vm_flags = vma->vm_flags |= VM_MAPPED_COPY;
  	region->vm_start = (unsigned long) base;
f67d9b157   Bob Liu   nommu: add page a...
1164
  	region->vm_end   = region->vm_start + len;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1165
  	region->vm_top   = region->vm_start + (total << PAGE_SHIFT);
8feae1311   David Howells   NOMMU: Make VMAs ...
1166
1167
1168
  
  	vma->vm_start = region->vm_start;
  	vma->vm_end   = region->vm_start + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
  
  	if (vma->vm_file) {
  		/* read the contents of a file into the copy */
  		mm_segment_t old_fs;
  		loff_t fpos;
  
  		fpos = vma->vm_pgoff;
  		fpos <<= PAGE_SHIFT;
  
  		old_fs = get_fs();
  		set_fs(KERNEL_DS);
f67d9b157   Bob Liu   nommu: add page a...
1180
  		ret = vma->vm_file->f_op->read(vma->vm_file, base, len, &fpos);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1181
1182
1183
1184
1185
1186
  		set_fs(old_fs);
  
  		if (ret < 0)
  			goto error_free;
  
  		/* clear the last little bit */
f67d9b157   Bob Liu   nommu: add page a...
1187
1188
  		if (ret < len)
  			memset(base + ret, 0, len - ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1189

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1190
1191
1192
1193
1194
  	}
  
  	return 0;
  
  error_free:
7223bb4a8   Namhyung Kim   mm: nommu: fix a ...
1195
  	free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
1196
1197
  	region->vm_start = vma->vm_start = 0;
  	region->vm_end   = vma->vm_end = 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1198
  	region->vm_top   = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1199
1200
1201
  	return ret;
  
  enomem:
05ae6fa31   Greg Ungerer   uclinux: add proc...
1202
1203
1204
  	printk("Allocation of length %lu from process %d (%s) failed
  ",
  	       len, current->pid, current->comm);
7bf02ea22   David Rientjes   arch, mm: filter ...
1205
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1206
1207
1208
1209
1210
1211
  	return -ENOMEM;
  }
  
  /*
   * handle mapping creation for uClinux
   */
e3fc629d7   Al Viro   switch aio and sh...
1212
  unsigned long do_mmap_pgoff(struct file *file,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1213
1214
1215
1216
  			    unsigned long addr,
  			    unsigned long len,
  			    unsigned long prot,
  			    unsigned long flags,
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1217
  			    unsigned long pgoff,
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1218
  			    unsigned long *populate)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1219
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1220
1221
  	struct vm_area_struct *vma;
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1222
  	struct rb_node *rb;
8feae1311   David Howells   NOMMU: Make VMAs ...
1223
  	unsigned long capabilities, vm_flags, result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1224
  	int ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1225
  	kenter(",%lx,%lx,%lx,%lx,%lx", addr, len, prot, flags, pgoff);
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1226
  	*populate = 0;
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1227

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1228
1229
1230
1231
  	/* decide whether we should attempt the mapping, and if so what sort of
  	 * mapping */
  	ret = validate_mmap_request(file, addr, len, prot, flags, pgoff,
  				    &capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1232
1233
  	if (ret < 0) {
  		kleave(" = %d [val]", ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1234
  		return ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1235
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1236

06aab5a30   David Howells   NOMMU: Ignore mma...
1237
1238
  	/* we ignore the address hint */
  	addr = 0;
f67d9b157   Bob Liu   nommu: add page a...
1239
  	len = PAGE_ALIGN(len);
06aab5a30   David Howells   NOMMU: Ignore mma...
1240

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1241
1242
1243
  	/* we've determined that we can make the mapping, now translate what we
  	 * now know into VMA flags */
  	vm_flags = determine_vm_flags(file, prot, flags, capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1244
1245
1246
1247
1248
1249
1250
1251
  	/* we're going to need to record the mapping */
  	region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		goto error_getting_region;
  
  	vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
  	if (!vma)
  		goto error_getting_vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1252

1e2ae599d   David Howells   nommu: struct vm_...
1253
  	region->vm_usage = 1;
8feae1311   David Howells   NOMMU: Make VMAs ...
1254
1255
  	region->vm_flags = vm_flags;
  	region->vm_pgoff = pgoff;
5beb49305   Rik van Riel   mm: change anon_v...
1256
  	INIT_LIST_HEAD(&vma->anon_vma_chain);
8feae1311   David Howells   NOMMU: Make VMAs ...
1257
1258
  	vma->vm_flags = vm_flags;
  	vma->vm_pgoff = pgoff;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1259

8feae1311   David Howells   NOMMU: Make VMAs ...
1260
  	if (file) {
cb0942b81   Al Viro   make get_file() r...
1261
1262
  		region->vm_file = get_file(file);
  		vma->vm_file = get_file(file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1263
1264
1265
1266
1267
  	}
  
  	down_write(&nommu_region_sem);
  
  	/* if we want to share, we need to check for regions created by other
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1268
  	 * mmap() calls that overlap with our proposed mapping
8feae1311   David Howells   NOMMU: Make VMAs ...
1269
  	 * - we can only share with a superset match on most regular files
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1270
1271
1272
1273
1274
1275
  	 * - shared mappings on character devices and memory backed files are
  	 *   permitted to overlap inexactly as far as we are concerned for in
  	 *   these cases, sharing is handled in the driver or filesystem rather
  	 *   than here
  	 */
  	if (vm_flags & VM_MAYSHARE) {
8feae1311   David Howells   NOMMU: Make VMAs ...
1276
1277
  		struct vm_region *pregion;
  		unsigned long pglen, rpglen, pgend, rpgend, start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1278

8feae1311   David Howells   NOMMU: Make VMAs ...
1279
1280
  		pglen = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
  		pgend = pgoff + pglen;
165b23927   David Howells   [PATCH] NOMMU: ma...
1281

8feae1311   David Howells   NOMMU: Make VMAs ...
1282
1283
  		for (rb = rb_first(&nommu_region_tree); rb; rb = rb_next(rb)) {
  			pregion = rb_entry(rb, struct vm_region, vm_rb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1284

8feae1311   David Howells   NOMMU: Make VMAs ...
1285
  			if (!(pregion->vm_flags & VM_MAYSHARE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1286
1287
1288
  				continue;
  
  			/* search for overlapping mappings on the same file */
496ad9aa8   Al Viro   new helper: file_...
1289
1290
  			if (file_inode(pregion->vm_file) !=
  			    file_inode(file))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1291
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1292
  			if (pregion->vm_pgoff >= pgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1293
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1294
1295
1296
1297
  			rpglen = pregion->vm_end - pregion->vm_start;
  			rpglen = (rpglen + PAGE_SIZE - 1) >> PAGE_SHIFT;
  			rpgend = pregion->vm_pgoff + rpglen;
  			if (pgoff >= rpgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1298
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1299
1300
1301
1302
1303
  			/* handle inexactly overlapping matches between
  			 * mappings */
  			if ((pregion->vm_pgoff != pgoff || rpglen != pglen) &&
  			    !(pgoff >= pregion->vm_pgoff && pgend <= rpgend)) {
  				/* new mapping is not a subset of the region */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1304
1305
1306
1307
  				if (!(capabilities & BDI_CAP_MAP_DIRECT))
  					goto sharing_violation;
  				continue;
  			}
8feae1311   David Howells   NOMMU: Make VMAs ...
1308
  			/* we've found a region we can share */
1e2ae599d   David Howells   nommu: struct vm_...
1309
  			pregion->vm_usage++;
8feae1311   David Howells   NOMMU: Make VMAs ...
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
  			vma->vm_region = pregion;
  			start = pregion->vm_start;
  			start += (pgoff - pregion->vm_pgoff) << PAGE_SHIFT;
  			vma->vm_start = start;
  			vma->vm_end = start + len;
  
  			if (pregion->vm_flags & VM_MAPPED_COPY) {
  				kdebug("share copy");
  				vma->vm_flags |= VM_MAPPED_COPY;
  			} else {
  				kdebug("share mmap");
  				ret = do_mmap_shared_file(vma);
  				if (ret < 0) {
  					vma->vm_region = NULL;
  					vma->vm_start = 0;
  					vma->vm_end = 0;
1e2ae599d   David Howells   nommu: struct vm_...
1326
  					pregion->vm_usage--;
8feae1311   David Howells   NOMMU: Make VMAs ...
1327
1328
1329
1330
1331
1332
1333
1334
1335
  					pregion = NULL;
  					goto error_just_free;
  				}
  			}
  			fput(region->vm_file);
  			kmem_cache_free(vm_region_jar, region);
  			region = pregion;
  			result = start;
  			goto share;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1336
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1337
1338
1339
1340
  		/* obtain the address at which to make a shared mapping
  		 * - this is the hook for quasi-memory character devices to
  		 *   tell us the location of a shared mapping
  		 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1341
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1342
1343
  			addr = file->f_op->get_unmapped_area(file, addr, len,
  							     pgoff, flags);
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1344
  			if (IS_ERR_VALUE(addr)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1345
  				ret = addr;
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1346
  				if (ret != -ENOSYS)
8feae1311   David Howells   NOMMU: Make VMAs ...
1347
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1348
1349
1350
1351
  
  				/* the driver refused to tell us where to site
  				 * the mapping so we'll have to attempt to copy
  				 * it */
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1352
  				ret = -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1353
  				if (!(capabilities & BDI_CAP_MAP_COPY))
8feae1311   David Howells   NOMMU: Make VMAs ...
1354
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1355
1356
  
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1357
1358
1359
  			} else {
  				vma->vm_start = region->vm_start = addr;
  				vma->vm_end = region->vm_end = addr + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1360
1361
1362
  			}
  		}
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1363
  	vma->vm_region = region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1364

645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1365
1366
1367
  	/* set up the mapping
  	 * - the region is filled in if BDI_CAP_MAP_DIRECT is still set
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1368
  	if (file && vma->vm_flags & VM_SHARED)
8feae1311   David Howells   NOMMU: Make VMAs ...
1369
  		ret = do_mmap_shared_file(vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1370
  	else
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1371
  		ret = do_mmap_private(vma, region, len, capabilities);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1372
  	if (ret < 0)
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1373
1374
  		goto error_just_free;
  	add_nommu_region(region);
8feae1311   David Howells   NOMMU: Make VMAs ...
1375

ea6376395   Jie Zhang   nommu: fix malloc...
1376
1377
1378
1379
  	/* clear anonymous mappings that don't ask for uninitialized data */
  	if (!vma->vm_file && !(flags & MAP_UNINITIALIZED))
  		memset((void *)region->vm_start, 0,
  		       region->vm_end - region->vm_start);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1380
  	/* okay... we have a mapping; now we have to register it */
8feae1311   David Howells   NOMMU: Make VMAs ...
1381
  	result = vma->vm_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1382

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1383
  	current->mm->total_vm += len >> PAGE_SHIFT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1384
1385
  share:
  	add_vma_to_mm(current->mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1386

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1387
1388
1389
1390
1391
1392
  	/* we flush the region from the icache only when the first executable
  	 * mapping of it is made  */
  	if (vma->vm_flags & VM_EXEC && !region->vm_icache_flushed) {
  		flush_icache_range(region->vm_start, region->vm_end);
  		region->vm_icache_flushed = true;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1393

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1394
  	up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1395

8feae1311   David Howells   NOMMU: Make VMAs ...
1396
1397
  	kleave(" = %lx", result);
  	return result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1398

8feae1311   David Howells   NOMMU: Make VMAs ...
1399
1400
1401
  error_just_free:
  	up_write(&nommu_region_sem);
  error:
89a864027   David Howells   NOMMU: Don't pass...
1402
1403
  	if (region->vm_file)
  		fput(region->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1404
  	kmem_cache_free(vm_region_jar, region);
89a864027   David Howells   NOMMU: Don't pass...
1405
1406
  	if (vma->vm_file)
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
  	kmem_cache_free(vm_area_cachep, vma);
  	kleave(" = %d", ret);
  	return ret;
  
  sharing_violation:
  	up_write(&nommu_region_sem);
  	printk(KERN_WARNING "Attempt to share mismatched mappings
  ");
  	ret = -EINVAL;
  	goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1417

8feae1311   David Howells   NOMMU: Make VMAs ...
1418
1419
1420
1421
1422
  error_getting_vma:
  	kmem_cache_free(vm_region_jar, region);
  	printk(KERN_WARNING "Allocation of vma for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1423
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1424
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1425
  	return -ENOMEM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1426
1427
1428
1429
  error_getting_region:
  	printk(KERN_WARNING "Allocation of vm region for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1430
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1431
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1432
1433
  	return -ENOMEM;
  }
6be5ceb02   Linus Torvalds   VM: add "vm_mmap(...
1434

66f0dc481   Hugh Dickins   mm: move sys_mmap...
1435
1436
1437
1438
1439
1440
  /*
   * mmap_pgoff system call: create a mapping, with the file offset expressed
   * in pages.
   *
   * Unless MAP_ANONYMOUS is set, @fd is resolved with fget() and -EBADF is
   * returned if that yields no file.  MAP_EXECUTABLE and MAP_DENYWRITE are
   * stripped from @flags before the request is passed to vm_mmap_pgoff(),
   * whose result is returned.  Any file reference taken here is dropped again
   * before returning.
   */
  SYSCALL_DEFINE6(mmap_pgoff, unsigned long, addr, unsigned long, len,
  		unsigned long, prot, unsigned long, flags,
  		unsigned long, fd, unsigned long, pgoff)
  {
  	struct file *filp = NULL;
  	unsigned long result;

  	audit_mmap_fd(fd, flags);

  	/* a non-anonymous request needs the file behind the descriptor */
  	if (!(flags & MAP_ANONYMOUS)) {
  		filp = fget(fd);
  		if (!filp)
  			return -EBADF;
  	}

  	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);
  	result = vm_mmap_pgoff(filp, addr, len, prot, flags, pgoff);

  	if (filp)
  		fput(filp);
  	return result;
  }
a4679373c   Christoph Hellwig   Add generic sys_o...
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
  #ifdef __ARCH_WANT_SYS_OLD_MMAP
  /* argument block that old_mmap copies in from userspace */
  struct mmap_arg_struct {
  	unsigned long addr;
  	unsigned long len;
  	unsigned long prot;
  	unsigned long flags;
  	unsigned long fd;
  	unsigned long offset;
  };

  /*
   * old_mmap system call: all arguments arrive in one user-space structure.
   *
   * Returns -EFAULT if the structure cannot be copied in and -EINVAL if the
   * byte offset has bits set below the page size; otherwise the offset is
   * converted to pages and the request is forwarded to sys_mmap_pgoff().
   */
  SYSCALL_DEFINE1(old_mmap, struct mmap_arg_struct __user *, arg)
  {
  	struct mmap_arg_struct args;

  	if (copy_from_user(&args, arg, sizeof(args)) != 0)
  		return -EFAULT;

  	/* the byte offset has to be page aligned */
  	if ((args.offset & ~PAGE_MASK) != 0)
  		return -EINVAL;

  	return sys_mmap_pgoff(args.addr, args.len, args.prot, args.flags,
  			      args.fd, args.offset >> PAGE_SHIFT);
  }
  #endif /* __ARCH_WANT_SYS_OLD_MMAP */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1479
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1480
1481
   * split a vma into two pieces at address 'addr', a new vma is allocated either
   * for the first part or the tail.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1482
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1483
1484
  int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
  	      unsigned long addr, int new_below)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1485
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1486
1487
1488
  	struct vm_area_struct *new;
  	struct vm_region *region;
  	unsigned long npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1489

8feae1311   David Howells   NOMMU: Make VMAs ...
1490
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1491

779c10232   David Howells   nommu: remove a s...
1492
1493
1494
  	/* we're only permitted to split anonymous regions (these should have
  	 * only a single usage on the region) */
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
1495
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1496

8feae1311   David Howells   NOMMU: Make VMAs ...
1497
1498
  	if (mm->map_count >= sysctl_max_map_count)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1499

8feae1311   David Howells   NOMMU: Make VMAs ...
1500
1501
1502
  	region = kmem_cache_alloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1503

8feae1311   David Howells   NOMMU: Make VMAs ...
1504
1505
1506
1507
1508
1509
1510
1511
1512
1513
1514
1515
1516
1517
  	new = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
  	if (!new) {
  		kmem_cache_free(vm_region_jar, region);
  		return -ENOMEM;
  	}
  
  	/* most fields are the same, copy all, and then fixup */
  	*new = *vma;
  	*region = *vma->vm_region;
  	new->vm_region = region;
  
  	npages = (addr - vma->vm_start) >> PAGE_SHIFT;
  
  	if (new_below) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1518
  		region->vm_top = region->vm_end = new->vm_end = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1519
1520
1521
  	} else {
  		region->vm_start = new->vm_start = addr;
  		region->vm_pgoff = new->vm_pgoff += npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1522
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
  
  	if (new->vm_ops && new->vm_ops->open)
  		new->vm_ops->open(new);
  
  	delete_vma_from_mm(vma);
  	down_write(&nommu_region_sem);
  	delete_nommu_region(vma->vm_region);
  	if (new_below) {
  		vma->vm_region->vm_start = vma->vm_start = addr;
  		vma->vm_region->vm_pgoff = vma->vm_pgoff += npages;
  	} else {
  		vma->vm_region->vm_end = vma->vm_end = addr;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1535
  		vma->vm_region->vm_top = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1536
1537
1538
1539
1540
1541
1542
  	}
  	add_nommu_region(vma->vm_region);
  	add_nommu_region(new->vm_region);
  	up_write(&nommu_region_sem);
  	add_vma_to_mm(mm, vma);
  	add_vma_to_mm(mm, new);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1543
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1544
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1545
1546
   * shrink a VMA by removing the specified chunk from either the beginning or
   * the end
3034097a5   David Howells   [PATCH] NOMMU: Or...
1547
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1548
1549
1550
  static int shrink_vma(struct mm_struct *mm,
  		      struct vm_area_struct *vma,
  		      unsigned long from, unsigned long to)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1551
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1552
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1553

8feae1311   David Howells   NOMMU: Make VMAs ...
1554
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1555

8feae1311   David Howells   NOMMU: Make VMAs ...
1556
1557
1558
1559
1560
1561
1562
1563
  	/* adjust the VMA's pointers, which may reposition it in the MM's tree
  	 * and list */
  	delete_vma_from_mm(vma);
  	if (from > vma->vm_start)
  		vma->vm_end = from;
  	else
  		vma->vm_start = to;
  	add_vma_to_mm(mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1564

8feae1311   David Howells   NOMMU: Make VMAs ...
1565
1566
  	/* cut the backing region down to size */
  	region = vma->vm_region;
1e2ae599d   David Howells   nommu: struct vm_...
1567
  	BUG_ON(region->vm_usage != 1);
8feae1311   David Howells   NOMMU: Make VMAs ...
1568
1569
1570
  
  	down_write(&nommu_region_sem);
  	delete_nommu_region(region);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1571
1572
1573
1574
  	if (from > region->vm_start) {
  		to = region->vm_top;
  		region->vm_top = region->vm_end = from;
  	} else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1575
  		region->vm_start = to;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1576
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1577
1578
1579
1580
1581
1582
  	add_nommu_region(region);
  	up_write(&nommu_region_sem);
  
  	free_page_series(from, to);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1583

8feae1311   David Howells   NOMMU: Make VMAs ...
1584
1585
1586
1587
1588
1589
1590
1591
  /*
   * release a mapping
   * - under NOMMU conditions the chunk to be unmapped must be backed by a single
   *   VMA, though it need not cover the whole VMA
   * - a file-backed VMA can only be released whole; an anonymous VMA may also
   *   be split and/or shrunk
   *
   * Returns 0 on success, -EINVAL for a zero length or a range that does not
   * match the rules above, or the error from split_vma().
   */
  int do_munmap(struct mm_struct *mm, unsigned long start, size_t len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end;
  	int ret;

  	kenter(",%lx,%zx", start, len);

  	len = PAGE_ALIGN(len);
  	if (len == 0)
  		return -EINVAL;

  	end = start + len;

  	/* find the first potentially overlapping VMA */
  	vma = find_vma(mm, start);
  	if (!vma) {
  		/* only the first few misses are logged */
  		static int warned = 0;

  		if (warned < 5) {
  			printk(KERN_WARNING
  			       "munmap of memory not mmapped by process %d"
  			       " (%s): 0x%lx-0x%lx\n",
  			       current->pid, current->comm,
  			       start, end - 1);
  			warned++;
  		}
  		return -EINVAL;
  	}

  	/* we're allowed to split an anonymous VMA but not a file-backed one */
  	if (!vma->vm_file) {
  		/* the chunk must be a subset of the VMA found */
  		if (start == vma->vm_start && end == vma->vm_end)
  			goto erase_whole_vma;
  		if (start < vma->vm_start || end > vma->vm_end) {
  			kleave(" = -EINVAL [superset]");
  			return -EINVAL;
  		}
  		if (start & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned start]");
  			return -EINVAL;
  		}
  		if (end != vma->vm_end && end & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned split]");
  			return -EINVAL;
  		}
  		/* a hole in the middle needs the VMA split at 'start' first */
  		if (start != vma->vm_start && end != vma->vm_end) {
  			ret = split_vma(mm, vma, start, 1);
  			if (ret < 0) {
  				kleave(" = %d [split]", ret);
  				return ret;
  			}
  		}
  		return shrink_vma(mm, vma, start, end);
  	}

  	/* file-backed: walk the VMA list looking for one that ends exactly
  	 * at 'end' without starting before 'start' */
  	for (; vma; vma = vma->vm_next) {
  		if (start > vma->vm_start) {
  			kleave(" = -EINVAL [miss]");
  			return -EINVAL;
  		}
  		if (end == vma->vm_end)
  			goto erase_whole_vma;
  	}
  	kleave(" = -EINVAL [split file]");
  	return -EINVAL;

  erase_whole_vma:
  	delete_vma_from_mm(vma);
  	delete_vma(mm, vma);
  	kleave(" = 0");
  	return 0;
  }
  EXPORT_SYMBOL(do_munmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1664

bfce281c2   Al Viro   kill mm argument ...
1665
  /*
   * Unmap [addr, addr + len) from the current process: do_munmap() is called
   * on current->mm with that mm's mmap_sem held for writing, and its result
   * is returned.
   */
  int vm_munmap(unsigned long addr, size_t len)
  {
  	struct mm_struct *cur_mm = current->mm;
  	int err;

  	down_write(&cur_mm->mmap_sem);
  	err = do_munmap(cur_mm, addr, len);
  	up_write(&cur_mm->mmap_sem);

  	return err;
  }
  EXPORT_SYMBOL(vm_munmap);
  
  /*
   * munmap system call: forwards straight to vm_munmap() and returns its
   * result.
   */
  SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
  {
  	int err = vm_munmap(addr, len);

  	return err;
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1681
1682
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1683
   * release all the mappings made in a process's VM space
3034097a5   David Howells   [PATCH] NOMMU: Or...
1684
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1685
  void exit_mmap(struct mm_struct *mm)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1686
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1687
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1688

8feae1311   David Howells   NOMMU: Make VMAs ...
1689
1690
  	if (!mm)
  		return;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1691

8feae1311   David Howells   NOMMU: Make VMAs ...
1692
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1693

8feae1311   David Howells   NOMMU: Make VMAs ...
1694
  	mm->total_vm = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1695

8feae1311   David Howells   NOMMU: Make VMAs ...
1696
1697
1698
1699
  	while ((vma = mm->mmap)) {
  		mm->mmap = vma->vm_next;
  		delete_vma_from_mm(vma);
  		delete_vma(mm, vma);
04c349615   Steven J. Magnani   nommu: yield CPU ...
1700
  		cond_resched();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1701
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1702
1703
  
  	kleave("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1704
  }
e4eb1ff61   Linus Torvalds   VM: add "vm_brk()...
1705
  /*
   * Stub: this implementation never performs the request.  Both arguments
   * are ignored and -ENOMEM (converted to unsigned long) is always returned.
   */
  unsigned long vm_brk(unsigned long addr, unsigned long len)
  {
  	return -ENOMEM;
  }
  
  /*
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1711
1712
   * expand (or shrink) an existing mapping, potentially moving it at the same
   * time (controlled by the MREMAP_MAYMOVE flag and available VM space)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1713
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1714
   * under NOMMU conditions, we only permit changing a mapping's size, and only
8feae1311   David Howells   NOMMU: Make VMAs ...
1715
1716
   * as long as it stays within the region allocated by do_mmap_private() and the
   * block is not shareable
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1717
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1718
   * MREMAP_FIXED is not supported under NOMMU conditions
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1719
   */
4b377bab2   Al Viro   make do_mremap() ...
1720
  static unsigned long do_mremap(unsigned long addr,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1721
1722
1723
  			unsigned long old_len, unsigned long new_len,
  			unsigned long flags, unsigned long new_addr)
  {
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1724
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1725
1726
  
  	/* insanity checks first */
f67d9b157   Bob Liu   nommu: add page a...
1727
1728
  	old_len = PAGE_ALIGN(old_len);
  	new_len = PAGE_ALIGN(new_len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1729
  	if (old_len == 0 || new_len == 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1730
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1731
1732
  	if (addr & ~PAGE_MASK)
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1733
1734
  	if (flags & MREMAP_FIXED && new_addr != addr)
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1735
  	vma = find_vma_exact(current->mm, addr, old_len);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1736
1737
  	if (!vma)
  		return (unsigned long) -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1738

6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1739
  	if (vma->vm_end != vma->vm_start + old_len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1740
  		return (unsigned long) -EFAULT;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1741
  	if (vma->vm_flags & VM_MAYSHARE)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1742
  		return (unsigned long) -EPERM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1743
  	if (new_len > vma->vm_region->vm_end - vma->vm_region->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1744
1745
1746
  		return (unsigned long) -ENOMEM;
  
  	/* all checks complete - do it */
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1747
  	vma->vm_end = vma->vm_start + new_len;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1748
1749
  	return vma->vm_start;
  }
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1750
1751
1752
  /*
   * mremap system call: runs do_mremap() with the current process's mmap_sem
   * held for writing and returns its result.
   */
  SYSCALL_DEFINE5(mremap, unsigned long, addr, unsigned long, old_len,
  		unsigned long, new_len, unsigned long, flags,
  		unsigned long, new_addr)
  {
  	struct mm_struct *cur_mm = current->mm;
  	unsigned long result;

  	down_write(&cur_mm->mmap_sem);
  	result = do_mremap(addr, old_len, new_len, flags, new_addr);
  	up_write(&cur_mm->mmap_sem);

  	return result;
  }
240aadeed   Michel Lespinasse   mm: accelerate mm...
1761
1762
1763
  /*
   * Stub: no page is ever looked up here.  *page_mask is set to 0 and NULL is
   * returned; the remaining arguments are ignored.
   */
  struct page *follow_page_mask(struct vm_area_struct *vma,
  			      unsigned long address, unsigned int flags,
  			      unsigned int *page_mask)
  {
  	*page_mask = 0;

  	return NULL;
  }
8f3b1327a   Bob Liu   mm/nommu.c: fix r...
1768
1769
  /*
   * Accept a PFN mapping request only when the target address is identical
   * to the address of the page frame itself (pfn << PAGE_SHIFT); nothing is
   * actually remapped.  On success the VMA is flagged VM_IO, VM_PFNMAP,
   * VM_DONTEXPAND and VM_DONTDUMP.  'size' and 'prot' are not used.
   *
   * Returns 0 on success or -EINVAL if the addresses differ.
   */
  int remap_pfn_range(struct vm_area_struct *vma, unsigned long addr,
  		unsigned long pfn, unsigned long size, pgprot_t prot)
  {
  	unsigned long frame_addr = pfn << PAGE_SHIFT;

  	if (frame_addr != addr)
  		return -EINVAL;

  	vma->vm_flags |= VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_DONTDUMP;
  	return 0;
  }
  EXPORT_SYMBOL(remap_pfn_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1777

3c0b9de6d   Linus Torvalds   vm: add no-mmu vm...
1778
1779
1780
1781
1782
1783
1784
1785
1786
  /*
   * Map the whole of 'vma' onto I/O memory: the first page frame is derived
   * from 'start' plus the VMA's page offset, and the full length of the VMA
   * is passed to io_remap_pfn_range().  'len' is not consulted.
   *
   * Returns whatever io_remap_pfn_range() returns.
   */
  int vm_iomap_memory(struct vm_area_struct *vma, phys_addr_t start, unsigned long len)
  {
  	unsigned long span = vma->vm_end - vma->vm_start;
  	unsigned long first_pfn = start >> PAGE_SHIFT;

  	first_pfn += vma->vm_pgoff;

  	return io_remap_pfn_range(vma, vma->vm_start, first_pfn, span,
  				  vma->vm_page_prot);
  }
  EXPORT_SYMBOL(vm_iomap_memory);
f905bc447   Paul Mundt   nommu: add new vm...
1787
1788
1789
1790
1791
1792
1793
1794
1795
1796
1797
1798
1799
1800
  /*
   * Point 'vma' at memory starting 'pgoff' pages into the area at 'addr'.
   * Nothing is copied or remapped: the VMA's start is simply rewritten to
   * the target address and its end is moved so the length is preserved.
   *
   * Returns 0 on success or -EINVAL if the VMA does not have VM_USERMAP set.
   */
  int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
  			unsigned long pgoff)
  {
  	/* vm_start/vm_end are unsigned long; keep the full width so that a
  	 * length above UINT_MAX is not truncated where long is 64 bits */
  	unsigned long size = vma->vm_end - vma->vm_start;

  	if (!(vma->vm_flags & VM_USERMAP))
  		return -EINVAL;

  	vma->vm_start = (unsigned long)(addr + (pgoff << PAGE_SHIFT));
  	vma->vm_end = vma->vm_start + size;

  	return 0;
  }
  EXPORT_SYMBOL(remap_vmalloc_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1801
1802
1803
1804
1805
  /*
   * Stub: no address is ever chosen here.  All arguments are ignored and
   * -ENOMEM (converted to unsigned long) is always returned.
   */
  unsigned long arch_get_unmapped_area(struct file *file, unsigned long addr,
  	unsigned long len, unsigned long pgoff, unsigned long flags)
  {
  	return -ENOMEM;
  }
1363c3cd8   Wolfgang Wander   [PATCH] Avoiding ...
1806
  /* Stub: intentionally does nothing; both arguments are ignored. */
  void arch_unmap_area(struct mm_struct *mm, unsigned long addr)
  {
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1809
1810
1811
1812
1813
  /* Stub: intentionally does nothing; every argument is ignored. */
  void unmap_mapping_range(struct address_space *mapping,
  			 loff_t const holebegin, loff_t const holelen,
  			 int even_cows)
  {
  }
  EXPORT_SYMBOL(unmap_mapping_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1815
1816
1817
1818
1819
1820
1821
1822
1823
1824
1825
1826
1827
1828
1829
1830
1831
  
  /*
   * Check that a process has enough memory to allocate a new virtual
   * mapping. 0 means there is enough memory for the allocation to
   * succeed and -ENOMEM implies there is not.
   *
   * We currently support three overcommit policies, which are set via the
   * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting
   *
   * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
   * Additional code 2002 Jul 20 by Robert Love.
   *
   * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
   *
   * Note this is a helper function intended to be used by LSMs which
   * wish to use this logic.
   */
34b4e4aa3   Alan Cox   fix NULL pointer ...
1832
  int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1833
  {
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1834
  	unsigned long free, allowed, reserve;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1835
1836
1837
1838
1839
1840
1841
1842
1843
1844
  
  	vm_acct_memory(pages);
  
  	/*
  	 * Sometimes we want to use more memory than we have
  	 */
  	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
  		return 0;
  
  	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
c15bef309   Dmitry Fink   mmap: fix and tid...
1845
1846
1847
1848
1849
1850
1851
1852
1853
1854
  		free = global_page_state(NR_FREE_PAGES);
  		free += global_page_state(NR_FILE_PAGES);
  
  		/*
  		 * shmem pages shouldn't be counted as free in this
  		 * case, they can't be purged, only swapped out, and
  		 * that won't affect the overall amount of available
  		 * memory in the system.
  		 */
  		free -= global_page_state(NR_SHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1855

ec8acf20a   Shaohua Li   swap: add per-par...
1856
  		free += get_nr_swap_pages();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1857
1858
1859
1860
1861
1862
1863
  
  		/*
  		 * Any slabs which are created with the
  		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
  		 * which are reclaimable, under pressure.  The dentry
  		 * cache and most inode caches should fall into this
  		 */
972d1a7b1   Christoph Lameter   [PATCH] ZVC: Supp...
1864
  		free += global_page_state(NR_SLAB_RECLAIMABLE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1865
1866
  
  		/*
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1867
1868
  		 * Leave reserved pages. The pages are not for anonymous pages.
  		 */
c15bef309   Dmitry Fink   mmap: fix and tid...
1869
  		if (free <= totalreserve_pages)
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1870
1871
  			goto error;
  		else
c15bef309   Dmitry Fink   mmap: fix and tid...
1872
  			free -= totalreserve_pages;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1873
1874
  
  		/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1875
  		 * Reserve some for root
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1876
  		 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1877
  		if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1878
  			free -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1879
1880
1881
  
  		if (free > pages)
  			return 0;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1882
1883
  
  		goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1884
1885
1886
1887
  	}
  
  	allowed = totalram_pages * sysctl_overcommit_ratio / 100;
  	/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1888
  	 * Reserve some 3% for root
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1889
1890
  	 */
  	if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1891
  		allowed -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1892
  	allowed += total_swap_pages;
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1893
1894
1895
1896
1897
1898
1899
  	/*
  	 * Don't let a single process grow so big a user can't recover
  	 */
  	if (mm) {
  		reserve = sysctl_user_reserve_kbytes >> (PAGE_SHIFT - 10);
  		allowed -= min(mm->total_vm / 32, reserve);
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1900

00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1901
  	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1902
  		return 0;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1903

d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1904
  error:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1905
1906
1907
1908
  	vm_unacct_memory(pages);
  
  	return -ENOMEM;
  }
cae5d3903   Stephen Wilson   mm: arch: rename ...
1909
  /* Stub: always returns 0, whatever address is passed. */
  int in_gate_area_no_mm(unsigned long addr)
  {
  	return 0;
  }
b0e15190e   David Howells   [PATCH] NOMMU: Ma...
1913

d0217ac04   Nick Piggin   mm: fault feedbac...
1914
  /*
   * Stub: calling this is treated as a bug - the body hits BUG()
   * unconditionally.  The return statement only satisfies the prototype.
   */
  int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();

  	return 0;
  }
  EXPORT_SYMBOL(filemap_fault);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1920

0b173bc4d   Konstantin Khlebnikov   mm: kill vma flag...
1921
1922
1923
1924
1925
1926
1927
  /*
   * Stub: calling this is treated as a bug - the body hits BUG()
   * unconditionally.  The return statement only satisfies the prototype.
   */
  int generic_file_remap_pages(struct vm_area_struct *vma, unsigned long addr,
  			     unsigned long size, pgoff_t pgoff)
  {
  	BUG();

  	return 0;
  }
  EXPORT_SYMBOL(generic_file_remap_pages);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1928
1929
  static int __access_remote_vm(struct task_struct *tsk, struct mm_struct *mm,
  		unsigned long addr, void *buf, int len, int write)
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1930
  {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1931
  	struct vm_area_struct *vma;
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1932
1933
1934
1935
  
  	down_read(&mm->mmap_sem);
  
  	/* the access must start within one of the target process's mappings */
0159b141d   David Howells   [PATCH] NOMMU: Us...
1936
1937
  	vma = find_vma(mm, addr);
  	if (vma) {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1938
1939
1940
1941
1942
  		/* don't overrun this mapping */
  		if (addr + len >= vma->vm_end)
  			len = vma->vm_end - addr;
  
  		/* only read or write mappings where it is permitted */
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1943
  		if (write && vma->vm_flags & VM_MAYWRITE)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1944
1945
  			copy_to_user_page(vma, NULL, addr,
  					 (void *) addr, buf, len);
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1946
  		else if (!write && vma->vm_flags & VM_MAYREAD)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1947
1948
  			copy_from_user_page(vma, NULL, addr,
  					    buf, (void *) addr, len);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1949
1950
1951
1952
1953
1954
1955
  		else
  			len = 0;
  	} else {
  		len = 0;
  	}
  
  	up_read(&mm->mmap_sem);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1956
1957
1958
1959
1960
1961
1962
1963
1964
1965
1966
1967
1968
1969
1970
1971
1972
1973
1974
1975
1976
1977
1978
1979
1980
1981
1982
1983
1984
1985
1986
1987
1988
1989
1990
1991
  
  	return len;
  }
  
  /**
   * access_remote_vm - access another process' address space
   * @mm:		the mm_struct of the target address space
   * @addr:	start address to access
   * @buf:	source or destination buffer
   * @len:	number of bytes to transfer
   * @write:	whether the access is a write
   *
   * The caller must hold a reference on @mm.
   *
   * Return: the value returned by __access_remote_vm(), which is called with
   * a NULL task pointer.
   */
  int access_remote_vm(struct mm_struct *mm, unsigned long addr,
  		void *buf, int len, int write)
  {
  	return __access_remote_vm(NULL, mm, addr, buf, len, write);
  }
  
  /*
   * Access another process' address space.
   * - source/target buffer must be kernel space
   *
   * Takes a reference on @tsk's mm with get_task_mm() for the duration of the
   * access and drops it with mmput() afterwards.
   *
   * Returns the value returned by __access_remote_vm(), or 0 if @addr + @len
   * wraps around or if get_task_mm() returns NULL for @tsk.
   */
  int access_process_vm(struct task_struct *tsk, unsigned long addr, void *buf, int len, int write)
  {
  	struct mm_struct *mm;

  	/* refuse a range whose end wraps round to below its start */
  	if (addr + len < addr)
  		return 0;

  	mm = get_task_mm(tsk);
  	if (!mm)
  		return 0;

  	len = __access_remote_vm(tsk, mm, addr, buf, len, write);

  	mmput(mm);
  	return len;
  }
7e6608724   David Howells   nommu: fix shared...
1995
1996
1997
1998
1999
2000
2001
2002
2003
2004
2005
2006
2007
2008
2009
2010
  
  /**
   * nommu_shrink_inode_mappings - Shrink the shared mappings on an inode
   * @inode: The inode to check
   * @size: The current filesize of the inode
   * @newsize: The proposed filesize of the inode
   *
   * Check the shared mappings on an inode on behalf of a shrinking truncate to
   * make sure that any outstanding VMAs aren't broken and then shrink the
   * vm_regions that extend beyond the new size so that do_mmap_pgoff() doesn't
   * automatically grant mappings that are too large.
   *
   * Both nommu_region_sem (for writing) and the mapping's i_mmap_mutex are
   * held across the checks and the shrinking.
   *
   * Return: 0 on success, or -ETXTBSY if a shared VMA overlaps the range
   * between @newsize and @size.
   */
  int nommu_shrink_inode_mappings(struct inode *inode, size_t size,
  				size_t newsize)
  {
  	struct vm_area_struct *vma;
  	struct vm_region *region;
  	pgoff_t low, high;
  	size_t r_size, r_top;
  	int ret = 0;

  	/* page range of the dead zone: the part of the file being cut off */
  	low = newsize >> PAGE_SHIFT;
  	high = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;

  	down_write(&nommu_region_sem);
  	mutex_lock(&inode->i_mapping->i_mmap_mutex);

  	/* search for VMAs that fall within the dead zone */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap, low, high) {
  		/* found one - only interested if it's shared out of the page
  		 * cache */
  		if (vma->vm_flags & VM_SHARED) {
  			ret = -ETXTBSY; /* not quite true, but near enough */
  			goto out;
  		}
  	}

  	/* reduce any regions that overlap the dead zone - if in existence,
  	 * these will be pointed to by VMAs that don't overlap the dead zone
  	 *
  	 * we don't check for any regions that start beyond the EOF as there
  	 * shouldn't be any
  	 */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap,
  				  0, ULONG_MAX) {
  		if (!(vma->vm_flags & VM_SHARED))
  			continue;

  		region = vma->vm_region;
  		r_size = region->vm_top - region->vm_start;
  		r_top = (region->vm_pgoff << PAGE_SHIFT) + r_size;

  		/* pull the top of the region back to the new EOF, and the
  		 * end with it if the end now lies beyond the top */
  		if (r_top > newsize) {
  			region->vm_top -= r_top - newsize;
  			if (region->vm_end > region->vm_top)
  				region->vm_end = region->vm_top;
  		}
  	}

  out:
  	mutex_unlock(&inode->i_mapping->i_mmap_mutex);
  	up_write(&nommu_region_sem);
  	return ret;
  }
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
2057
2058
2059
2060
2061
2062
2063
2064
2065
2066
2067
2068
2069
2070
2071
2072
2073
2074
2075
2076
2077
  
  /*
   * Set the default value of sysctl_user_reserve_kbytes.
   *
   * The reserve exists so that a user who starts a single memory hogging
   * process can still recover (kill the hog) in OVERCOMMIT_NEVER mode.
   *
   * The default is 1/32 (about 3%) of the memory that is free when this
   * runs, capped at 128MB (1 << 17 kbytes).  128MB is enough to recover with
   * sshd/login, bash, and top/kill.
   *
   * Always returns 0.
   */
  static int __meminit init_user_reserve(void)
  {
  	unsigned long reserve_kbytes;

  	/* free pages -> kbytes, then keep 1/32 of that */
  	reserve_kbytes = global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  	reserve_kbytes /= 32;

  	/* never reserve more than the 128MB cap */
  	if (reserve_kbytes > (1UL << 17))
  		reserve_kbytes = 1UL << 17;

  	sysctl_user_reserve_kbytes = reserve_kbytes;
  	return 0;
  }
  module_init(init_user_reserve)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
2078
2079
2080
2081
2082
2083
2084
2085
2086
2087
2088
2089
2090
2091
2092
2093
2094
2095
2096
2097
2098
  
  /*
   * Set the default value of sysctl_admin_reserve_kbytes.
   *
   * sysctl_admin_reserve_kbytes is there so that the sys admin can still log
   * in and kill a memory hogging process.
   *
   * The default is 1/32 (about 3%) of the pages that are free when this runs,
   * capped at 8MB (1 << 13 kbytes).  Systems with more than 256MB free
   * therefore reserve 8MB, which is enough to recover with sshd, bash, and
   * top in OVERCOMMIT_GUESS; smaller systems reserve the 3% figure.
   *
   * Always returns 0.
   */
  static int __meminit init_admin_reserve(void)
  {
  	unsigned long reserve_kbytes;

  	/* free pages -> kbytes, then keep 1/32 of that */
  	reserve_kbytes = global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  	reserve_kbytes /= 32;

  	/* never reserve more than the 8MB cap */
  	if (reserve_kbytes > (1UL << 13))
  		reserve_kbytes = 1UL << 13;

  	sysctl_admin_reserve_kbytes = reserve_kbytes;
  	return 0;
  }
  module_init(init_admin_reserve)