Blame view

mm/nommu.c 50.7 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
  /*
   *  linux/mm/nommu.c
   *
   *  Replacement code for mm functions to support CPU's that don't
   *  have any form of memory management unit (thus no virtual memory).
   *
   *  See Documentation/nommu-mmap.txt
   *
8feae1311   David Howells   NOMMU: Make VMAs ...
9
   *  Copyright (c) 2004-2008 David Howells <dhowells@redhat.com>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
12
   *  Copyright (c) 2000-2003 David McCullough <davidm@snapgear.com>
   *  Copyright (c) 2000-2001 D Jeff Dionne <jeff@uClinux.org>
   *  Copyright (c) 2002      Greg Ungerer <gerg@snapgear.com>
29c185e5c   Paul Mundt   nommu: Provide st...
13
   *  Copyright (c) 2007-2010 Paul Mundt <lethal@linux-sh.org>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
14
   */
b95f1b31b   Paul Gortmaker   mm: Map most file...
15
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
16
17
18
19
20
21
22
23
  #include <linux/mm.h>
  #include <linux/mman.h>
  #include <linux/swap.h>
  #include <linux/file.h>
  #include <linux/highmem.h>
  #include <linux/pagemap.h>
  #include <linux/slab.h>
  #include <linux/vmalloc.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
24
25
26
27
28
29
  #include <linux/blkdev.h>
  #include <linux/backing-dev.h>
  #include <linux/mount.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
120a795da   Al Viro   audit mmap
30
  #include <linux/audit.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
31
32
33
34
  
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
  #include <asm/tlbflush.h>
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
35
  #include <asm/mmu_context.h>
8feae1311   David Howells   NOMMU: Make VMAs ...
36
  #include "internal.h"
8feae1311   David Howells   NOMMU: Make VMAs ...
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
  /*
   * Function entry/exit/debug tracing helpers.
   *
   * With "#if 0" the no_printk() variants are selected, so the calls are
   * never emitted as real printk()s; flip it to "#if 1" to get the messages
   * at KERN_DEBUG level.  Every message is terminated with a newline escape
   * inside the format string (a string literal must not span source lines).
   */
  #if 0
  #define kenter(FMT, ...) \
  	printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	printk(KERN_DEBUG "xxx" FMT"yyy\n", ##__VA_ARGS__)
  #else
  #define kenter(FMT, ...) \
  	no_printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	no_printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	no_printk(KERN_DEBUG FMT"\n", ##__VA_ARGS__)
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
58
59
60
61
62
  
  /*
   * Global memory-management variables and sysctl tunables defined by this
   * file.  None of them is static, so they are visible to other translation
   * units.
   */
  void *high_memory;
  struct page *mem_map;
  unsigned long max_mapnr;
  unsigned long num_physpages;
4266c97a3   Hugh Dickins   nommu: fix two bu...
63
  unsigned long highest_memmap_pfn;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
64
  /* per-cpu counter; initialised to 0 by mmap_init() */
  struct percpu_counter vm_committed_as;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
65
66
67
  int sysctl_overcommit_memory = OVERCOMMIT_GUESS; /* heuristic overcommit */
  int sysctl_overcommit_ratio = 50; /* default is 50% */
  int sysctl_max_map_count = DEFAULT_MAX_MAP_COUNT;
fc4d5c292   David Howells   nommu: make the i...
68
  int sysctl_nr_trim_pages = CONFIG_NOMMU_INITIAL_TRIM_EXCESS;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
69
  int heap_stack_gap = 0;
33e5d7697   David Howells   nommu: fix a numb...
70
  /* decremented once per page released by free_page_series() */
  atomic_long_t mmap_pages_allocated;
8feae1311   David Howells   NOMMU: Make VMAs ...
71

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
72
  EXPORT_SYMBOL(mem_map);
6a04de6db   Wu, Bryan   [PATCH] nommu: fi...
73
  EXPORT_SYMBOL(num_physpages);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
74

8feae1311   David Howells   NOMMU: Make VMAs ...
75
76
77
78
  /*
   * list of mapped, potentially shareable regions
   * - vm_region_jar: slab cache for struct vm_region, created in mmap_init()
   * - nommu_region_tree: rbtree of regions, ordered by vm_start (see
   *   add_nommu_region())
   * - nommu_region_sem: rw-semaphore taken for writing by put_nommu_region()
   *   and released inside __put_nommu_region()
   */
  static struct kmem_cache *vm_region_jar;
  struct rb_root nommu_region_tree = RB_ROOT;
  DECLARE_RWSEM(nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
79

f0f37e2f7   Alexey Dobriyan   const: mark struc...
80
  /*
   * VM operations table with no initialisers: every member is left
   * zero-initialised, i.e. no callbacks are provided here.
   */
  const struct vm_operations_struct generic_file_vm_ops = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
81
82
83
  };
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
84
85
86
87
88
89
90
91
   * Return the total memory allocated for this pointer, not
   * just what the caller asked for.
   *
   * Doesn't have to be accurate, i.e. may have races.
   */
  unsigned int kobjsize(const void *objp)
  {
  	struct page *page;
4016a1390   Michael Hennerich   mm/nommu.c: retur...
92
93
94
95
  	/*
  	 * If the object we have should not have ksize performed on it,
  	 * return size of 0
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
96
  	if (!objp || !virt_addr_valid(objp))
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
97
98
99
  		return 0;
  
  	page = virt_to_head_page(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
100
101
102
103
104
  
  	/*
  	 * If the allocator sets PageSlab, we know the pointer came from
  	 * kmalloc().
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
105
106
  	if (PageSlab(page))
  		return ksize(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
107
  	/*
ab2e83ead   Paul Mundt   NOMMU: Teach kobj...
108
109
110
111
112
113
114
115
116
117
118
119
120
121
  	 * If it's not a compound page, see if we have a matching VMA
  	 * region. This test is intentionally done in reverse order,
  	 * so if there's no VMA, we still fall through and hand back
  	 * PAGE_SIZE for 0-order pages.
  	 */
  	if (!PageCompound(page)) {
  		struct vm_area_struct *vma;
  
  		vma = find_vma(current->mm, (unsigned long)objp);
  		if (vma)
  			return vma->vm_end - vma->vm_start;
  	}
  
  	/*
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
122
  	 * The ksize() function is only guaranteed to work for pointers
5a1603be5   Paul Mundt   nommu: Correct ko...
123
  	 * returned by kmalloc(). So handle arbitrary pointers here.
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
124
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
125
  	return PAGE_SIZE << compound_order(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
126
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
127
  int __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
4266c97a3   Hugh Dickins   nommu: fix two bu...
128
  		     unsigned long start, int nr_pages, unsigned int foll_flags,
53a7706d5   Michel Lespinasse   mlock: do not hol...
129
130
  		     struct page **pages, struct vm_area_struct **vmas,
  		     int *retry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
131
  {
910e46da4   Sonic Zhang   [PATCH] Check if ...
132
  	struct vm_area_struct *vma;
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
133
134
135
136
  	unsigned long vm_flags;
  	int i;
  
  	/* calculate required read or write permissions.
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
137
  	 * If FOLL_FORCE is set, we only require the "MAY" flags.
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
138
  	 */
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
139
140
141
142
  	vm_flags  = (foll_flags & FOLL_WRITE) ?
  			(VM_WRITE | VM_MAYWRITE) : (VM_READ | VM_MAYREAD);
  	vm_flags &= (foll_flags & FOLL_FORCE) ?
  			(VM_MAYREAD | VM_MAYWRITE) : (VM_READ | VM_WRITE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
143

9d73777e5   Peter Zijlstra   clarify get_user_...
144
  	for (i = 0; i < nr_pages; i++) {
7561e8ca0   David Howells   NOMMU: Revert 'no...
145
  		vma = find_vma(mm, start);
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
146
147
148
149
  		if (!vma)
  			goto finish_or_fault;
  
  		/* protect what we can, including chardevs */
1c3aff1ce   Hugh Dickins   mm: remove unused...
150
151
  		if ((vma->vm_flags & (VM_IO | VM_PFNMAP)) ||
  		    !(vm_flags & vma->vm_flags))
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
152
  			goto finish_or_fault;
910e46da4   Sonic Zhang   [PATCH] Check if ...
153

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
154
155
156
157
158
159
  		if (pages) {
  			pages[i] = virt_to_page(start);
  			if (pages[i])
  				page_cache_get(pages[i]);
  		}
  		if (vmas)
910e46da4   Sonic Zhang   [PATCH] Check if ...
160
  			vmas[i] = vma;
e1ee65d85   David Howells   NOMMU: Fix __get_...
161
  		start = (start + PAGE_SIZE) & PAGE_MASK;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
162
  	}
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
163
164
165
166
167
  
  	return i;
  
  finish_or_fault:
  	return i ? : -EFAULT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
168
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
169

b291f0003   Nick Piggin   mlock: mlocked pa...
170
171
172
173
174
175
176
177
  /*
   * get a list of pages in an address range belonging to the specified process
   * and indicate the VMA that covers each page
   * - this is potentially dodgy as we may end incrementing the page count of a
   *   slab page or a secondary page from a compound page
   * - don't permit access to VMAs that don't support it, such as I/O mappings
   */
  int get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
9d73777e5   Peter Zijlstra   clarify get_user_...
178
  	unsigned long start, int nr_pages, int write, int force,
b291f0003   Nick Piggin   mlock: mlocked pa...
179
180
181
182
183
  	struct page **pages, struct vm_area_struct **vmas)
  {
  	int flags = 0;
  
  	if (write)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
184
  		flags |= FOLL_WRITE;
b291f0003   Nick Piggin   mlock: mlocked pa...
185
  	if (force)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
186
  		flags |= FOLL_FORCE;
b291f0003   Nick Piggin   mlock: mlocked pa...
187

53a7706d5   Michel Lespinasse   mlock: do not hol...
188
189
  	return __get_user_pages(tsk, mm, start, nr_pages, flags, pages, vmas,
  				NULL);
b291f0003   Nick Piggin   mlock: mlocked pa...
190
  }
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
191
  EXPORT_SYMBOL(get_user_pages);
dfc2f91ac   Paul Mundt   nommu: provide fo...
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
  /**
   * follow_pfn - look up PFN at a user virtual address
   * @vma: memory mapping
   * @address: user virtual address
   * @pfn: location to store found PFN
   *
   * Only IO mappings and raw PFN mappings are allowed.
   *
   * Returns zero and the pfn at @pfn on success, -ve otherwise.
   */
  int follow_pfn(struct vm_area_struct *vma, unsigned long address,
  	unsigned long *pfn)
  {
  	const unsigned long raw_mapping = VM_IO | VM_PFNMAP;

  	/* refuse anything that is neither an IO nor a raw PFN mapping */
  	if ((vma->vm_flags & raw_mapping) == 0)
  		return -EINVAL;

  	/* the PFN is simply the address shifted down by PAGE_SHIFT */
  	*pfn = address >> PAGE_SHIFT;
  	return 0;
  }
  EXPORT_SYMBOL(follow_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
212
213
  /*
   * vmalloc area list head and its lock.
   * NOTE(review): neither is referenced by the code visible in this part of
   * the file - presumably defined for users elsewhere; confirm.
   */
  DEFINE_RWLOCK(vmlist_lock);
  struct vm_struct *vmlist;
b3bdda02a   Christoph Lameter   vmalloc: add cons...
214
  /*
   * Release memory obtained from the vmalloc family in this file.
   * __vmalloc() here hands out kmalloc() memory, so kfree() is the matching
   * release.
   */
  void vfree(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
215
216
217
  {
  	kfree(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
218
  EXPORT_SYMBOL(vfree);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
219

dd0fc66fb   Al Viro   [PATCH] gfp flags...
220
  /*
   * Allocate @size bytes with kmalloc() on behalf of the vmalloc family.
   * @prot is not used.
   */
  void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
  {
  	gfp_t flags = gfp_mask | __GFP_COMP;

  	/*
  	 * kmalloc() returns only a logical address, so __GFP_HIGHMEM
  	 * cannot be passed to it: strip it from the mask.
  	 */
  	flags &= ~__GFP_HIGHMEM;

  	return kmalloc(size, flags);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
228
  EXPORT_SYMBOL(__vmalloc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
229

f905bc447   Paul Mundt   nommu: add new vm...
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
  /*
   * Allocate zeroed memory and, if a VMA of the current process is found
   * for the returned address, flag that VMA VM_USERMAP.
   * Returns the allocation, or NULL on failure.
   */
  void *vmalloc_user(unsigned long size)
  {
  	struct vm_area_struct *vma;
  	void *ret;

  	ret = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	if (!ret)
  		return ret;

  	/* the VMA flags are modified under the mmap semaphore */
  	down_write(&current->mm->mmap_sem);
  	vma = find_vma(current->mm, (unsigned long)ret);
  	if (vma)
  		vma->vm_flags |= VM_USERMAP;
  	up_write(&current->mm->mmap_sem);

  	return ret;
  }
  EXPORT_SYMBOL(vmalloc_user);
b3bdda02a   Christoph Lameter   vmalloc: add cons...
249
  /*
   * Map an address to its struct page.  This is a direct virt_to_page()
   * lookup; no page-table walk is performed here.
   */
  struct page *vmalloc_to_page(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
250
251
252
  {
  	return virt_to_page(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
253
  EXPORT_SYMBOL(vmalloc_to_page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
254

b3bdda02a   Christoph Lameter   vmalloc: add cons...
255
  /*
   * Map an address to its page frame number by way of its struct page.
   */
  unsigned long vmalloc_to_pfn(const void *addr)
  {
  	struct page *page = virt_to_page(addr);

  	return page_to_pfn(page);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
259
  EXPORT_SYMBOL(vmalloc_to_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
  
  /*
   * Copy @count bytes from @addr into @buf.
   *
   * If @addr + @count would wrap around the end of the address space, the
   * count is clamped so that the read stops at the top of memory, matching
   * the check vwrite() performs.
   *
   * Returns the number of bytes copied.
   */
  long vread(char *buf, char *addr, unsigned long count)
  {
  	/* Don't allow overflow */
  	if ((unsigned long) addr + count < count)
  		count = -(unsigned long) addr;

  	memcpy(buf, addr, count);
  	return count;
  }
  
  /*
   * Copy @count bytes from @buf to @addr, clamping @count so the write does
   * not wrap past the top of the address space.
   *
   * Returns the number of bytes copied.
   */
  long vwrite(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dest = (unsigned long) addr;

  	/* a wrapped sum means the range runs off the end of memory */
  	if (dest + count < count)
  		count = -dest;

  	memcpy(addr, buf, count);
  	return count;
  }
  
  /*
   *	vmalloc  -  allocate virtually contiguous memory
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *
c1c8897f8   Michael Opdenacker   Spelling fix: "co...
285
   *	For tight control over page level allocator and protection flags
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
286
287
288
289
290
291
   *	use __vmalloc() instead.
   */
  void *vmalloc(unsigned long size)
  {
         return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
  }
f61388822   Andrew Morton   [PATCH] nommu: im...
292
  EXPORT_SYMBOL(vmalloc);
e1ca7788d   Dave Young   mm: add vzalloc()...
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
  /*
   *	vzalloc - allocate virtually continguos memory with zero fill
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into continguos kernel virtual space.
   *	The memory allocated is set to zero.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  void *vzalloc(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  }
  EXPORT_SYMBOL(vzalloc);
  
  /**
   * vmalloc_node - allocate memory on a specific node
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
f61388822   Andrew Morton   [PATCH] nommu: im...
323
324
325
326
  /* @node is ignored here: the request is forwarded to vmalloc() unchanged. */
  void *vmalloc_node(unsigned long size, int node)
  {
  	return vmalloc(size);
  }
9a14f653d   Paul Mundt   nommu: Fix up vma...
327
  EXPORT_SYMBOL(vmalloc_node);
e1ca7788d   Dave Young   mm: add vzalloc()...
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
  
  /**
   * vzalloc_node - allocate memory on a specific node with zero fill
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   * The memory allocated is set to zero.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
  /* @node is ignored here: the request is forwarded to vzalloc() unchanged. */
  void *vzalloc_node(unsigned long size, int node)
  {
  	return vzalloc(size);
  }
  EXPORT_SYMBOL(vzalloc_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
346

1af446edf   Paul Mundt   nommu: Provide vm...
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
  #ifndef PAGE_KERNEL_EXEC
  # define PAGE_KERNEL_EXEC PAGE_KERNEL
  #endif
  
  /**
   *	vmalloc_exec  -  allocate virtually contiguous, executable memory
   *	@size:		allocation size
   *
   *	Kernel-internal function to allocate enough pages to cover @size
   *	from the page level allocator and map them into contiguous and
   *	executable kernel virtual space.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  
  void *vmalloc_exec(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
367
368
  /**
   * vmalloc_32  -  allocate virtually contiguous memory (32bit addressable)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
369
370
371
372
373
374
375
376
377
   *	@size:		allocation size
   *
   *	Allocate enough 32bit PA addressable pages to cover @size from the
   *	page level allocator and map them into contiguous kernel virtual space.
   */
  /* Unlike vmalloc(), only GFP_KERNEL is requested (no __GFP_HIGHMEM). */
  void *vmalloc_32(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
378
379
380
381
382
383
384
385
  EXPORT_SYMBOL(vmalloc_32);
  
  /**
   * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
   *	@size:		allocation size
   *
   * The resulting memory area is 32bit addressable and zeroed so it can be
   * mapped to userspace without leaking data.
f905bc447   Paul Mundt   nommu: add new vm...
386
387
388
   *
   * VM_USERMAP is set on the corresponding VMA so that subsequent calls to
   * remap_vmalloc_range() are permissible.
b50731732   Paul Mundt   nommu: vmalloc_32...
389
390
391
   */
  void *vmalloc_32_user(unsigned long size)
  {
f905bc447   Paul Mundt   nommu: add new vm...
392
393
394
395
396
  	/*
  	 * We'll have to sort out the ZONE_DMA bits for 64-bit,
  	 * but for now this can simply use vmalloc_user() directly,
  	 * which already returns zeroed memory and sets VM_USERMAP.
  	 */
  	return vmalloc_user(size);
b50731732   Paul Mundt   nommu: vmalloc_32...
397
398
  }
  EXPORT_SYMBOL(vmalloc_32_user);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
399
400
401
402
403
404
  
  /*
   * Not implemented in this file: any call hits BUG().  The NULL return
   * only matters if BUG() returns.
   */
  void *vmap(struct page **pages, unsigned int count, unsigned long flags, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
405
  EXPORT_SYMBOL(vmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
406

b3bdda02a   Christoph Lameter   vmalloc: add cons...
407
  /* Not implemented in this file (vmap() is a BUG() stub too): hits BUG(). */
  void vunmap(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
408
409
410
  {
  	BUG();
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
411
  EXPORT_SYMBOL(vunmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
412

eb6434d9e   Paul Mundt   nommu: Stub in vm...
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
  /*
   * Not implemented in this file: any call hits BUG().  The NULL return
   * only matters if BUG() returns.
   */
  void *vm_map_ram(struct page **pages, unsigned int count, int node, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL(vm_map_ram);
  
  /* Not implemented in this file (vm_map_ram() is a BUG() stub too). */
  void vm_unmap_ram(const void *mem, unsigned int count)
  {
  	BUG();
  }
  EXPORT_SYMBOL(vm_unmap_ram);
  
  /* Empty stub: calling it has no effect. */
  void vm_unmap_aliases(void)
  {
  }
  EXPORT_SYMBOL_GPL(vm_unmap_aliases);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
430
  /*
1eeb66a1b   Christoph Hellwig   move die notifier...
431
432
433
434
435
436
   * Implement a stub for vmalloc_sync_all() if the architecture chose not to
   * have one.
   */
  /* Weak, empty default definition. */
  void  __attribute__((weak)) vmalloc_sync_all(void)
  {
  }
29c185e5c   Paul Mundt   nommu: Provide st...
437
438
439
440
441
442
443
444
445
446
447
448
  /**
   *	alloc_vm_area - allocate a range of kernel address space
   *	@size:		size of the area
   *
   *	Returns:	NULL on failure, vm_struct on success
   *
   *	This function reserves a range of kernel address space, and
   *	allocates pagetables to map that range.  No actual mappings
   *	are created.  If the kernel address space is not shared
   *	between processes, it syncs the pagetable across all
   *	processes.
   */
cd12909cb   David Vrabel   xen: map foreign ...
449
  /*
   * Stub: nothing is reserved or allocated here, whatever the comment above
   * says; any call hits BUG().  @size and @ptes are unused, and the NULL
   * return only matters if BUG() returns.
   */
  struct vm_struct *alloc_vm_area(size_t size, pte_t **ptes)
29c185e5c   Paul Mundt   nommu: Provide st...
450
451
452
453
454
455
456
457
458
459
460
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL_GPL(alloc_vm_area);
  
  /* Stub counterpart of alloc_vm_area(): any call hits BUG(). */
  void free_vm_area(struct vm_struct *area)
  {
  	BUG();
  }
  EXPORT_SYMBOL_GPL(free_vm_area);
b50731732   Paul Mundt   nommu: vmalloc_32...
461
462
463
464
465
466
  /*
   * Stub: always fails with -EINVAL; none of the arguments is examined.
   */
  int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
  		   struct page *page)
  {
  	return -EINVAL;
  }
  EXPORT_SYMBOL(vm_insert_page);
1eeb66a1b   Christoph Hellwig   move die notifier...
467
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
468
469
470
471
472
473
   *  sys_brk() for the most part doesn't need the global kernel
   *  lock, except when an application is doing something nasty
   *  like trying to un-brk an area that has already been mapped
   *  to a regular file.  in this case, the unmapping will need
   *  to invoke file system routines that need the global lock.
   */
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
474
  SYSCALL_DEFINE1(brk, unsigned long, brk)
  {
  	struct mm_struct *mm = current->mm;

  	/* requests outside [start_brk, context.end_brk] leave brk untouched */
  	if (brk < mm->start_brk || brk > mm->context.end_brk)
  		return mm->brk;

  	/* nothing to do if the break is already where it was asked to be */
  	if (brk == mm->brk)
  		return mm->brk;

  	/*
  	 * Shrinking is always allowed and needs no further work; growing
  	 * additionally flushes the icache over the newly exposed range.
  	 */
  	if (brk > mm->brk)
  		flush_icache_range(mm->brk, brk);

  	mm->brk = brk;
  	return brk;
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
498
499
500
501
  /*
   * initialise the VMA and region record slabs
   */
  void __init mmap_init(void)
  {
  	/* committed-memory counter starts at zero */
  	int ret = percpu_counter_init(&vm_committed_as, 0);

  	VM_BUG_ON(ret);

  	/* slab cache for struct vm_region, created with SLAB_PANIC */
  	vm_region_jar = KMEM_CACHE(vm_region, SLAB_PANIC);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
509

3034097a5   David Howells   [PATCH] NOMMU: Or...
510
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
511
512
   * validate the region tree
   * - the caller must hold the region lock
3034097a5   David Howells   [PATCH] NOMMU: Or...
513
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
514
515
  #ifdef CONFIG_DEBUG_NOMMU_REGIONS
  /*
   * Walk the region tree in order and BUG() if any region is malformed
   * (vm_end <= vm_start, or vm_top < vm_end) or starts below the vm_top of
   * the region before it.
   */
  static noinline void validate_nommu_regions(void)
  {
  	struct vm_region *prev, *cur;
  	struct rb_node *node;

  	node = rb_first(&nommu_region_tree);
  	if (!node)
  		return;

  	/* the first region only has its own bounds to check */
  	prev = rb_entry(node, struct vm_region, vm_rb);
  	BUG_ON(unlikely(prev->vm_end <= prev->vm_start));
  	BUG_ON(unlikely(prev->vm_top < prev->vm_end));

  	for (node = rb_next(node); node; node = rb_next(node)) {
  		cur = rb_entry(node, struct vm_region, vm_rb);

  		BUG_ON(unlikely(cur->vm_end <= cur->vm_start));
  		BUG_ON(unlikely(cur->vm_top < cur->vm_end));
  		BUG_ON(unlikely(cur->vm_start < prev->vm_top));

  		prev = cur;
  	}
  }
  #else
  /* validation compiled out */
  static void validate_nommu_regions(void)
  {
  }
  #endif
3034097a5   David Howells   [PATCH] NOMMU: Or...
543
544
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
545
   * add a region into the global tree
3034097a5   David Howells   [PATCH] NOMMU: Or...
546
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
547
  static void add_nommu_region(struct vm_region *region)
3034097a5   David Howells   [PATCH] NOMMU: Or...
548
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
549
550
  	struct vm_region *pregion;
  	struct rb_node **p, *parent;
3034097a5   David Howells   [PATCH] NOMMU: Or...
551

8feae1311   David Howells   NOMMU: Make VMAs ...
552
  	validate_nommu_regions();
8feae1311   David Howells   NOMMU: Make VMAs ...
553
554
555
556
557
558
559
560
561
562
563
564
565
  	parent = NULL;
  	p = &nommu_region_tree.rb_node;
  	while (*p) {
  		parent = *p;
  		pregion = rb_entry(parent, struct vm_region, vm_rb);
  		if (region->vm_start < pregion->vm_start)
  			p = &(*p)->rb_left;
  		else if (region->vm_start > pregion->vm_start)
  			p = &(*p)->rb_right;
  		else if (pregion == region)
  			return;
  		else
  			BUG();
3034097a5   David Howells   [PATCH] NOMMU: Or...
566
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
567
568
  	rb_link_node(&region->vm_rb, parent, p);
  	rb_insert_color(&region->vm_rb, &nommu_region_tree);
3034097a5   David Howells   [PATCH] NOMMU: Or...
569

8feae1311   David Howells   NOMMU: Make VMAs ...
570
  	validate_nommu_regions();
3034097a5   David Howells   [PATCH] NOMMU: Or...
571
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
572
573
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
574
   * delete a region from the global tree
930e652a2   David Howells   [PATCH] NOMMU: Ma...
575
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
576
  /*
   * Erase @region from the global region tree.  The tree must not be empty
   * (BUG otherwise); it is validated both before and after the erase.
   */
  static void delete_nommu_region(struct vm_region *region)
930e652a2   David Howells   [PATCH] NOMMU: Ma...
577
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
578
  	BUG_ON(!nommu_region_tree.rb_node);
930e652a2   David Howells   [PATCH] NOMMU: Ma...
579

8feae1311   David Howells   NOMMU: Make VMAs ...
580
581
582
  	validate_nommu_regions();
  	rb_erase(&region->vm_rb, &nommu_region_tree);
  	validate_nommu_regions();
57c8f63e8   Greg Ungerer   nommu: stub expan...
583
  }
930e652a2   David Howells   [PATCH] NOMMU: Ma...
584
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
585
   * free a contiguous series of pages
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
586
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
587
  static void free_page_series(unsigned long from, unsigned long to)
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
588
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
589
590
591
592
  	for (; from < to; from += PAGE_SIZE) {
  		struct page *page = virt_to_page(from);
  
  		kdebug("- free %lx", from);
33e5d7697   David Howells   nommu: fix a numb...
593
  		atomic_long_dec(&mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
594
  		if (page_count(page) != 1)
33e5d7697   David Howells   nommu: fix a numb...
595
596
  			kdebug("free page %p: refcount not one: %d",
  			       page, page_count(page));
8feae1311   David Howells   NOMMU: Make VMAs ...
597
  		put_page(page);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
598
  	}
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
599
600
601
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
602
   * release a reference to a region
33e5d7697   David Howells   nommu: fix a numb...
603
   * - the caller must hold the region semaphore for writing, which this releases
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
604
   * - the region may not have been added to the tree yet, in which case vm_top
8feae1311   David Howells   NOMMU: Make VMAs ...
605
   *   will equal vm_start
3034097a5   David Howells   [PATCH] NOMMU: Or...
606
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
607
608
  static void __put_nommu_region(struct vm_region *region)
  	__releases(nommu_region_sem)
  {
  	kenter("%p{%d}", region, region->vm_usage);

  	BUG_ON(!nommu_region_tree.rb_node);

  	/* other users remain: just drop the semaphore and leave */
  	region->vm_usage--;
  	if (region->vm_usage != 0) {
  		up_write(&nommu_region_sem);
  		return;
  	}

  	/* last user: unlink from the tree if the region was ever added */
  	if (region->vm_top > region->vm_start)
  		delete_nommu_region(region);
  	up_write(&nommu_region_sem);

  	if (region->vm_file)
  		fput(region->vm_file);

  	/* IO memory and memory shared directly out of the pagecache
  	 * from ramfs/tmpfs mustn't be released here */
  	if (region->vm_flags & VM_MAPPED_COPY) {
  		kdebug("free series");
  		free_page_series(region->vm_start, region->vm_top);
  	}

  	kmem_cache_free(vm_region_jar, region);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
633

8feae1311   David Howells   NOMMU: Make VMAs ...
634
635
636
637
638
639
640
  /*
   * release a reference to a region
   */
  /*
   * Locked wrapper: takes nommu_region_sem for writing, then calls
   * __put_nommu_region(), which releases the semaphore itself - hence no
   * up_write() here.
   */
  static void put_nommu_region(struct vm_region *region)
  {
  	down_write(&nommu_region_sem);
  	__put_nommu_region(region);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
641
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
642
  /*
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
   * update protection on a vma
   */
  /*
   * Apply @flags to every page of @vma.
   *
   * Only does anything when CONFIG_MPU is set: each page from the
   * page-aligned start of the VMA up to vm_end is handed to protect_page(),
   * then update_protections() is called once for the mm.  Without
   * CONFIG_MPU this is an empty function.
   */
  static void protect_vma(struct vm_area_struct *vma, unsigned long flags)
  {
  #ifdef CONFIG_MPU
  	struct mm_struct *mm = vma->vm_mm;
  	/* addresses are unsigned: keep the cursor the same type as vm_end */
  	unsigned long start = vma->vm_start & PAGE_MASK;
  	while (start < vma->vm_end) {
  		protect_page(mm, start, flags);
  		start += PAGE_SIZE;
  	}
  	update_protections(mm);
  #endif
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
659
660
661
662
   * add a VMA into a process's mm_struct in the appropriate place in the list
   * and tree and add to the address space's page tree also if not an anonymous
   * page
   * - should be called with mm->mmap_sem held writelocked
3034097a5   David Howells   [PATCH] NOMMU: Or...
663
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
664
  static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
665
  {
6038def0d   Namhyung Kim   mm: nommu: sort m...
666
  	struct vm_area_struct *pvma, *prev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
667
  	struct address_space *mapping;
6038def0d   Namhyung Kim   mm: nommu: sort m...
668
  	struct rb_node **p, *parent, *rb_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
669
670
671
672
673
674
675
  
  	kenter(",%p", vma);
  
  	BUG_ON(!vma->vm_region);
  
  	mm->map_count++;
  	vma->vm_mm = mm;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
676

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
677
  	protect_vma(vma, vma->vm_flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
678
679
680
681
682
683
684
685
  	/* add the VMA to the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
  
  		flush_dcache_mmap_lock(mapping);
  		vma_prio_tree_insert(vma, &mapping->i_mmap);
  		flush_dcache_mmap_unlock(mapping);
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
686
  	/* add the VMA to the tree */
6038def0d   Namhyung Kim   mm: nommu: sort m...
687
  	parent = rb_prev = NULL;
8feae1311   David Howells   NOMMU: Make VMAs ...
688
  	p = &mm->mm_rb.rb_node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
689
690
691
  	while (*p) {
  		parent = *p;
  		pvma = rb_entry(parent, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
692
693
694
  		/* sort by: start addr, end addr, VMA struct addr in that order
  		 * (the latter is necessary as we may get identical VMAs) */
  		if (vma->vm_start < pvma->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
695
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
696
697
  		else if (vma->vm_start > pvma->vm_start) {
  			rb_prev = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
698
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
699
  		} else if (vma->vm_end < pvma->vm_end)
8feae1311   David Howells   NOMMU: Make VMAs ...
700
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
701
702
  		else if (vma->vm_end > pvma->vm_end) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
703
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
704
  		} else if (vma < pvma)
8feae1311   David Howells   NOMMU: Make VMAs ...
705
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
706
707
  		else if (vma > pvma) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
708
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
709
  		} else
8feae1311   David Howells   NOMMU: Make VMAs ...
710
  			BUG();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
711
712
713
  	}
  
  	rb_link_node(&vma->vm_rb, parent, p);
8feae1311   David Howells   NOMMU: Make VMAs ...
714
715
716
  	rb_insert_color(&vma->vm_rb, &mm->mm_rb);
  
  	/* add VMA to the VMA list also */
6038def0d   Namhyung Kim   mm: nommu: sort m...
717
718
719
  	prev = NULL;
  	if (rb_prev)
  		prev = rb_entry(rb_prev, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
720

6038def0d   Namhyung Kim   mm: nommu: sort m...
721
  	__vma_link_list(mm, vma, prev, parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
722
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
723
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
724
   * delete a VMA from its owning mm_struct and address space
3034097a5   David Howells   [PATCH] NOMMU: Or...
725
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
726
  static void delete_vma_from_mm(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
727
728
  {
  	struct address_space *mapping;
8feae1311   David Howells   NOMMU: Make VMAs ...
729
730
731
  	struct mm_struct *mm = vma->vm_mm;
  
  	kenter("%p", vma);
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
732
  	protect_vma(vma, 0);
8feae1311   David Howells   NOMMU: Make VMAs ...
733
734
735
  	mm->map_count--;
  	if (mm->mmap_cache == vma)
  		mm->mmap_cache = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
736
737
738
739
740
741
742
743
744
  
  	/* remove the VMA from the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
  
  		flush_dcache_mmap_lock(mapping);
  		vma_prio_tree_remove(vma, &mapping->i_mmap);
  		flush_dcache_mmap_unlock(mapping);
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
745
746
  	/* remove from the MM's tree and list */
  	rb_erase(&vma->vm_rb, &mm->mm_rb);
b951bf2c4   Namhyung Kim   mm: nommu: don't ...
747
748
749
750
751
752
753
754
  
  	if (vma->vm_prev)
  		vma->vm_prev->vm_next = vma->vm_next;
  	else
  		mm->mmap = vma->vm_next;
  
  	if (vma->vm_next)
  		vma->vm_next->vm_prev = vma->vm_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
  
  	vma->vm_mm = NULL;
  }
  
  /*
   * destroy a VMA record
   */
  static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
  {
  	struct file *backing;

  	kenter("%p", vma);

  	/* give the VMA's owner a chance to clean up first */
  	if (vma->vm_ops && vma->vm_ops->close)
  		vma->vm_ops->close(vma);

  	/* release the file reference held by the VMA, if there is one */
  	backing = vma->vm_file;
  	if (backing) {
  		fput(backing);
  		if (vma->vm_flags & VM_EXECUTABLE)
  			removed_exe_file_vma(mm);
  	}

  	/* drop the region reference, then free the VMA record itself */
  	put_nommu_region(vma->vm_region);
  	kmem_cache_free(vm_area_cachep, vma);
  }
  
  /*
   * look up the first VMA in which addr resides, NULL if none
   * - should be called with mm->mmap_sem at least held readlocked
   */
  struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *hit = mm->mmap_cache;

  	/* fast path: the most recently found VMA still covers addr */
  	if (hit && addr >= hit->vm_start && addr < hit->vm_end)
  		return hit;

  	/* Slow path: walk the VMA list.  The walk stops at the first VMA
  	 * that starts beyond addr; the first VMA found to contain addr
  	 * (several may) is cached and returned. */
  	hit = mm->mmap;
  	while (hit && hit->vm_start <= addr) {
  		if (addr < hit->vm_end) {
  			mm->mmap_cache = hit;
  			return hit;
  		}
  		hit = hit->vm_next;
  	}

  	return NULL;
  }
  EXPORT_SYMBOL(find_vma);
  
  /*
   * find a VMA
   * - we don't extend stack VMAs under NOMMU conditions
   */
  struct vm_area_struct *find_extend_vma(struct mm_struct *mm, unsigned long addr)
  {
  	/* no extension is attempted here: this is a plain lookup */
  	struct vm_area_struct *found = find_vma(mm, addr);

  	return found;
  }
  
  /*
   * expand a stack to a given address
   * - not supported under NOMMU conditions
   */
  int expand_stack(struct vm_area_struct *vma, unsigned long address)
  {
  	/* neither argument is examined: the call always fails with -ENOMEM */
  	return -ENOMEM;
  }
  
  /*
   * look up the first VMA that exactly matches addr and len
   * - should be called with mm->mmap_sem at least held readlocked
   */
  static struct vm_area_struct *find_vma_exact(struct mm_struct *mm,
  					     unsigned long addr,
  					     unsigned long len)
  {
  	const unsigned long limit = addr + len;
  	struct vm_area_struct *cand = mm->mmap_cache;

  	/* fast path: the cached VMA spans exactly [addr, addr + len) */
  	if (cand && cand->vm_start == addr && cand->vm_end == limit)
  		return cand;

  	/* Slow path: walk the VMA list.  VMAs starting below addr are
  	 * skipped, the walk gives up at the first VMA starting above addr,
  	 * and among those starting at addr the first with a matching end is
  	 * cached and returned. */
  	for (cand = mm->mmap; cand; cand = cand->vm_next) {
  		if (cand->vm_start > addr)
  			break;
  		if (cand->vm_start == addr && cand->vm_end == limit) {
  			mm->mmap_cache = cand;
  			return cand;
  		}
  	}

  	return NULL;
  }
  
  /*
   * determine whether a mapping should be permitted and, if so, what sort of
   * mapping we're capable of supporting
   */
  static int validate_mmap_request(struct file *file,
  				 unsigned long addr,
  				 unsigned long len,
  				 unsigned long prot,
  				 unsigned long flags,
  				 unsigned long pgoff,
  				 unsigned long *_capabilities)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
864
  	unsigned long capabilities, rlen;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
865
866
867
868
  	unsigned long reqprot = prot;
  	int ret;
  
  	/* do the simple checks first */
06aab5a30   David Howells   NOMMU: Ignore mma...
869
  	if (flags & MAP_FIXED) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
870
871
872
873
874
875
876
877
878
879
  		printk(KERN_DEBUG
  		       "%d: Can't do fixed-address/overlay mmap of RAM
  ",
  		       current->pid);
  		return -EINVAL;
  	}
  
  	if ((flags & MAP_TYPE) != MAP_PRIVATE &&
  	    (flags & MAP_TYPE) != MAP_SHARED)
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
880
  	if (!len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
881
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
882
  	/* Careful about overflows.. */
8feae1311   David Howells   NOMMU: Make VMAs ...
883
884
  	rlen = PAGE_ALIGN(len);
  	if (!rlen || rlen > TASK_SIZE)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
885
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
886
  	/* offset overflow? */
8feae1311   David Howells   NOMMU: Make VMAs ...
887
  	if ((pgoff + (rlen >> PAGE_SHIFT)) < pgoff)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
888
  		return -EOVERFLOW;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
  
  	if (file) {
  		/* validate file mapping requests */
  		struct address_space *mapping;
  
  		/* files must support mmap */
  		if (!file->f_op || !file->f_op->mmap)
  			return -ENODEV;
  
  		/* work out if what we've got could possibly be shared
  		 * - we support chardevs that provide their own "memory"
  		 * - we support files/blockdevs that are memory backed
  		 */
  		mapping = file->f_mapping;
  		if (!mapping)
e9536ae72   Josef Sipek   [PATCH] struct pa...
904
  			mapping = file->f_path.dentry->d_inode->i_mapping;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
905
906
907
908
909
910
911
912
  
  		capabilities = 0;
  		if (mapping && mapping->backing_dev_info)
  			capabilities = mapping->backing_dev_info->capabilities;
  
  		if (!capabilities) {
  			/* no explicit capabilities set, so assume some
  			 * defaults */
e9536ae72   Josef Sipek   [PATCH] struct pa...
913
  			switch (file->f_path.dentry->d_inode->i_mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
  			case S_IFREG:
  			case S_IFBLK:
  				capabilities = BDI_CAP_MAP_COPY;
  				break;
  
  			case S_IFCHR:
  				capabilities =
  					BDI_CAP_MAP_DIRECT |
  					BDI_CAP_READ_MAP |
  					BDI_CAP_WRITE_MAP;
  				break;
  
  			default:
  				return -EINVAL;
  			}
  		}
  
  		/* eliminate any capabilities that we can't support on this
  		 * device */
  		if (!file->f_op->get_unmapped_area)
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		if (!file->f_op->read)
  			capabilities &= ~BDI_CAP_MAP_COPY;
28d7a6ae9   Graff Yang   nommu: check fd r...
937
938
939
  		/* The file shall have been opened with read permission. */
  		if (!(file->f_mode & FMODE_READ))
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
940
941
942
943
944
  		if (flags & MAP_SHARED) {
  			/* do checks for writing, appending and locking */
  			if ((prot & PROT_WRITE) &&
  			    !(file->f_mode & FMODE_WRITE))
  				return -EACCES;
e9536ae72   Josef Sipek   [PATCH] struct pa...
945
  			if (IS_APPEND(file->f_path.dentry->d_inode) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
946
947
  			    (file->f_mode & FMODE_WRITE))
  				return -EACCES;
e9536ae72   Josef Sipek   [PATCH] struct pa...
948
  			if (locks_verify_locked(file->f_path.dentry->d_inode))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
949
950
951
952
  				return -EAGAIN;
  
  			if (!(capabilities & BDI_CAP_MAP_DIRECT))
  				return -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
953
954
955
956
957
958
959
960
961
962
963
964
965
966
  			/* we mustn't privatise shared mappings */
  			capabilities &= ~BDI_CAP_MAP_COPY;
  		}
  		else {
  			/* we're going to read the file into private memory we
  			 * allocate */
  			if (!(capabilities & BDI_CAP_MAP_COPY))
  				return -ENODEV;
  
  			/* we don't permit a private writable mapping to be
  			 * shared with the backing device */
  			if (prot & PROT_WRITE)
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
3c7b20454   Bernd Schmidt   nommu: allow priv...
967
968
969
970
971
972
973
974
975
976
977
978
979
980
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
  			if (((prot & PROT_READ)  && !(capabilities & BDI_CAP_READ_MAP))  ||
  			    ((prot & PROT_WRITE) && !(capabilities & BDI_CAP_WRITE_MAP)) ||
  			    ((prot & PROT_EXEC)  && !(capabilities & BDI_CAP_EXEC_MAP))
  			    ) {
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  				if (flags & MAP_SHARED) {
  					printk(KERN_WARNING
  					       "MAP_SHARED not completely supported on !MMU
  ");
  					return -EINVAL;
  				}
  			}
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
981
982
  		/* handle executable mappings and implied executable
  		 * mappings */
e9536ae72   Josef Sipek   [PATCH] struct pa...
983
  		if (file->f_path.mnt->mnt_flags & MNT_NOEXEC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
  			if (prot & PROT_EXEC)
  				return -EPERM;
  		}
  		else if ((prot & PROT_READ) && !(prot & PROT_EXEC)) {
  			/* handle implication of PROT_EXEC by PROT_READ */
  			if (current->personality & READ_IMPLIES_EXEC) {
  				if (capabilities & BDI_CAP_EXEC_MAP)
  					prot |= PROT_EXEC;
  			}
  		}
  		else if ((prot & PROT_READ) &&
  			 (prot & PROT_EXEC) &&
  			 !(capabilities & BDI_CAP_EXEC_MAP)
  			 ) {
  			/* backing file is not executable, try to copy */
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
  	}
  	else {
  		/* anonymous mappings are always memory backed and can be
  		 * privately mapped
  		 */
  		capabilities = BDI_CAP_MAP_COPY;
  
  		/* handle PROT_EXEC implication by PROT_READ */
  		if ((prot & PROT_READ) &&
  		    (current->personality & READ_IMPLIES_EXEC))
  			prot |= PROT_EXEC;
  	}
  
  	/* allow the security API to have its say */
ed0321895   Eric Paris   security: Protect...
1015
  	ret = security_file_mmap(file, reqprot, prot, flags, addr, 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
  	if (ret < 0)
  		return ret;
  
  	/* looks okay */
  	*_capabilities = capabilities;
  	return 0;
  }
  
  /*
   * we've determined that we can make the mapping, now translate what we
   * now know into VMA flags
   */
  static unsigned long determine_vm_flags(struct file *file,
  					unsigned long prot,
  					unsigned long flags,
  					unsigned long capabilities)
  {
  	unsigned long vm_flags;
  
  	vm_flags = calc_vm_prot_bits(prot) | calc_vm_flag_bits(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1036
1037
1038
1039
  	/* vm_flags |= mm->def_flags; */
  
  	if (!(capabilities & BDI_CAP_MAP_DIRECT)) {
  		/* attempt to share read-only copies of mapped file chunks */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1040
  		vm_flags |= VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1041
1042
  		if (file && !(prot & PROT_WRITE))
  			vm_flags |= VM_MAYSHARE;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1043
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1044
1045
1046
  		/* overlay a shareable mapping on the backing device or inode
  		 * if possible - used for chardevs, ramfs/tmpfs/shmfs and
  		 * romfs/cramfs */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1047
  		vm_flags |= VM_MAYSHARE | (capabilities & BDI_CAP_VMFLAGS);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1048
  		if (flags & MAP_SHARED)
3c7b20454   Bernd Schmidt   nommu: allow priv...
1049
  			vm_flags |= VM_SHARED;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1050
1051
1052
1053
1054
1055
  	}
  
  	/* refuse to let anyone share private mappings with this process if
  	 * it's being traced - otherwise breakpoints set in it may interfere
  	 * with another untraced process
  	 */
a288eecce   Tejun Heo   ptrace: kill triv...
1056
  	if ((flags & MAP_PRIVATE) && current->ptrace)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1057
1058
1059
1060
1061
1062
  		vm_flags &= ~VM_MAYSHARE;
  
  	return vm_flags;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1063
1064
   * set up a shared mapping on a file (the driver or filesystem provides and
   * pins the storage)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1065
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1066
  static int do_mmap_shared_file(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1067
1068
1069
1070
  {
  	int ret;
  
  	ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1071
1072
  	if (ret == 0) {
  		vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1073
  		return 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1074
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1075
1076
  	if (ret != -ENOSYS)
  		return ret;
3fa30460e   David Howells   nommu: fix an inc...
1077
1078
1079
  	/* getting -ENOSYS indicates that direct mmap isn't possible (as
  	 * opposed to tried but failed) so we can only give a suitable error as
  	 * it's not possible to make a private copy if MAP_SHARED was given */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1080
1081
1082
1083
1084
1085
  	return -ENODEV;
  }
  
  /*
   * set up a private mapping or an anonymous shared mapping
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1086
1087
  static int do_mmap_private(struct vm_area_struct *vma,
  			   struct vm_region *region,
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1088
1089
  			   unsigned long len,
  			   unsigned long capabilities)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1090
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1091
  	struct page *pages;
f67d9b157   Bob Liu   nommu: add page a...
1092
  	unsigned long total, point, n;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1093
  	void *base;
8feae1311   David Howells   NOMMU: Make VMAs ...
1094
  	int ret, order;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1095
1096
1097
1098
1099
  
  	/* invoke the file's mapping function so that it can keep track of
  	 * shared mappings on devices or memory
  	 * - VM_MAYSHARE will be set if it may attempt to share
  	 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1100
  	if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1101
  		ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1102
  		if (ret == 0) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1103
  			/* shouldn't return success if we're not sharing */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1104
1105
  			BUG_ON(!(vma->vm_flags & VM_MAYSHARE));
  			vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1106
  			return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1107
  		}
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1108
1109
  		if (ret != -ENOSYS)
  			return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1110
1111
1112
1113
1114
  
  		/* getting an ENOSYS error indicates that direct mmap isn't
  		 * possible (as opposed to tried but failed) so we'll try to
  		 * make a private copy of the data and map that instead */
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1115

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1116
1117
1118
1119
  	/* allocate some memory to hold the mapping
  	 * - note that this may not return a page-aligned address if the object
  	 *   we're allocating is smaller than a page
  	 */
f67d9b157   Bob Liu   nommu: add page a...
1120
  	order = get_order(len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1121
1122
1123
1124
  	kdebug("alloc order %d for %lx", order, len);
  
  	pages = alloc_pages(GFP_KERNEL, order);
  	if (!pages)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1125
  		goto enomem;
8feae1311   David Howells   NOMMU: Make VMAs ...
1126
  	total = 1 << order;
33e5d7697   David Howells   nommu: fix a numb...
1127
  	atomic_long_add(total, &mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
1128

f67d9b157   Bob Liu   nommu: add page a...
1129
  	point = len >> PAGE_SHIFT;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1130
1131
1132
1133
1134
1135
1136
1137
  
  	/* we allocated a power-of-2 sized page set, so we may want to trim off
  	 * the excess */
  	if (sysctl_nr_trim_pages && total - point >= sysctl_nr_trim_pages) {
  		while (total > point) {
  			order = ilog2(total - point);
  			n = 1 << order;
  			kdebug("shave %lu/%lu @%lu", n, total - point, total);
33e5d7697   David Howells   nommu: fix a numb...
1138
  			atomic_long_sub(n, &mmap_pages_allocated);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1139
1140
1141
1142
  			total -= n;
  			set_page_refcounted(pages + total);
  			__free_pages(pages + total, order);
  		}
8feae1311   David Howells   NOMMU: Make VMAs ...
1143
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1144
1145
  	for (point = 1; point < total; point++)
  		set_page_refcounted(&pages[point]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1146

8feae1311   David Howells   NOMMU: Make VMAs ...
1147
1148
1149
  	base = page_address(pages);
  	region->vm_flags = vma->vm_flags |= VM_MAPPED_COPY;
  	region->vm_start = (unsigned long) base;
f67d9b157   Bob Liu   nommu: add page a...
1150
  	region->vm_end   = region->vm_start + len;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1151
  	region->vm_top   = region->vm_start + (total << PAGE_SHIFT);
8feae1311   David Howells   NOMMU: Make VMAs ...
1152
1153
1154
  
  	vma->vm_start = region->vm_start;
  	vma->vm_end   = region->vm_start + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
  
  	if (vma->vm_file) {
  		/* read the contents of a file into the copy */
  		mm_segment_t old_fs;
  		loff_t fpos;
  
  		fpos = vma->vm_pgoff;
  		fpos <<= PAGE_SHIFT;
  
  		old_fs = get_fs();
  		set_fs(KERNEL_DS);
f67d9b157   Bob Liu   nommu: add page a...
1166
  		ret = vma->vm_file->f_op->read(vma->vm_file, base, len, &fpos);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1167
1168
1169
1170
1171
1172
  		set_fs(old_fs);
  
  		if (ret < 0)
  			goto error_free;
  
  		/* clear the last little bit */
f67d9b157   Bob Liu   nommu: add page a...
1173
1174
  		if (ret < len)
  			memset(base + ret, 0, len - ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1175

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1176
1177
1178
1179
1180
  	}
  
  	return 0;
  
  error_free:
7223bb4a8   Namhyung Kim   mm: nommu: fix a ...
1181
  	free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
1182
1183
  	region->vm_start = vma->vm_start = 0;
  	region->vm_end   = vma->vm_end = 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1184
  	region->vm_top   = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1185
1186
1187
  	return ret;
  
  enomem:
05ae6fa31   Greg Ungerer   uclinux: add proc...
1188
1189
1190
  	printk("Allocation of length %lu from process %d (%s) failed
  ",
  	       len, current->pid, current->comm);
7bf02ea22   David Rientjes   arch, mm: filter ...
1191
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
  	return -ENOMEM;
  }
  
  /*
   * handle mapping creation for uClinux
   */
  unsigned long do_mmap_pgoff(struct file *file,
  			    unsigned long addr,
  			    unsigned long len,
  			    unsigned long prot,
  			    unsigned long flags,
  			    unsigned long pgoff)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1205
1206
  	struct vm_area_struct *vma;
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1207
  	struct rb_node *rb;
8feae1311   David Howells   NOMMU: Make VMAs ...
1208
  	unsigned long capabilities, vm_flags, result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1209
  	int ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1210
  	kenter(",%lx,%lx,%lx,%lx,%lx", addr, len, prot, flags, pgoff);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1211
1212
1213
1214
  	/* decide whether we should attempt the mapping, and if so what sort of
  	 * mapping */
  	ret = validate_mmap_request(file, addr, len, prot, flags, pgoff,
  				    &capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1215
1216
  	if (ret < 0) {
  		kleave(" = %d [val]", ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1217
  		return ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1218
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1219

06aab5a30   David Howells   NOMMU: Ignore mma...
1220
1221
  	/* we ignore the address hint */
  	addr = 0;
f67d9b157   Bob Liu   nommu: add page a...
1222
  	len = PAGE_ALIGN(len);
06aab5a30   David Howells   NOMMU: Ignore mma...
1223

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1224
1225
1226
  	/* we've determined that we can make the mapping, now translate what we
  	 * now know into VMA flags */
  	vm_flags = determine_vm_flags(file, prot, flags, capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1227
1228
1229
1230
1231
1232
1233
1234
  	/* we're going to need to record the mapping */
  	region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		goto error_getting_region;
  
  	vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
  	if (!vma)
  		goto error_getting_vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1235

1e2ae599d   David Howells   nommu: struct vm_...
1236
  	region->vm_usage = 1;
8feae1311   David Howells   NOMMU: Make VMAs ...
1237
1238
  	region->vm_flags = vm_flags;
  	region->vm_pgoff = pgoff;
5beb49305   Rik van Riel   mm: change anon_v...
1239
  	INIT_LIST_HEAD(&vma->anon_vma_chain);
8feae1311   David Howells   NOMMU: Make VMAs ...
1240
1241
  	vma->vm_flags = vm_flags;
  	vma->vm_pgoff = pgoff;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1242

8feae1311   David Howells   NOMMU: Make VMAs ...
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
  	if (file) {
  		region->vm_file = file;
  		get_file(file);
  		vma->vm_file = file;
  		get_file(file);
  		if (vm_flags & VM_EXECUTABLE) {
  			added_exe_file_vma(current->mm);
  			vma->vm_mm = current->mm;
  		}
  	}
  
  	down_write(&nommu_region_sem);
  
  	/* if we want to share, we need to check for regions created by other
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1257
  	 * mmap() calls that overlap with our proposed mapping
8feae1311   David Howells   NOMMU: Make VMAs ...
1258
  	 * - we can only share with a superset match on most regular files
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1259
1260
1261
1262
1263
1264
  	 * - shared mappings on character devices and memory backed files are
  	 *   permitted to overlap inexactly as far as we are concerned for in
  	 *   these cases, sharing is handled in the driver or filesystem rather
  	 *   than here
  	 */
  	if (vm_flags & VM_MAYSHARE) {
8feae1311   David Howells   NOMMU: Make VMAs ...
1265
1266
  		struct vm_region *pregion;
  		unsigned long pglen, rpglen, pgend, rpgend, start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1267

8feae1311   David Howells   NOMMU: Make VMAs ...
1268
1269
  		pglen = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
  		pgend = pgoff + pglen;
165b23927   David Howells   [PATCH] NOMMU: ma...
1270

8feae1311   David Howells   NOMMU: Make VMAs ...
1271
1272
  		for (rb = rb_first(&nommu_region_tree); rb; rb = rb_next(rb)) {
  			pregion = rb_entry(rb, struct vm_region, vm_rb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1273

8feae1311   David Howells   NOMMU: Make VMAs ...
1274
  			if (!(pregion->vm_flags & VM_MAYSHARE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1275
1276
1277
  				continue;
  
  			/* search for overlapping mappings on the same file */
8feae1311   David Howells   NOMMU: Make VMAs ...
1278
1279
  			if (pregion->vm_file->f_path.dentry->d_inode !=
  			    file->f_path.dentry->d_inode)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1280
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1281
  			if (pregion->vm_pgoff >= pgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1282
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1283
1284
1285
1286
  			rpglen = pregion->vm_end - pregion->vm_start;
  			rpglen = (rpglen + PAGE_SIZE - 1) >> PAGE_SHIFT;
  			rpgend = pregion->vm_pgoff + rpglen;
  			if (pgoff >= rpgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1287
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1288
1289
1290
1291
1292
  			/* handle inexactly overlapping matches between
  			 * mappings */
  			if ((pregion->vm_pgoff != pgoff || rpglen != pglen) &&
  			    !(pgoff >= pregion->vm_pgoff && pgend <= rpgend)) {
  				/* new mapping is not a subset of the region */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1293
1294
1295
1296
  				if (!(capabilities & BDI_CAP_MAP_DIRECT))
  					goto sharing_violation;
  				continue;
  			}
8feae1311   David Howells   NOMMU: Make VMAs ...
1297
  			/* we've found a region we can share */
1e2ae599d   David Howells   nommu: struct vm_...
1298
  			pregion->vm_usage++;
8feae1311   David Howells   NOMMU: Make VMAs ...
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
  			vma->vm_region = pregion;
  			start = pregion->vm_start;
  			start += (pgoff - pregion->vm_pgoff) << PAGE_SHIFT;
  			vma->vm_start = start;
  			vma->vm_end = start + len;
  
  			if (pregion->vm_flags & VM_MAPPED_COPY) {
  				kdebug("share copy");
  				vma->vm_flags |= VM_MAPPED_COPY;
  			} else {
  				kdebug("share mmap");
  				ret = do_mmap_shared_file(vma);
  				if (ret < 0) {
  					vma->vm_region = NULL;
  					vma->vm_start = 0;
  					vma->vm_end = 0;
1e2ae599d   David Howells   nommu: struct vm_...
1315
  					pregion->vm_usage--;
8feae1311   David Howells   NOMMU: Make VMAs ...
1316
1317
1318
1319
1320
1321
1322
1323
1324
  					pregion = NULL;
  					goto error_just_free;
  				}
  			}
  			fput(region->vm_file);
  			kmem_cache_free(vm_region_jar, region);
  			region = pregion;
  			result = start;
  			goto share;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1325
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1326
1327
1328
1329
  		/* obtain the address at which to make a shared mapping
  		 * - this is the hook for quasi-memory character devices to
  		 *   tell us the location of a shared mapping
  		 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1330
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1331
1332
  			addr = file->f_op->get_unmapped_area(file, addr, len,
  							     pgoff, flags);
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1333
  			if (IS_ERR_VALUE(addr)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1334
  				ret = addr;
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1335
  				if (ret != -ENOSYS)
8feae1311   David Howells   NOMMU: Make VMAs ...
1336
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1337
1338
1339
1340
  
  				/* the driver refused to tell us where to site
  				 * the mapping so we'll have to attempt to copy
  				 * it */
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1341
  				ret = -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1342
  				if (!(capabilities & BDI_CAP_MAP_COPY))
8feae1311   David Howells   NOMMU: Make VMAs ...
1343
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1344
1345
  
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1346
1347
1348
  			} else {
  				vma->vm_start = region->vm_start = addr;
  				vma->vm_end = region->vm_end = addr + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1349
1350
1351
  			}
  		}
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1352
  	vma->vm_region = region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1353

645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1354
1355
1356
  	/* set up the mapping
  	 * - the region is filled in if BDI_CAP_MAP_DIRECT is still set
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1357
  	if (file && vma->vm_flags & VM_SHARED)
8feae1311   David Howells   NOMMU: Make VMAs ...
1358
  		ret = do_mmap_shared_file(vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1359
  	else
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1360
  		ret = do_mmap_private(vma, region, len, capabilities);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1361
  	if (ret < 0)
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1362
1363
  		goto error_just_free;
  	add_nommu_region(region);
8feae1311   David Howells   NOMMU: Make VMAs ...
1364

ea6376395   Jie Zhang   nommu: fix malloc...
1365
1366
1367
1368
  	/* clear anonymous mappings that don't ask for uninitialized data */
  	if (!vma->vm_file && !(flags & MAP_UNINITIALIZED))
  		memset((void *)region->vm_start, 0,
  		       region->vm_end - region->vm_start);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1369
  	/* okay... we have a mapping; now we have to register it */
8feae1311   David Howells   NOMMU: Make VMAs ...
1370
  	result = vma->vm_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1371

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1372
  	current->mm->total_vm += len >> PAGE_SHIFT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1373
1374
  share:
  	add_vma_to_mm(current->mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1375

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1376
1377
1378
1379
1380
1381
  	/* we flush the region from the icache only when the first executable
  	 * mapping of it is made  */
  	if (vma->vm_flags & VM_EXEC && !region->vm_icache_flushed) {
  		flush_icache_range(region->vm_start, region->vm_end);
  		region->vm_icache_flushed = true;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1382

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1383
  	up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1384

8feae1311   David Howells   NOMMU: Make VMAs ...
1385
1386
  	kleave(" = %lx", result);
  	return result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1387

8feae1311   David Howells   NOMMU: Make VMAs ...
1388
1389
1390
  error_just_free:
  	up_write(&nommu_region_sem);
  error:
89a864027   David Howells   NOMMU: Don't pass...
1391
1392
  	if (region->vm_file)
  		fput(region->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1393
  	kmem_cache_free(vm_region_jar, region);
89a864027   David Howells   NOMMU: Don't pass...
1394
1395
  	if (vma->vm_file)
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
  	if (vma->vm_flags & VM_EXECUTABLE)
  		removed_exe_file_vma(vma->vm_mm);
  	kmem_cache_free(vm_area_cachep, vma);
  	kleave(" = %d", ret);
  	return ret;
  
  sharing_violation:
  	up_write(&nommu_region_sem);
  	printk(KERN_WARNING "Attempt to share mismatched mappings
  ");
  	ret = -EINVAL;
  	goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1408

8feae1311   David Howells   NOMMU: Make VMAs ...
1409
1410
1411
1412
1413
  error_getting_vma:
  	kmem_cache_free(vm_region_jar, region);
  	printk(KERN_WARNING "Allocation of vma for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1414
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1415
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1416
  	return -ENOMEM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1417
1418
1419
1420
  error_getting_region:
  	printk(KERN_WARNING "Allocation of vm region for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1421
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1422
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1423
1424
  	return -ENOMEM;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1425
  EXPORT_SYMBOL(do_mmap_pgoff);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1426

66f0dc481   Hugh Dickins   mm: move sys_mmap...
1427
1428
1429
1430
1431
1432
  /*
   * mmap_pgoff system call.
   *
   * Unless MAP_ANONYMOUS is set, @fd is resolved to a file with fget() and the
   * call fails with -EBADF if that lookup fails.  MAP_EXECUTABLE and
   * MAP_DENYWRITE are stripped from @flags before the request is handed to
   * do_mmap_pgoff() under the caller's mmap_sem (held for writing).
   *
   * Returns whatever do_mmap_pgoff() returns, or -EBADF as described above.
   */
  SYSCALL_DEFINE6(mmap_pgoff, unsigned long, addr, unsigned long, len,
  		unsigned long, prot, unsigned long, flags,
  		unsigned long, fd, unsigned long, pgoff)
  {
  	struct file *file = NULL;
  	unsigned long retval = -EBADF;
  
  	audit_mmap_fd(fd, flags);
  	if (!(flags & MAP_ANONYMOUS)) {
  		file = fget(fd);
  		if (!file)
  			goto out;
  	}
  
  	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);
  
  	down_write(&current->mm->mmap_sem);
  	retval = do_mmap_pgoff(file, addr, len, prot, flags, pgoff);
  	up_write(&current->mm->mmap_sem);
  
  	/* balance the fget() above; only reached with a file if it succeeded */
  	if (file)
  		fput(file);
  out:
  	return retval;
  }
a4679373c   Christoph Hellwig   Add generic sys_o...
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
  #ifdef __ARCH_WANT_SYS_OLD_MMAP
  /* argument block that the old_mmap system call copies in from userspace */
  struct mmap_arg_struct {
  	unsigned long addr;
  	unsigned long len;
  	unsigned long prot;
  	unsigned long flags;
  	unsigned long fd;
  	unsigned long offset;
  };
  
  /*
   * old_mmap system call: all arguments arrive packed in a single userspace
   * structure and the file offset is expressed in bytes.
   *
   * Returns -EFAULT if the structure cannot be copied in, -EINVAL if the
   * offset is not page aligned, otherwise the result of sys_mmap_pgoff().
   */
  SYSCALL_DEFINE1(old_mmap, struct mmap_arg_struct __user *, arg)
  {
  	struct mmap_arg_struct args;
  	unsigned long pgoff;
  
  	if (copy_from_user(&args, arg, sizeof(args)) != 0)
  		return -EFAULT;
  
  	/* the byte offset has to be a whole number of pages */
  	if ((args.offset & ~PAGE_MASK) != 0)
  		return -EINVAL;
  
  	pgoff = args.offset >> PAGE_SHIFT;
  	return sys_mmap_pgoff(args.addr, args.len, args.prot, args.flags,
  			      args.fd, pgoff);
  }
  #endif /* __ARCH_WANT_SYS_OLD_MMAP */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1474
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1475
1476
   * split a vma into two pieces at address 'addr', a new vma is allocated either
   * for the first part or the tail.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1477
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1478
1479
  int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
  	      unsigned long addr, int new_below)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1480
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1481
1482
1483
  	struct vm_area_struct *new;
  	struct vm_region *region;
  	unsigned long npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1484

8feae1311   David Howells   NOMMU: Make VMAs ...
1485
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1486

779c10232   David Howells   nommu: remove a s...
1487
1488
1489
  	/* we're only permitted to split anonymous regions (these should have
  	 * only a single usage on the region) */
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
1490
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1491

8feae1311   David Howells   NOMMU: Make VMAs ...
1492
1493
  	if (mm->map_count >= sysctl_max_map_count)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1494

8feae1311   David Howells   NOMMU: Make VMAs ...
1495
1496
1497
  	region = kmem_cache_alloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1498

8feae1311   David Howells   NOMMU: Make VMAs ...
1499
1500
1501
1502
1503
1504
1505
1506
1507
1508
1509
1510
1511
1512
  	new = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
  	if (!new) {
  		kmem_cache_free(vm_region_jar, region);
  		return -ENOMEM;
  	}
  
  	/* most fields are the same, copy all, and then fixup */
  	*new = *vma;
  	*region = *vma->vm_region;
  	new->vm_region = region;
  
  	npages = (addr - vma->vm_start) >> PAGE_SHIFT;
  
  	if (new_below) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1513
  		region->vm_top = region->vm_end = new->vm_end = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1514
1515
1516
  	} else {
  		region->vm_start = new->vm_start = addr;
  		region->vm_pgoff = new->vm_pgoff += npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1517
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1518
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
  
  	if (new->vm_ops && new->vm_ops->open)
  		new->vm_ops->open(new);
  
  	delete_vma_from_mm(vma);
  	down_write(&nommu_region_sem);
  	delete_nommu_region(vma->vm_region);
  	if (new_below) {
  		vma->vm_region->vm_start = vma->vm_start = addr;
  		vma->vm_region->vm_pgoff = vma->vm_pgoff += npages;
  	} else {
  		vma->vm_region->vm_end = vma->vm_end = addr;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1530
  		vma->vm_region->vm_top = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1531
1532
1533
1534
1535
1536
1537
  	}
  	add_nommu_region(vma->vm_region);
  	add_nommu_region(new->vm_region);
  	up_write(&nommu_region_sem);
  	add_vma_to_mm(mm, vma);
  	add_vma_to_mm(mm, new);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1538
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1539
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1540
1541
   * shrink a VMA by removing the specified chunk from either the beginning or
   * the end
3034097a5   David Howells   [PATCH] NOMMU: Or...
1542
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1543
1544
1545
  static int shrink_vma(struct mm_struct *mm,
  		      struct vm_area_struct *vma,
  		      unsigned long from, unsigned long to)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1546
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1547
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1548

8feae1311   David Howells   NOMMU: Make VMAs ...
1549
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1550

8feae1311   David Howells   NOMMU: Make VMAs ...
1551
1552
1553
1554
1555
1556
1557
1558
  	/* adjust the VMA's pointers, which may reposition it in the MM's tree
  	 * and list */
  	delete_vma_from_mm(vma);
  	if (from > vma->vm_start)
  		vma->vm_end = from;
  	else
  		vma->vm_start = to;
  	add_vma_to_mm(mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1559

8feae1311   David Howells   NOMMU: Make VMAs ...
1560
1561
  	/* cut the backing region down to size */
  	region = vma->vm_region;
1e2ae599d   David Howells   nommu: struct vm_...
1562
  	BUG_ON(region->vm_usage != 1);
8feae1311   David Howells   NOMMU: Make VMAs ...
1563
1564
1565
  
  	down_write(&nommu_region_sem);
  	delete_nommu_region(region);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1566
1567
1568
1569
  	if (from > region->vm_start) {
  		to = region->vm_top;
  		region->vm_top = region->vm_end = from;
  	} else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1570
  		region->vm_start = to;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1571
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1572
1573
1574
1575
1576
1577
  	add_nommu_region(region);
  	up_write(&nommu_region_sem);
  
  	free_page_series(from, to);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1578

8feae1311   David Howells   NOMMU: Make VMAs ...
1579
1580
1581
1582
1583
1584
1585
1586
  /*
   * release a mapping
   * - under NOMMU conditions the chunk to be unmapped must be backed by a single
   *   VMA, though it need not cover the whole VMA
   *
   * @mm:    address space to unmap from
   * @start: first address of the chunk
   * @len:   length of the chunk in bytes; rounded up to a whole page
   *
   * Returns 0 on success, -EINVAL if the range is empty, wraps around the end
   * of the address space, is not mapped or does not satisfy the rules below,
   * or the error returned by split_vma().
   */
  int do_munmap(struct mm_struct *mm, unsigned long start, size_t len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end;
  	int ret;
  
  	kenter(",%lx,%zx", start, len);
  
  	len = PAGE_ALIGN(len);
  	if (len == 0)
  		return -EINVAL;
  
  	end = start + len;
  
  	/* a range that wraps past the top of the address space can never
  	 * describe a real mapping, and a wrapped 'end' would slip through the
  	 * subset checks below and let shrink_vma() move vm_start downwards */
  	if (end < start) {
  		kleave(" = -EINVAL [wrap]");
  		return -EINVAL;
  	}
  
  	/* find the first potentially overlapping VMA */
  	vma = find_vma(mm, start);
  	if (!vma) {
  		/* only the first few offenders are reported */
  		static int limit = 0;
  		if (limit < 5) {
  			printk(KERN_WARNING
  			       "munmap of memory not mmapped by process %d"
  			       " (%s): 0x%lx-0x%lx\n",
  			       current->pid, current->comm,
  			       start, start + len - 1);
  			limit++;
  		}
  		return -EINVAL;
  	}
  
  	/* we're allowed to split an anonymous VMA but not a file-backed one */
  	if (vma->vm_file) {
  		/* walk the following VMAs looking for one that ends exactly
  		 * at 'end' and does not start above 'start' */
  		do {
  			if (start > vma->vm_start) {
  				kleave(" = -EINVAL [miss]");
  				return -EINVAL;
  			}
  			if (end == vma->vm_end)
  				goto erase_whole_vma;
  			vma = vma->vm_next;
  		} while (vma);
  		kleave(" = -EINVAL [split file]");
  		return -EINVAL;
  	} else {
  		/* the chunk must be a subset of the VMA found */
  		if (start == vma->vm_start && end == vma->vm_end)
  			goto erase_whole_vma;
  		if (start < vma->vm_start || end > vma->vm_end) {
  			kleave(" = -EINVAL [superset]");
  			return -EINVAL;
  		}
  		if (start & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned start]");
  			return -EINVAL;
  		}
  		if (end != vma->vm_end && end & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned split]");
  			return -EINVAL;
  		}
  		/* a hole in the middle needs the VMA splitting first so that
  		 * the chunk sits at the start of the remaining VMA */
  		if (start != vma->vm_start && end != vma->vm_end) {
  			ret = split_vma(mm, vma, start, 1);
  			if (ret < 0) {
  				kleave(" = %d [split]", ret);
  				return ret;
  			}
  		}
  		return shrink_vma(mm, vma, start, end);
  	}
  
  erase_whole_vma:
  	delete_vma_from_mm(vma);
  	delete_vma(mm, vma);
  	kleave(" = 0");
  	return 0;
  }
  EXPORT_SYMBOL(do_munmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1659

6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1660
  /*
   * munmap system call: run do_munmap() on the current process's address space
   * with its mmap_sem held for writing, and return do_munmap()'s result.
   */
  SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
  {
  	int ret;
  	struct mm_struct *mm = current->mm;
  
  	down_write(&mm->mmap_sem);
  	ret = do_munmap(mm, addr, len);
  	up_write(&mm->mmap_sem);
  	return ret;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1672
   * release all the mappings made in a process's VM space
3034097a5   David Howells   [PATCH] NOMMU: Or...
1673
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1674
  void exit_mmap(struct mm_struct *mm)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1675
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1676
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1677

8feae1311   David Howells   NOMMU: Make VMAs ...
1678
1679
  	if (!mm)
  		return;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1680

8feae1311   David Howells   NOMMU: Make VMAs ...
1681
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1682

8feae1311   David Howells   NOMMU: Make VMAs ...
1683
  	mm->total_vm = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1684

8feae1311   David Howells   NOMMU: Make VMAs ...
1685
1686
1687
1688
  	while ((vma = mm->mmap)) {
  		mm->mmap = vma->vm_next;
  		delete_vma_from_mm(vma);
  		delete_vma(mm, vma);
04c349615   Steven J. Magnani   nommu: yield CPU ...
1689
  		cond_resched();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1690
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1691
1692
  
  	kleave("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1693
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1694
1695
1696
1697
1698
1699
  /*
   * Stub: this implementation never extends the break.  Both arguments are
   * ignored and -ENOMEM (converted to unsigned long) is always returned.
   */
  unsigned long do_brk(unsigned long addr, unsigned long len)
  {
  	const long err = -ENOMEM;
  
  	return err;
  }
  
  /*
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1700
1701
   * expand (or shrink) an existing mapping, potentially moving it at the same
   * time (controlled by the MREMAP_MAYMOVE flag and available VM space)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1702
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1703
   * under NOMMU conditions, we only permit changing a mapping's size, and only
8feae1311   David Howells   NOMMU: Make VMAs ...
1704
1705
   * as long as it stays within the region allocated by do_mmap_private() and the
   * block is not shareable
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1706
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1707
   * MREMAP_FIXED is not supported under NOMMU conditions
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1708
1709
1710
1711
1712
   */
  unsigned long do_mremap(unsigned long addr,
  			unsigned long old_len, unsigned long new_len,
  			unsigned long flags, unsigned long new_addr)
  {
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1713
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1714
1715
  
  	/* insanity checks first */
f67d9b157   Bob Liu   nommu: add page a...
1716
1717
  	old_len = PAGE_ALIGN(old_len);
  	new_len = PAGE_ALIGN(new_len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1718
  	if (old_len == 0 || new_len == 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1719
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1720
1721
  	if (addr & ~PAGE_MASK)
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1722
1723
  	if (flags & MREMAP_FIXED && new_addr != addr)
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1724
  	vma = find_vma_exact(current->mm, addr, old_len);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1725
1726
  	if (!vma)
  		return (unsigned long) -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1727

6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1728
  	if (vma->vm_end != vma->vm_start + old_len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1729
  		return (unsigned long) -EFAULT;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1730
  	if (vma->vm_flags & VM_MAYSHARE)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1731
  		return (unsigned long) -EPERM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1732
  	if (new_len > vma->vm_region->vm_end - vma->vm_region->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1733
1734
1735
  		return (unsigned long) -ENOMEM;
  
  	/* all checks complete - do it */
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1736
  	vma->vm_end = vma->vm_start + new_len;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1737
1738
  	return vma->vm_start;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1739
  EXPORT_SYMBOL(do_mremap);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1740

6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1741
1742
1743
  /*
   * mremap system call: run do_mremap() with the current process's mmap_sem
   * held for writing and return its result.
   */
  SYSCALL_DEFINE5(mremap, unsigned long, addr, unsigned long, old_len,
  		unsigned long, new_len, unsigned long, flags,
  		unsigned long, new_addr)
  {
  	unsigned long ret;
  
  	down_write(&current->mm->mmap_sem);
  	ret = do_mremap(addr, old_len, new_len, flags, new_addr);
  	up_write(&current->mm->mmap_sem);
  	return ret;
  }
6aab341e0   Linus Torvalds   mm: re-architect ...
1752
  /* Stub: no page lookup is performed; NULL is returned for every request. */
  struct page *follow_page(struct vm_area_struct *vma, unsigned long address,
  			unsigned int foll_flags)
  {
  	return NULL;
  }
8f3b1327a   Bob Liu   mm/nommu.c: fix r...
1757
1758
  /*
   * Nothing is actually remapped here: the call succeeds only when @addr
   * already equals the address of @pfn (pfn << PAGE_SHIFT), in which case the
   * VMA is flagged VM_IO | VM_RESERVED | VM_PFNMAP.  @size and @prot are
   * not used.
   *
   * Returns 0 on success or -EINVAL if @addr does not match @pfn.
   */
  int remap_pfn_range(struct vm_area_struct *vma, unsigned long addr,
  		unsigned long pfn, unsigned long size, pgprot_t prot)
  {
  	if (addr != (pfn << PAGE_SHIFT))
  		return -EINVAL;
  
  	vma->vm_flags |= VM_IO | VM_RESERVED | VM_PFNMAP;
  	return 0;
  }
  EXPORT_SYMBOL(remap_pfn_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1767

f905bc447   Paul Mundt   nommu: add new vm...
1768
1769
1770
1771
1772
1773
1774
1775
1776
1777
1778
1779
1780
1781
  /*
   * Point a VMA at an existing buffer: the VMA keeps its length but its start
   * is moved to @addr plus @pgoff pages.
   *
   * Returns 0 on success or -EINVAL if the VMA does not have VM_USERMAP set.
   */
  int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
  			unsigned long pgoff)
  {
  	/* vm_start/vm_end are unsigned long; keep the full width so that a
  	 * mapping of 4GiB or more is not truncated on 64-bit builds */
  	unsigned long size = vma->vm_end - vma->vm_start;
  
  	if (!(vma->vm_flags & VM_USERMAP))
  		return -EINVAL;
  
  	vma->vm_start = (unsigned long)(addr + (pgoff << PAGE_SHIFT));
  	vma->vm_end = vma->vm_start + size;
  
  	return 0;
  }
  EXPORT_SYMBOL(remap_vmalloc_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1782
1783
1784
1785
1786
  /*
   * Stub: no address is ever chosen.  All arguments are ignored and -ENOMEM
   * (converted to unsigned long) is always returned.
   */
  unsigned long arch_get_unmapped_area(struct file *file, unsigned long addr,
  	unsigned long len, unsigned long pgoff, unsigned long flags)
  {
  	const long err = -ENOMEM;
  
  	return err;
  }
1363c3cd8   Wolfgang Wander   [PATCH] Avoiding ...
1787
  /* Stub: intentionally empty; both arguments are ignored. */
  void arch_unmap_area(struct mm_struct *mm, unsigned long addr)
  {
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1790
1791
1792
1793
1794
  /* Stub: intentionally empty; all arguments are ignored. */
  void unmap_mapping_range(struct address_space *mapping,
  			 loff_t const holebegin, loff_t const holelen,
  			 int even_cows)
  {
  }
  EXPORT_SYMBOL(unmap_mapping_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1796
1797
1798
1799
1800
1801
1802
1803
1804
1805
1806
1807
1808
1809
1810
1811
1812
  
  /*
   * Check that a process has enough memory to allocate a new virtual
   * mapping. 0 means there is enough memory for the allocation to
   * succeed and -ENOMEM implies there is not.
   *
   * We currently support three overcommit policies, which are set via the
   * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting
   *
   * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
   * Additional code 2002 Jul 20 by Robert Love.
   *
   * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
   *
   * Note this is a helper function intended to be used by LSMs which
   * wish to use this logic.
   */
34b4e4aa3   Alan Cox   fix NULL pointer ...
1813
  int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1814
1815
1816
1817
1818
1819
1820
1821
1822
1823
1824
1825
  {
  	unsigned long free, allowed;
  
  	vm_acct_memory(pages);
  
  	/*
  	 * Sometimes we want to use more memory than we have
  	 */
  	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
  		return 0;
  
  	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
c15bef309   Dmitry Fink   mmap: fix and tid...
1826
1827
1828
1829
1830
1831
1832
1833
1834
1835
  		free = global_page_state(NR_FREE_PAGES);
  		free += global_page_state(NR_FILE_PAGES);
  
  		/*
  		 * shmem pages shouldn't be counted as free in this
  		 * case, they can't be purged, only swapped out, and
  		 * that won't affect the overall amount of available
  		 * memory in the system.
  		 */
  		free -= global_page_state(NR_SHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1836

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1837
1838
1839
1840
1841
1842
1843
1844
  		free += nr_swap_pages;
  
  		/*
  		 * Any slabs which are created with the
  		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
  		 * which are reclaimable, under pressure.  The dentry
  		 * cache and most inode caches should fall into this
  		 */
972d1a7b1   Christoph Lameter   [PATCH] ZVC: Supp...
1845
  		free += global_page_state(NR_SLAB_RECLAIMABLE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1846
1847
  
  		/*
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1848
1849
  		 * Leave reserved pages. The pages are not for anonymous pages.
  		 */
c15bef309   Dmitry Fink   mmap: fix and tid...
1850
  		if (free <= totalreserve_pages)
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1851
1852
  			goto error;
  		else
c15bef309   Dmitry Fink   mmap: fix and tid...
1853
  			free -= totalreserve_pages;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1854
1855
1856
1857
  
  		/*
  		 * Leave the last 3% for root
  		 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1858
  		if (!cap_sys_admin)
c15bef309   Dmitry Fink   mmap: fix and tid...
1859
  			free -= free / 32;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1860
1861
1862
  
  		if (free > pages)
  			return 0;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1863
1864
  
  		goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1865
1866
1867
1868
1869
1870
1871
1872
1873
1874
1875
1876
  	}
  
  	allowed = totalram_pages * sysctl_overcommit_ratio / 100;
  	/*
  	 * Leave the last 3% for root
  	 */
  	if (!cap_sys_admin)
  		allowed -= allowed / 32;
  	allowed += total_swap_pages;
  
  	/* Don't let a single process grow too big:
  	   leave 3% of the size of this process for other processes */
731572d39   Alan Cox   nfsd: fix vm over...
1877
1878
  	if (mm)
  		allowed -= mm->total_vm / 32;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1879

00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1880
  	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1881
  		return 0;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1882

d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1883
  error:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1884
1885
1886
1887
  	vm_unacct_memory(pages);
  
  	return -ENOMEM;
  }
cae5d3903   Stephen Wilson   mm: arch: rename ...
1888
  /* Stub: reports every address as being outside a gate area (returns 0). */
  int in_gate_area_no_mm(unsigned long addr)
  {
  	return 0;
  }
b0e15190e   David Howells   [PATCH] NOMMU: Ma...
1892

d0217ac04   Nick Piggin   mm: fault feedbac...
1893
  /*
   * Stub: this handler is not expected to be called in this configuration, so
   * reaching it triggers BUG().  The return statement only satisfies the
   * function's signature.
   */
  int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();
  	return 0;
  }
  EXPORT_SYMBOL(filemap_fault);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1899

f55f199b7   Mike Frysinger   NOMMU: implement ...
1900
1901
  static int __access_remote_vm(struct task_struct *tsk, struct mm_struct *mm,
  		unsigned long addr, void *buf, int len, int write)
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1902
  {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1903
  	struct vm_area_struct *vma;
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1904
1905
1906
1907
  
  	down_read(&mm->mmap_sem);
  
  	/* the access must start within one of the target process's mappings */
0159b141d   David Howells   [PATCH] NOMMU: Us...
1908
1909
  	vma = find_vma(mm, addr);
  	if (vma) {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1910
1911
1912
1913
1914
  		/* don't overrun this mapping */
  		if (addr + len >= vma->vm_end)
  			len = vma->vm_end - addr;
  
  		/* only read or write mappings where it is permitted */
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1915
  		if (write && vma->vm_flags & VM_MAYWRITE)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1916
1917
  			copy_to_user_page(vma, NULL, addr,
  					 (void *) addr, buf, len);
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1918
  		else if (!write && vma->vm_flags & VM_MAYREAD)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1919
1920
  			copy_from_user_page(vma, NULL, addr,
  					    buf, (void *) addr, len);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1921
1922
1923
1924
1925
1926
1927
  		else
  			len = 0;
  	} else {
  		len = 0;
  	}
  
  	up_read(&mm->mmap_sem);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1928
1929
1930
1931
1932
1933
1934
1935
1936
1937
1938
1939
1940
1941
1942
1943
1944
1945
1946
1947
1948
1949
1950
1951
1952
1953
1954
1955
1956
1957
1958
1959
1960
1961
1962
1963
  
  	return len;
  }
  
  /**
   * access_remote_vm - access another process' address space
   * @mm:		the mm_struct of the target address space
   * @addr:	start address to access
   * @buf:	source or destination buffer
   * @len:	number of bytes to transfer
   * @write:	whether the access is a write
   *
   * Thin wrapper that forwards to __access_remote_vm() with no task and
   * returns its result.
   *
   * The caller must hold a reference on @mm.
   */
  int access_remote_vm(struct mm_struct *mm, unsigned long addr,
  		void *buf, int len, int write)
  {
  	int copied;
  
  	copied = __access_remote_vm(NULL, mm, addr, buf, len, write);
  	return copied;
  }
  
  /*
   * Access another process' address space.
   * - source/target buffer must be kernel space
   *
   * A reference on the task's mm is taken with get_task_mm() for the duration
   * of the access and dropped with mmput() afterwards.
   *
   * Returns the value of __access_remote_vm(), or 0 if @addr + @len wraps
   * around or the task has no mm.
   */
  int access_process_vm(struct task_struct *tsk, unsigned long addr, void *buf, int len, int write)
  {
  	struct mm_struct *mm;
  
  	/* refuse ranges that wrap around the end of the address space */
  	if (addr + len < addr)
  		return 0;
  
  	mm = get_task_mm(tsk);
  	if (!mm)
  		return 0;
  
  	len = __access_remote_vm(tsk, mm, addr, buf, len, write);
  
  	mmput(mm);
  	return len;
  }
7e6608724   David Howells   nommu: fix shared...
1967
1968
1969
1970
1971
1972
1973
1974
1975
1976
1977
1978
1979
1980
1981
1982
1983
1984
1985
1986
1987
1988
1989
1990
1991
1992
1993
1994
1995
1996
1997
1998
1999
2000
2001
2002
2003
2004
2005
2006
2007
2008
2009
2010
2011
2012
2013
2014
2015
2016
2017
2018
2019
2020
2021
2022
2023
2024
2025
2026
2027
2028
  
  /**
   * nommu_shrink_inode_mappings - Shrink the shared mappings on an inode
   * @inode: The inode to check
   * @size: The current filesize of the inode
   * @newsize: The proposed filesize of the inode
   *
   * Check the shared mappings on an inode on behalf of a shrinking truncate to
   * make sure that any outstanding VMAs aren't broken, and then shrink the
   * vm_regions that extend beyond the new size so that do_mmap_pgoff() doesn't
   * automatically grant mappings that are too large.
   *
   * Returns 0 on success, or -ETXTBSY if a shared VMA overlaps the part of the
   * file that is about to be removed.
   */
  int nommu_shrink_inode_mappings(struct inode *inode, size_t size,
  				size_t newsize)
  {
  	struct vm_area_struct *vma;
  	struct prio_tree_iter iter;
  	struct vm_region *region;
  	pgoff_t dead_first, dead_last;
  	size_t span, file_end;
  	int ret = 0;
  
  	/* page range [dead_first, dead_last] is what the truncate removes */
  	dead_first = newsize >> PAGE_SHIFT;
  	dead_last = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
  
  	down_write(&nommu_region_sem);
  
  	/* a shared mapping (out of the page cache) that reaches into the dead
  	 * zone vetoes the truncate */
  	vma_prio_tree_foreach(vma, &iter, &inode->i_mapping->i_mmap,
  			      dead_first, dead_last) {
  		if (vma->vm_flags & VM_SHARED) {
  			ret = -ETXTBSY; /* not quite true, but near enough */
  			goto unlock;
  		}
  	}
  
  	/* trim any regions that overlap the dead zone - if such regions exist
  	 * they are referenced by VMAs that do not themselves overlap it
  	 *
  	 * regions that start beyond the EOF are not looked for as there
  	 * shouldn't be any
  	 */
  	vma_prio_tree_foreach(vma, &iter, &inode->i_mapping->i_mmap,
  			      0, ULONG_MAX) {
  		if (!(vma->vm_flags & VM_SHARED))
  			continue;
  
  		region = vma->vm_region;
  		span = region->vm_top - region->vm_start;
  		file_end = (region->vm_pgoff << PAGE_SHIFT) + span;
  		if (file_end <= newsize)
  			continue;
  
  		/* pull the top of the region back to the new end of file and
  		 * keep vm_end from sticking out above it */
  		region->vm_top -= file_end - newsize;
  		if (region->vm_end > region->vm_top)
  			region->vm_end = region->vm_top;
  	}
  
  unlock:
  	up_write(&nommu_region_sem);
  	return ret;
  }