Blame view

mm/nommu.c 50.7 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
  /*
   *  linux/mm/nommu.c
   *
   *  Replacement code for mm functions to support CPU's that don't
   *  have any form of memory management unit (thus no virtual memory).
   *
   *  See Documentation/nommu-mmap.txt
   *
8feae1311   David Howells   NOMMU: Make VMAs ...
9
   *  Copyright (c) 2004-2008 David Howells <dhowells@redhat.com>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
12
   *  Copyright (c) 2000-2003 David McCullough <davidm@snapgear.com>
   *  Copyright (c) 2000-2001 D Jeff Dionne <jeff@uClinux.org>
   *  Copyright (c) 2002      Greg Ungerer <gerg@snapgear.com>
29c185e5c   Paul Mundt   nommu: Provide st...
13
   *  Copyright (c) 2007-2010 Paul Mundt <lethal@linux-sh.org>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
14
   */
f2b8544f5   David Howells   NOMMU: mm/nommu.c...
15
  #include <linux/module.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
16
17
18
19
20
21
22
23
  #include <linux/mm.h>
  #include <linux/mman.h>
  #include <linux/swap.h>
  #include <linux/file.h>
  #include <linux/highmem.h>
  #include <linux/pagemap.h>
  #include <linux/slab.h>
  #include <linux/vmalloc.h>
fa8e26ccd   Roland McGrath   tracehook: traceh...
24
  #include <linux/tracehook.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
25
26
27
28
29
30
  #include <linux/blkdev.h>
  #include <linux/backing-dev.h>
  #include <linux/mount.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
120a795da   Al Viro   audit mmap
31
  #include <linux/audit.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
32
33
34
35
  
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
  #include <asm/tlbflush.h>
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
36
  #include <asm/mmu_context.h>
8feae1311   David Howells   NOMMU: Make VMAs ...
37
  #include "internal.h"
8feae1311   David Howells   NOMMU: Make VMAs ...
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
  /*
   * Local tracing helpers.  With "#if 0" the messages are compiled out but
   * still handed to no_printk() so the format arguments stay type-checked;
   * flip the condition to route them to printk() instead.
   * Every format string ends in an explicit "\n" escape.
   */
  #if 0
  #define kenter(FMT, ...) \
  	printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	printk(KERN_DEBUG "xxx" FMT"yyy\n", ##__VA_ARGS__)
  #else
  #define kenter(FMT, ...) \
  	no_printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	no_printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	no_printk(KERN_DEBUG FMT"\n", ##__VA_ARGS__)
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
59
60
61
62
63
  
  void *high_memory;
  struct page *mem_map;
  unsigned long max_mapnr;
  unsigned long num_physpages;
4266c97a3   Hugh Dickins   nommu: fix two bu...
64
  unsigned long highest_memmap_pfn;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
65
  struct percpu_counter vm_committed_as;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
66
67
68
  int sysctl_overcommit_memory = OVERCOMMIT_GUESS; /* heuristic overcommit */
  int sysctl_overcommit_ratio = 50; /* default is 50% */
  int sysctl_max_map_count = DEFAULT_MAX_MAP_COUNT;
fc4d5c292   David Howells   nommu: make the i...
69
  int sysctl_nr_trim_pages = CONFIG_NOMMU_INITIAL_TRIM_EXCESS;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
70
  int heap_stack_gap = 0;
33e5d7697   David Howells   nommu: fix a numb...
71
  atomic_long_t mmap_pages_allocated;
8feae1311   David Howells   NOMMU: Make VMAs ...
72

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
73
  EXPORT_SYMBOL(mem_map);
6a04de6db   Wu, Bryan   [PATCH] nommu: fi...
74
  EXPORT_SYMBOL(num_physpages);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
75

8feae1311   David Howells   NOMMU: Make VMAs ...
76
77
78
79
  /* list of mapped, potentially shareable regions */
  static struct kmem_cache *vm_region_jar;
  struct rb_root nommu_region_tree = RB_ROOT;
  DECLARE_RWSEM(nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
80

f0f37e2f7   Alexey Dobriyan   const: mark struc...
81
  const struct vm_operations_struct generic_file_vm_ops = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
82
83
84
  };
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
85
86
87
88
89
90
91
92
   * Return the total memory allocated for this pointer, not
   * just what the caller asked for.
   *
   * Doesn't have to be accurate, i.e. may have races.
   */
  unsigned int kobjsize(const void *objp)
  {
  	struct page *page;
4016a1390   Michael Hennerich   mm/nommu.c: retur...
93
94
95
96
  	/*
  	 * If the object we have should not have ksize performed on it,
  	 * return size of 0
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
97
  	if (!objp || !virt_addr_valid(objp))
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
98
99
100
  		return 0;
  
  	/* every check below is made against the head page of objp's page */
  	page = virt_to_head_page(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
101
102
103
104
105
  
  	/*
  	 * If the allocator sets PageSlab, we know the pointer came from
  	 * kmalloc().
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
106
107
  	if (PageSlab(page))
  		return ksize(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
108
  	/*
ab2e83ead   Paul Mundt   NOMMU: Teach kobj...
109
110
111
112
113
114
115
116
117
118
119
120
121
122
  	 * If it's not a compound page, see if we have a matching VMA
  	 * region. This test is intentionally done in reverse order,
  	 * so if there's no VMA, we still fall through and hand back
  	 * PAGE_SIZE for 0-order pages.
  	 */
  	if (!PageCompound(page)) {
  		struct vm_area_struct *vma;
  
  		vma = find_vma(current->mm, (unsigned long)objp);
  		/* report the full length of the VMA that find_vma() returned */
  		if (vma)
  			return vma->vm_end - vma->vm_start;
  	}
  
  	/*
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
123
  	 * The ksize() function is only guaranteed to work for pointers
5a1603be5   Paul Mundt   nommu: Correct ko...
124
  	 * returned by kmalloc(). So handle arbitrary pointers here.
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
125
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
126
  	return PAGE_SIZE << compound_order(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
127
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
128
  /*
   * Walk up to @nr_pages pages of @mm starting at @start.  For each page the
   * covering VMA is looked up with find_vma() and checked against the
   * permissions derived from @foll_flags; if @pages is given the page is
   * recorded and a reference is taken with page_cache_get(), and if @vmas is
   * given the VMA is recorded.
   *
   * Returns the number of pages processed; if the walk stops before the first
   * page is processed, -EFAULT is returned instead.  @tsk and @retry are not
   * referenced by this implementation.
   */
  int __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
4266c97a3   Hugh Dickins   nommu: fix two bu...
129
  		     unsigned long start, int nr_pages, unsigned int foll_flags,
53a7706d5   Michel Lespinasse   mlock: do not hol...
130
131
  		     struct page **pages, struct vm_area_struct **vmas,
  		     int *retry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
132
  {
910e46da4   Sonic Zhang   [PATCH] Check if ...
133
  	struct vm_area_struct *vma;
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
134
135
136
137
  	unsigned long vm_flags;
  	int i;
  
  	/* calculate required read or write permissions.
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
138
  	 * If FOLL_FORCE is set, we only require the "MAY" flags.
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
139
  	 */
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
140
141
142
143
  	vm_flags  = (foll_flags & FOLL_WRITE) ?
  			(VM_WRITE | VM_MAYWRITE) : (VM_READ | VM_MAYREAD);
  	vm_flags &= (foll_flags & FOLL_FORCE) ?
  			(VM_MAYREAD | VM_MAYWRITE) : (VM_READ | VM_WRITE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
144

9d73777e5   Peter Zijlstra   clarify get_user_...
145
  	for (i = 0; i < nr_pages; i++) {
7561e8ca0   David Howells   NOMMU: Revert 'no...
146
  		vma = find_vma(mm, start);
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
147
148
149
150
  		if (!vma)
  			goto finish_or_fault;
  
  		/* protect what we can, including chardevs */
1c3aff1ce   Hugh Dickins   mm: remove unused...
151
152
  		if ((vma->vm_flags & (VM_IO | VM_PFNMAP)) ||
  		    !(vm_flags & vma->vm_flags))
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
153
  			goto finish_or_fault;
910e46da4   Sonic Zhang   [PATCH] Check if ...
154

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
155
156
157
158
159
160
  		if (pages) {
  			pages[i] = virt_to_page(start);
  			if (pages[i])
  				page_cache_get(pages[i]);
  		}
  		if (vmas)
910e46da4   Sonic Zhang   [PATCH] Check if ...
161
  			vmas[i] = vma;
e1ee65d85   David Howells   NOMMU: Fix __get_...
162
  		/* step to the first byte of the following page */
  		start = (start + PAGE_SIZE) & PAGE_MASK;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
163
  	}
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
164
165
166
167
168
  
  	return i;
  
  finish_or_fault:
  	/* partial progress is reported as a count; none at all as -EFAULT */
  	return i ? : -EFAULT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
169
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
170

b291f0003   Nick Piggin   mlock: mlocked pa...
171
172
173
174
175
176
177
178
  /*
   * get a list of pages in an address range belonging to the specified process
   * and indicate the VMA that covers each page
   * - this is potentially dodgy as we may end incrementing the page count of a
   *   slab page or a secondary page from a compound page
   * - don't permit access to VMAs that don't support it, such as I/O mappings
   * - @write and @force are converted to FOLL_WRITE / FOLL_FORCE and the work
   *   is done by __get_user_pages(), which is passed a NULL retry pointer
   */
  int get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
9d73777e5   Peter Zijlstra   clarify get_user_...
179
  	unsigned long start, int nr_pages, int write, int force,
b291f0003   Nick Piggin   mlock: mlocked pa...
180
181
182
183
184
  	struct page **pages, struct vm_area_struct **vmas)
  {
  	int flags = 0;
  
  	if (write)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
185
  		flags |= FOLL_WRITE;
b291f0003   Nick Piggin   mlock: mlocked pa...
186
  	if (force)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
187
  		flags |= FOLL_FORCE;
b291f0003   Nick Piggin   mlock: mlocked pa...
188

53a7706d5   Michel Lespinasse   mlock: do not hol...
189
190
  	return __get_user_pages(tsk, mm, start, nr_pages, flags, pages, vmas,
  				NULL);
b291f0003   Nick Piggin   mlock: mlocked pa...
191
  }
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
192
  EXPORT_SYMBOL(get_user_pages);
dfc2f91ac   Paul Mundt   nommu: provide fo...
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
  /**
   * follow_pfn - look up PFN at a user virtual address
   * @vma: memory mapping
   * @address: user virtual address
   * @pfn: location to store found PFN
   *
   * Only mappings flagged VM_IO or VM_PFNMAP are accepted; for those the PFN
   * is simply @address shifted right by PAGE_SHIFT.
   *
   * Returns zero and the pfn at @pfn on success, -EINVAL otherwise.
   */
  int follow_pfn(struct vm_area_struct *vma, unsigned long address,
  	unsigned long *pfn)
  {
  	if (vma->vm_flags & (VM_IO | VM_PFNMAP)) {
  		*pfn = address >> PAGE_SHIFT;
  		return 0;
  	}

  	/* neither an IO mapping nor a raw PFN mapping */
  	return -EINVAL;
  }
  EXPORT_SYMBOL(follow_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
213
214
  DEFINE_RWLOCK(vmlist_lock);
  struct vm_struct *vmlist;
b3bdda02a   Christoph Lameter   vmalloc: add cons...
215
  /*
   * vfree - release memory by handing @addr straight to kfree().
   * This pairs with __vmalloc() in this file, which allocates with kmalloc().
   */
  void vfree(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
216
217
218
  {
  	kfree(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
219
  EXPORT_SYMBOL(vfree);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
220

dd0fc66fb   Al Viro   [PATCH] gfp flags...
221
  /*
   * __vmalloc - allocate @size bytes with kmalloc().
   * @gfp_mask is passed on with __GFP_COMP added and __GFP_HIGHMEM removed;
   * @prot is not used by this implementation.
   * Returns whatever kmalloc() returns.
   */
  void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
222
223
  {
  	/*
8518609de   Robert P. J. Day   Explain clearly w...
224
225
  	 *  You can't specify __GFP_HIGHMEM with kmalloc() since kmalloc()
  	 * returns only a logical address.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
226
  	 */
84097518d   Nick Piggin   [PATCH] mm: nommu...
227
  	return kmalloc(size, (gfp_mask | __GFP_COMP) & ~__GFP_HIGHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
228
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
229
  EXPORT_SYMBOL(__vmalloc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
230

f905bc447   Paul Mundt   nommu: add new vm...
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
  void *vmalloc_user(unsigned long size)
  {
  	void *ret;
  
  	ret = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	if (ret) {
  		struct vm_area_struct *vma;
  
  		down_write(&current->mm->mmap_sem);
  		vma = find_vma(current->mm, (unsigned long)ret);
  		if (vma)
  			vma->vm_flags |= VM_USERMAP;
  		up_write(&current->mm->mmap_sem);
  	}
  
  	return ret;
  }
  EXPORT_SYMBOL(vmalloc_user);
b3bdda02a   Christoph Lameter   vmalloc: add cons...
250
  /*
   * vmalloc_to_page - return the struct page for @addr.
   * This is a direct virt_to_page() conversion.
   */
  struct page *vmalloc_to_page(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
251
252
253
  {
  	return virt_to_page(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
254
  EXPORT_SYMBOL(vmalloc_to_page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
255

b3bdda02a   Christoph Lameter   vmalloc: add cons...
256
  /*
   * vmalloc_to_pfn - return the page frame number for @addr.
   * Computed as page_to_pfn() of the page that virt_to_page() yields.
   */
  unsigned long vmalloc_to_pfn(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
257
258
259
  {
  	return page_to_pfn(virt_to_page(addr));
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
260
  EXPORT_SYMBOL(vmalloc_to_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
  
  /*
   * vread - copy @count bytes from @addr into @buf
   * @buf:   destination buffer
   * @addr:  source address
   * @count: number of bytes requested
   *
   * If @buf + @count would wrap past the top of the address space, @count is
   * clamped so the copy stops at the last addressable byte, mirroring the
   * destination check in vwrite().
   *
   * Returns the number of bytes actually copied.
   */
  long vread(char *buf, char *addr, unsigned long count)
  {
  	/* Don't allow overflow */
  	if ((unsigned long) buf + count < count)
  		count = -(unsigned long) buf;

  	memcpy(buf, addr, count);
  	return count;
  }
  
  /*
   * vwrite - copy @count bytes from @buf to @addr
   *
   * The length is clamped when @addr + @count would wrap around the end of
   * the address space.  Returns the number of bytes copied.
   */
  long vwrite(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dest = (unsigned long) addr;

  	/* wrapped sum means the range runs off the top: trim it */
  	if (dest + count < count)
  		count = -dest;

  	memcpy(addr, buf, count);

  	return count;
  }
  
  /*
   *	vmalloc  -  allocate virtually contiguous memory
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *
c1c8897f8   Michael Opdenacker   Spelling fix: "co...
286
   *	For tight control over page level allocator and protection flags
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
287
288
289
290
291
292
   *	use __vmalloc() instead.
   */
  void *vmalloc(unsigned long size)
  {
         return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
  }
f61388822   Andrew Morton   [PATCH] nommu: im...
293
  EXPORT_SYMBOL(vmalloc);
e1ca7788d   Dave Young   mm: add vzalloc()...
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
  /*
   *	vzalloc - allocate virtually continguos memory with zero fill
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into continguos kernel virtual space.
   *	The memory allocated is set to zero.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  void *vzalloc(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  }
  EXPORT_SYMBOL(vzalloc);
  
  /**
   * vmalloc_node - allocate memory on a specific node
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
f61388822   Andrew Morton   [PATCH] nommu: im...
324
325
326
327
  void *vmalloc_node(unsigned long size, int node)
  {
  	void *mem;

  	/* @node is not consulted; the request goes straight to vmalloc() */
  	mem = vmalloc(size);

  	return mem;
  }
9a14f653d   Paul Mundt   nommu: Fix up vma...
328
  EXPORT_SYMBOL(vmalloc_node);
e1ca7788d   Dave Young   mm: add vzalloc()...
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
  
  /**
   * vzalloc_node - allocate zero-filled memory on a specific node
   * @size:	allocation size
   * @node:	numa node (not consulted by this implementation)
   *
   * The request is forwarded unchanged to vzalloc(), so the memory
   * returned is set to zero.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
  void *vzalloc_node(unsigned long size, int node)
  {
  	void *mem;

  	mem = vzalloc(size);

  	return mem;
  }
  EXPORT_SYMBOL(vzalloc_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
347

1af446edf   Paul Mundt   nommu: Provide vm...
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
  #ifndef PAGE_KERNEL_EXEC
  # define PAGE_KERNEL_EXEC PAGE_KERNEL
  #endif
  
  /**
   *	vmalloc_exec  -  allocate virtually contiguous, executable memory
   *	@size:		allocation size
   *
   *	Kernel-internal function to allocate enough pages to cover @size
   *	the page level allocator and map them into contiguous and
   *	executable kernel virtual space.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  
  void *vmalloc_exec(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
368
369
  /**
   * vmalloc_32  -  allocate virtually contiguous memory (32bit addressable)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
370
371
372
373
374
375
376
377
378
   *	@size:		allocation size
   *
   *	Allocate enough 32bit PA addressable pages to cover @size from the
   *	page level allocator and map them into contiguous kernel virtual space.
   */
  void *vmalloc_32(unsigned long size)
  {
  	/* plain GFP_KERNEL: __GFP_HIGHMEM is not requested here */
  	void *mem = __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);

  	return mem;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
379
380
381
382
383
384
385
386
  EXPORT_SYMBOL(vmalloc_32);
  
  /**
   * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
   *	@size:		allocation size
   *
   * The resulting memory area is 32bit addressable and zeroed so it can be
   * mapped to userspace without leaking data.
f905bc447   Paul Mundt   nommu: add new vm...
387
388
389
   *
   * VM_USERMAP is set on the corresponding VMA so that subsequent calls to
   * remap_vmalloc_range() are permissible.
b50731732   Paul Mundt   nommu: vmalloc_32...
390
391
392
   */
  void *vmalloc_32_user(unsigned long size)
  {
f905bc447   Paul Mundt   nommu: add new vm...
393
394
395
396
397
  	/*
  	 * We'll have to sort out the ZONE_DMA bits for 64-bit,
  	 * but for now this can simply use vmalloc_user() directly.
  	 */
  	/* vmalloc_user() supplies both the zeroing and the VM_USERMAP marking */
  	return vmalloc_user(size);
b50731732   Paul Mundt   nommu: vmalloc_32...
398
399
  }
  EXPORT_SYMBOL(vmalloc_32_user);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
400
401
402
403
404
405
  
  /*
   * vmap - stub: no mapping is performed here.  The function calls BUG();
   * the NULL return only follows that call.  All arguments are ignored.
   */
  void *vmap(struct page **pages, unsigned int count, unsigned long flags, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
406
  EXPORT_SYMBOL(vmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
407

b3bdda02a   Christoph Lameter   vmalloc: add cons...
408
  /*
   * vunmap - stub counterpart of vmap(): ignores @addr and calls BUG().
   */
  void vunmap(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
409
410
411
  {
  	BUG();
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
412
  EXPORT_SYMBOL(vunmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
413

eb6434d9e   Paul Mundt   nommu: Stub in vm...
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
  /*
   * vm_map_ram - stub: ignores its arguments and calls BUG(); the NULL
   * return only follows that call.
   */
  void *vm_map_ram(struct page **pages, unsigned int count, int node, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL(vm_map_ram);
  
  /*
   * vm_unmap_ram - stub counterpart of vm_map_ram(): ignores its arguments
   * and calls BUG().
   */
  void vm_unmap_ram(const void *mem, unsigned int count)
  {
  	BUG();
  }
  EXPORT_SYMBOL(vm_unmap_ram);
  
  /*
   * vm_unmap_aliases - empty stub; this implementation does nothing.
   */
  void vm_unmap_aliases(void)
  {
  }
  EXPORT_SYMBOL_GPL(vm_unmap_aliases);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
431
  /*
1eeb66a1b   Christoph Hellwig   move die notifier...
432
433
434
435
436
437
   * Implement a stub for vmalloc_sync_all() if the architecture chose not to
   * have one.
   */
  void  __attribute__((weak)) vmalloc_sync_all(void)
  {
  	/* empty: weak default definition with nothing to do */
  }
29c185e5c   Paul Mundt   nommu: Provide st...
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
  /**
   *	alloc_vm_area - allocate a range of kernel address space
   *	@size:		size of the area
   *
   *	Returns:	NULL on failure, vm_struct on success
   *
   *	This function reserves a range of kernel address space, and
   *	allocates pagetables to map that range.  No actual mappings
   *	are created.  If the kernel address space is not shared
   *	between processes, it syncs the pagetable across all
   *	processes.
   *
   *	NOTE: the implementation below does none of the above; it is a
   *	stub that calls BUG(), and the NULL return only follows that call.
   */
  struct vm_struct *alloc_vm_area(size_t size)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL_GPL(alloc_vm_area);
  
  /*
   * free_vm_area - stub counterpart of alloc_vm_area(): ignores @area and
   * calls BUG().
   */
  void free_vm_area(struct vm_struct *area)
  {
  	BUG();
  }
  EXPORT_SYMBOL_GPL(free_vm_area);
b50731732   Paul Mundt   nommu: vmalloc_32...
462
463
464
465
466
467
  /*
   * vm_insert_page - stub: nothing is inserted; every call returns -EINVAL
   * regardless of its arguments.
   */
  int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
  		   struct page *page)
  {
  	return -EINVAL;
  }
  EXPORT_SYMBOL(vm_insert_page);
1eeb66a1b   Christoph Hellwig   move die notifier...
468
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
469
470
471
472
473
474
   *  sys_brk() for the most part doesn't need the global kernel
   *  lock, except when an application is doing something nasty
   *  like trying to un-brk an area that has already been mapped
   *  to a regular file.  in this case, the unmapping will need
   *  to invoke file system routines that need the global lock.
   */
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
475
  SYSCALL_DEFINE1(brk, unsigned long, brk)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
  {
  	struct mm_struct *mm = current->mm;
  
  	/*
  	 * A request outside [start_brk, context.end_brk] is refused by
  	 * returning the unchanged break.
  	 */
  	if (brk < mm->start_brk || brk > mm->context.end_brk)
  		return mm->brk;
  
  	/* nothing to do when the break is already at the requested value */
  	if (mm->brk == brk)
  		return mm->brk;
  
  	/*
  	 * Always allow shrinking brk
  	 */
  	if (brk <= mm->brk) {
  		mm->brk = brk;
  		return brk;
  	}
  
  	/*
  	 * Ok, looks good - let it rip.
  	 */
cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
496
  	/* growing: flush the icache over the newly exposed range first */
  	flush_icache_range(mm->brk, brk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
497
498
  	return mm->brk = brk;
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
499
500
501
502
  /*
   * initialise the vm_committed_as per-cpu counter and the region record slab
   */
  void __init mmap_init(void)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
503
  {
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
504
505
506
507
  	int ret;
  
  	/* a failure here is only caught by VM_BUG_ON() */
  	ret = percpu_counter_init(&vm_committed_as, 0);
  	VM_BUG_ON(ret);
33e5d7697   David Howells   nommu: fix a numb...
508
  	/* SLAB_PANIC is passed, so no NULL check follows */
  	vm_region_jar = KMEM_CACHE(vm_region, SLAB_PANIC);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
509
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
510

3034097a5   David Howells   [PATCH] NOMMU: Or...
511
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
512
513
   * validate the region tree
   * - the caller must hold the region lock
3034097a5   David Howells   [PATCH] NOMMU: Or...
514
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
515
516
  #ifdef CONFIG_DEBUG_NOMMU_REGIONS
  /*
   * Debug build: walk nommu_region_tree in order and BUG() if any region is
   * empty or inverted (vm_end <= vm_start), has vm_top below vm_end, or
   * starts below the vm_top of the region before it.
   */
  static noinline void validate_nommu_regions(void)
3034097a5   David Howells   [PATCH] NOMMU: Or...
517
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
518
519
  	struct vm_region *region, *last;
  	struct rb_node *p, *lastp;
3034097a5   David Howells   [PATCH] NOMMU: Or...
520

8feae1311   David Howells   NOMMU: Make VMAs ...
521
522
523
524
525
  	lastp = rb_first(&nommu_region_tree);
  	/* an empty tree is trivially valid */
  	if (!lastp)
  		return;
  
  	last = rb_entry(lastp, struct vm_region, vm_rb);
33e5d7697   David Howells   nommu: fix a numb...
526
527
  	BUG_ON(unlikely(last->vm_end <= last->vm_start));
  	BUG_ON(unlikely(last->vm_top < last->vm_end));
8feae1311   David Howells   NOMMU: Make VMAs ...
528
529
530
531
  
  	/* compare each remaining region against its in-order predecessor */
  	while ((p = rb_next(lastp))) {
  		region = rb_entry(p, struct vm_region, vm_rb);
  		last = rb_entry(lastp, struct vm_region, vm_rb);
33e5d7697   David Howells   nommu: fix a numb...
532
533
534
  		BUG_ON(unlikely(region->vm_end <= region->vm_start));
  		BUG_ON(unlikely(region->vm_top < region->vm_end));
  		BUG_ON(unlikely(region->vm_start < last->vm_top));
3034097a5   David Howells   [PATCH] NOMMU: Or...
535

8feae1311   David Howells   NOMMU: Make VMAs ...
536
537
  		lastp = p;
  	}
3034097a5   David Howells   [PATCH] NOMMU: Or...
538
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
539
  #else
33e5d7697   David Howells   nommu: fix a numb...
540
541
542
  /* non-debug build: validation is compiled out */
  static void validate_nommu_regions(void)
  {
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
543
  #endif
3034097a5   David Howells   [PATCH] NOMMU: Or...
544
545
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
546
   * add a region into the global tree
3034097a5   David Howells   [PATCH] NOMMU: Or...
547
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
548
  /*
   * Insert @region into nommu_region_tree, keyed on vm_start.  Inserting a
   * region that is already in the tree is a no-op; a different region with
   * the same vm_start triggers BUG().  The tree is validated before and
   * after the insertion.
   */
  static void add_nommu_region(struct vm_region *region)
3034097a5   David Howells   [PATCH] NOMMU: Or...
549
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
550
551
  	struct vm_region *pregion;
  	struct rb_node **p, *parent;
3034097a5   David Howells   [PATCH] NOMMU: Or...
552

8feae1311   David Howells   NOMMU: Make VMAs ...
553
  	validate_nommu_regions();
8feae1311   David Howells   NOMMU: Make VMAs ...
554
555
556
557
558
559
560
561
562
563
564
565
566
  	/* descend to the leaf slot where @region belongs */
  	parent = NULL;
  	p = &nommu_region_tree.rb_node;
  	while (*p) {
  		parent = *p;
  		pregion = rb_entry(parent, struct vm_region, vm_rb);
  		if (region->vm_start < pregion->vm_start)
  			p = &(*p)->rb_left;
  		else if (region->vm_start > pregion->vm_start)
  			p = &(*p)->rb_right;
  		else if (pregion == region)
  			return;
  		else
  			BUG();
3034097a5   David Howells   [PATCH] NOMMU: Or...
567
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
568
569
  	rb_link_node(&region->vm_rb, parent, p);
  	rb_insert_color(&region->vm_rb, &nommu_region_tree);
3034097a5   David Howells   [PATCH] NOMMU: Or...
570

8feae1311   David Howells   NOMMU: Make VMAs ...
571
  	validate_nommu_regions();
3034097a5   David Howells   [PATCH] NOMMU: Or...
572
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
573
574
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
575
   * delete a region from the global tree
930e652a2   David Howells   [PATCH] NOMMU: Ma...
576
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
577
  /*
   * Erase @region from nommu_region_tree.  BUG()s if the tree is empty, and
   * validates the tree before and after the removal.
   */
  static void delete_nommu_region(struct vm_region *region)
930e652a2   David Howells   [PATCH] NOMMU: Ma...
578
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
579
  	BUG_ON(!nommu_region_tree.rb_node);
930e652a2   David Howells   [PATCH] NOMMU: Ma...
580

8feae1311   David Howells   NOMMU: Make VMAs ...
581
582
583
  	validate_nommu_regions();
  	rb_erase(&region->vm_rb, &nommu_region_tree);
  	validate_nommu_regions();
57c8f63e8   Greg Ungerer   nommu: stub expan...
584
  }
930e652a2   David Howells   [PATCH] NOMMU: Ma...
585
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
586
   * free a contiguous series of pages
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
587
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
588
  /*
   * For every page-sized step in [@from, @to): decrement
   * mmap_pages_allocated and drop one reference on the page with put_page().
   * A page whose count is not 1 beforehand is only reported via kdebug().
   */
  static void free_page_series(unsigned long from, unsigned long to)
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
589
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
590
591
592
593
  	for (; from < to; from += PAGE_SIZE) {
  		struct page *page = virt_to_page(from);
  
  		kdebug("- free %lx", from);
33e5d7697   David Howells   nommu: fix a numb...
594
  		atomic_long_dec(&mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
595
  		/* diagnostic only: the reference is dropped either way */
  		if (page_count(page) != 1)
33e5d7697   David Howells   nommu: fix a numb...
596
597
  			kdebug("free page %p: refcount not one: %d",
  			       page, page_count(page));
8feae1311   David Howells   NOMMU: Make VMAs ...
598
  		put_page(page);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
599
  	}
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
600
601
602
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
603
   * release a reference to a region
33e5d7697   David Howells   nommu: fix a numb...
604
   * - the caller must hold the region semaphore for writing, which this releases
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
605
   * - the region may not have been added to the tree yet, in which case vm_top
8feae1311   David Howells   NOMMU: Make VMAs ...
606
   *   will equal vm_start
3034097a5   David Howells   [PATCH] NOMMU: Or...
607
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
608
609
  static void __put_nommu_region(struct vm_region *region)
  	__releases(nommu_region_sem)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
610
  {
1e2ae599d   David Howells   nommu: struct vm_...
611
  	kenter("%p{%d}", region, region->vm_usage);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
612

8feae1311   David Howells   NOMMU: Make VMAs ...
613
  	BUG_ON(!nommu_region_tree.rb_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
614

1e2ae599d   David Howells   nommu: struct vm_...
615
  	/* last reference gone: unlink, unlock, then tear the region down */
  	if (--region->vm_usage == 0) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
616
  		/* vm_top == vm_start means it was never added to the tree */
  		if (region->vm_top > region->vm_start)
8feae1311   David Howells   NOMMU: Make VMAs ...
617
618
619
620
621
622
623
624
625
626
  			delete_nommu_region(region);
  		up_write(&nommu_region_sem);
  
  		if (region->vm_file)
  			fput(region->vm_file);
  
  		/* IO memory and memory shared directly out of the pagecache
  		 * from ramfs/tmpfs mustn't be released here */
  		if (region->vm_flags & VM_MAPPED_COPY) {
  			kdebug("free series");
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
627
  			free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
628
629
630
631
  		}
  		kmem_cache_free(vm_region_jar, region);
  	} else {
  		/* still referenced: only the semaphore is released */
  		up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
632
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
633
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
634

8feae1311   David Howells   NOMMU: Make VMAs ...
635
636
637
638
639
640
641
  /*
   * release a reference to a region
   * - takes nommu_region_sem for writing; __put_nommu_region() releases it
   *   again on every path
   */
  static void put_nommu_region(struct vm_region *region)
  {
  	down_write(&nommu_region_sem);
  	__put_nommu_region(region);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
642
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
643
  /*
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
   * update protection on a vma
   */
  static void protect_vma(struct vm_area_struct *vma, unsigned long flags)
  {
  #ifdef CONFIG_MPU
  	struct mm_struct *mm = vma->vm_mm;
  	long addr;

  	/* apply @flags page by page across the VMA, then commit the result */
  	for (addr = vma->vm_start & PAGE_MASK; addr < vma->vm_end;
  	     addr += PAGE_SIZE)
  		protect_page(mm, addr, flags);

  	update_protections(mm);
  #endif
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
660
661
662
663
   * add a VMA into a process's mm_struct in the appropriate place in the list
   * and tree and add to the address space's page tree also if not an anonymous
   * page
   * - should be called with mm->mmap_sem held writelocked
3034097a5   David Howells   [PATCH] NOMMU: Or...
664
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
665
  static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
666
  {
6038def0d   Namhyung Kim   mm: nommu: sort m...
667
  	struct vm_area_struct *pvma, *prev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
668
  	struct address_space *mapping;
6038def0d   Namhyung Kim   mm: nommu: sort m...
669
  	struct rb_node **p, *parent, *rb_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
670
671
672
673
674
675
676
  
  	kenter(",%p", vma);
  
  	BUG_ON(!vma->vm_region);
  
  	mm->map_count++;
  	vma->vm_mm = mm;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
677

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
678
  	protect_vma(vma, vma->vm_flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
679
680
681
682
683
684
685
686
  	/* add the VMA to the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
  
  		flush_dcache_mmap_lock(mapping);
  		vma_prio_tree_insert(vma, &mapping->i_mmap);
  		flush_dcache_mmap_unlock(mapping);
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
687
  	/* add the VMA to the tree */
6038def0d   Namhyung Kim   mm: nommu: sort m...
688
  	parent = rb_prev = NULL;
8feae1311   David Howells   NOMMU: Make VMAs ...
689
  	p = &mm->mm_rb.rb_node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
690
691
692
  	while (*p) {
  		parent = *p;
  		pvma = rb_entry(parent, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
693
694
695
  		/* sort by: start addr, end addr, VMA struct addr in that order
  		 * (the latter is necessary as we may get identical VMAs) */
  		if (vma->vm_start < pvma->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
696
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
697
698
  		else if (vma->vm_start > pvma->vm_start) {
  			rb_prev = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
699
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
700
  		} else if (vma->vm_end < pvma->vm_end)
8feae1311   David Howells   NOMMU: Make VMAs ...
701
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
702
703
  		else if (vma->vm_end > pvma->vm_end) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
704
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
705
  		} else if (vma < pvma)
8feae1311   David Howells   NOMMU: Make VMAs ...
706
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
707
708
  		else if (vma > pvma) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
709
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
710
  		} else
8feae1311   David Howells   NOMMU: Make VMAs ...
711
  			BUG();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
712
713
714
  	}
  
  	rb_link_node(&vma->vm_rb, parent, p);
8feae1311   David Howells   NOMMU: Make VMAs ...
715
716
717
  	rb_insert_color(&vma->vm_rb, &mm->mm_rb);
  
  	/* add VMA to the VMA list also */
6038def0d   Namhyung Kim   mm: nommu: sort m...
718
719
720
  	prev = NULL;
  	if (rb_prev)
  		prev = rb_entry(rb_prev, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
721

6038def0d   Namhyung Kim   mm: nommu: sort m...
722
  	__vma_link_list(mm, vma, prev, parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
723
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
724
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
725
   * delete a VMA from its owning mm_struct and address space
3034097a5   David Howells   [PATCH] NOMMU: Or...
726
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
727
  static void delete_vma_from_mm(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
728
729
  {
  	struct address_space *mapping;
8feae1311   David Howells   NOMMU: Make VMAs ...
730
731
732
  	struct mm_struct *mm = vma->vm_mm;
  
  	kenter("%p", vma);
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
733
  	protect_vma(vma, 0);
8feae1311   David Howells   NOMMU: Make VMAs ...
734
735
736
  	mm->map_count--;
  	if (mm->mmap_cache == vma)
  		mm->mmap_cache = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
737
738
739
740
741
742
743
744
745
  
  	/* remove the VMA from the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
  
  		flush_dcache_mmap_lock(mapping);
  		vma_prio_tree_remove(vma, &mapping->i_mmap);
  		flush_dcache_mmap_unlock(mapping);
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
746
747
  	/* remove from the MM's tree and list */
  	rb_erase(&vma->vm_rb, &mm->mm_rb);
b951bf2c4   Namhyung Kim   mm: nommu: don't ...
748
749
750
751
752
753
754
755
  
  	if (vma->vm_prev)
  		vma->vm_prev->vm_next = vma->vm_next;
  	else
  		mm->mmap = vma->vm_next;
  
  	if (vma->vm_next)
  		vma->vm_next->vm_prev = vma->vm_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
  
  	vma->vm_mm = NULL;
  }
  
  /*
   * destroy a VMA record
   */
  static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
  {
  	kenter("%p", vma);
  	if (vma->vm_ops && vma->vm_ops->close)
  		vma->vm_ops->close(vma);
  	if (vma->vm_file) {
  		fput(vma->vm_file);
  		if (vma->vm_flags & VM_EXECUTABLE)
  			removed_exe_file_vma(mm);
  	}
  	put_nommu_region(vma->vm_region);
  	kmem_cache_free(vm_area_cachep, vma);
  }
  
  /*
   * look up the first VMA in which addr resides, NULL if none
   * - should be called with mm->mmap_sem at least held readlocked
   * - a hit found by walking the list is remembered in mm->mmap_cache
   */
  struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *vma;

  	/* check the cache first */
  	vma = mm->mmap_cache;
  	if (vma && vma->vm_start <= addr && vma->vm_end > addr)
  		return vma;

  	/* trawl the list (there may be multiple mappings in which addr
  	 * resides) */
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
  		/* give up as soon as an entry starts beyond addr; this relies
  		 * on the list being kept in ascending vm_start order */
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end > addr) {
  			mm->mmap_cache = vma;
  			return vma;
  		}
  	}

  	return NULL;
  }
  EXPORT_SYMBOL(find_vma);
  
  /*
   * find a VMA
   * - we don't extend stack VMAs under NOMMU conditions, so this is exactly
   *   a find_vma() lookup
   */
  struct vm_area_struct *find_extend_vma(struct mm_struct *mm, unsigned long addr)
  {
  	return find_vma(mm, addr);
  }
  
  /*
   * expand a stack to a given address
   * - not supported under NOMMU conditions: neither argument is examined and
   *   every request is refused with -ENOMEM
   */
  int expand_stack(struct vm_area_struct *vma, unsigned long address)
  {
  	const int refused = -ENOMEM;

  	return refused;
  }
  
  /*
   * look up the first VMA that exactly matches the range addr to addr + len
   * - should be called with mm->mmap_sem at least held readlocked
   * - returns NULL if no VMA has both that start and that end address
   * - a hit found by walking the list is remembered in mm->mmap_cache
   */
  static struct vm_area_struct *find_vma_exact(struct mm_struct *mm,
  					     unsigned long addr,
  					     unsigned long len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end = addr + len;

  	/* check the cache first */
  	vma = mm->mmap_cache;
  	if (vma && vma->vm_start == addr && vma->vm_end == end)
  		return vma;

  	/* trawl the list (there may be multiple mappings in which addr
  	 * resides) */
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
  		/* skip everything that starts below addr and stop once an
  		 * entry starts above it; this relies on the list being kept
  		 * in ascending vm_start order */
  		if (vma->vm_start < addr)
  			continue;
  		if (vma->vm_start > addr)
  			return NULL;
  		/* same start address: only an identical end is a match */
  		if (vma->vm_end == end) {
  			mm->mmap_cache = vma;
  			return vma;
  		}
  	}

  	return NULL;
  }
  
  /*
   * determine whether a mapping should be permitted and, if so, what sort of
   * mapping we're capable of supporting
   */
  static int validate_mmap_request(struct file *file,
  				 unsigned long addr,
  				 unsigned long len,
  				 unsigned long prot,
  				 unsigned long flags,
  				 unsigned long pgoff,
  				 unsigned long *_capabilities)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
865
  	unsigned long capabilities, rlen;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
866
867
868
869
  	unsigned long reqprot = prot;
  	int ret;
  
  	/* do the simple checks first */
06aab5a30   David Howells   NOMMU: Ignore mma...
870
  	if (flags & MAP_FIXED) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
871
872
873
874
875
876
877
878
879
880
  		printk(KERN_DEBUG
  		       "%d: Can't do fixed-address/overlay mmap of RAM
  ",
  		       current->pid);
  		return -EINVAL;
  	}
  
  	if ((flags & MAP_TYPE) != MAP_PRIVATE &&
  	    (flags & MAP_TYPE) != MAP_SHARED)
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
881
  	if (!len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
882
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
883
  	/* Careful about overflows.. */
8feae1311   David Howells   NOMMU: Make VMAs ...
884
885
  	rlen = PAGE_ALIGN(len);
  	if (!rlen || rlen > TASK_SIZE)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
886
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
887
  	/* offset overflow? */
8feae1311   David Howells   NOMMU: Make VMAs ...
888
  	if ((pgoff + (rlen >> PAGE_SHIFT)) < pgoff)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
889
  		return -EOVERFLOW;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
  
  	if (file) {
  		/* validate file mapping requests */
  		struct address_space *mapping;
  
  		/* files must support mmap */
  		if (!file->f_op || !file->f_op->mmap)
  			return -ENODEV;
  
  		/* work out if what we've got could possibly be shared
  		 * - we support chardevs that provide their own "memory"
  		 * - we support files/blockdevs that are memory backed
  		 */
  		mapping = file->f_mapping;
  		if (!mapping)
e9536ae72   Josef Sipek   [PATCH] struct pa...
905
  			mapping = file->f_path.dentry->d_inode->i_mapping;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
906
907
908
909
910
911
912
913
  
  		capabilities = 0;
  		if (mapping && mapping->backing_dev_info)
  			capabilities = mapping->backing_dev_info->capabilities;
  
  		if (!capabilities) {
  			/* no explicit capabilities set, so assume some
  			 * defaults */
e9536ae72   Josef Sipek   [PATCH] struct pa...
914
  			switch (file->f_path.dentry->d_inode->i_mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
  			case S_IFREG:
  			case S_IFBLK:
  				capabilities = BDI_CAP_MAP_COPY;
  				break;
  
  			case S_IFCHR:
  				capabilities =
  					BDI_CAP_MAP_DIRECT |
  					BDI_CAP_READ_MAP |
  					BDI_CAP_WRITE_MAP;
  				break;
  
  			default:
  				return -EINVAL;
  			}
  		}
  
  		/* eliminate any capabilities that we can't support on this
  		 * device */
  		if (!file->f_op->get_unmapped_area)
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		if (!file->f_op->read)
  			capabilities &= ~BDI_CAP_MAP_COPY;
28d7a6ae9   Graff Yang   nommu: check fd r...
938
939
940
  		/* The file shall have been opened with read permission. */
  		if (!(file->f_mode & FMODE_READ))
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
941
942
943
944
945
  		if (flags & MAP_SHARED) {
  			/* do checks for writing, appending and locking */
  			if ((prot & PROT_WRITE) &&
  			    !(file->f_mode & FMODE_WRITE))
  				return -EACCES;
e9536ae72   Josef Sipek   [PATCH] struct pa...
946
  			if (IS_APPEND(file->f_path.dentry->d_inode) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
947
948
  			    (file->f_mode & FMODE_WRITE))
  				return -EACCES;
e9536ae72   Josef Sipek   [PATCH] struct pa...
949
  			if (locks_verify_locked(file->f_path.dentry->d_inode))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
950
951
952
953
  				return -EAGAIN;
  
  			if (!(capabilities & BDI_CAP_MAP_DIRECT))
  				return -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
954
955
956
957
958
959
960
961
962
963
964
965
966
967
  			/* we mustn't privatise shared mappings */
  			capabilities &= ~BDI_CAP_MAP_COPY;
  		}
  		else {
  			/* we're going to read the file into private memory we
  			 * allocate */
  			if (!(capabilities & BDI_CAP_MAP_COPY))
  				return -ENODEV;
  
  			/* we don't permit a private writable mapping to be
  			 * shared with the backing device */
  			if (prot & PROT_WRITE)
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
3c7b20454   Bernd Schmidt   nommu: allow priv...
968
969
970
971
972
973
974
975
976
977
978
979
980
981
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
  			if (((prot & PROT_READ)  && !(capabilities & BDI_CAP_READ_MAP))  ||
  			    ((prot & PROT_WRITE) && !(capabilities & BDI_CAP_WRITE_MAP)) ||
  			    ((prot & PROT_EXEC)  && !(capabilities & BDI_CAP_EXEC_MAP))
  			    ) {
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
  				if (flags & MAP_SHARED) {
  					printk(KERN_WARNING
  					       "MAP_SHARED not completely supported on !MMU
  ");
  					return -EINVAL;
  				}
  			}
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
982
983
  		/* handle executable mappings and implied executable
  		 * mappings */
e9536ae72   Josef Sipek   [PATCH] struct pa...
984
  		if (file->f_path.mnt->mnt_flags & MNT_NOEXEC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
  			if (prot & PROT_EXEC)
  				return -EPERM;
  		}
  		else if ((prot & PROT_READ) && !(prot & PROT_EXEC)) {
  			/* handle implication of PROT_EXEC by PROT_READ */
  			if (current->personality & READ_IMPLIES_EXEC) {
  				if (capabilities & BDI_CAP_EXEC_MAP)
  					prot |= PROT_EXEC;
  			}
  		}
  		else if ((prot & PROT_READ) &&
  			 (prot & PROT_EXEC) &&
  			 !(capabilities & BDI_CAP_EXEC_MAP)
  			 ) {
  			/* backing file is not executable, try to copy */
  			capabilities &= ~BDI_CAP_MAP_DIRECT;
  		}
  	}
  	else {
  		/* anonymous mappings are always memory backed and can be
  		 * privately mapped
  		 */
  		capabilities = BDI_CAP_MAP_COPY;
  
  		/* handle PROT_EXEC implication by PROT_READ */
  		if ((prot & PROT_READ) &&
  		    (current->personality & READ_IMPLIES_EXEC))
  			prot |= PROT_EXEC;
  	}
  
  	/* allow the security API to have its say */
ed0321895   Eric Paris   security: Protect...
1016
  	ret = security_file_mmap(file, reqprot, prot, flags, addr, 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
  	if (ret < 0)
  		return ret;
  
  	/* looks okay */
  	*_capabilities = capabilities;
  	return 0;
  }
  
  /*
   * we've determined that we can make the mapping, now translate what we
   * now know into VMA flags
   */
  static unsigned long determine_vm_flags(struct file *file,
  					unsigned long prot,
  					unsigned long flags,
  					unsigned long capabilities)
  {
  	unsigned long vm_flags;
  
  	vm_flags = calc_vm_prot_bits(prot) | calc_vm_flag_bits(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1037
1038
1039
1040
  	/* vm_flags |= mm->def_flags; */
  
  	if (!(capabilities & BDI_CAP_MAP_DIRECT)) {
  		/* attempt to share read-only copies of mapped file chunks */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1041
  		vm_flags |= VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1042
1043
  		if (file && !(prot & PROT_WRITE))
  			vm_flags |= VM_MAYSHARE;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1044
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1045
1046
1047
  		/* overlay a shareable mapping on the backing device or inode
  		 * if possible - used for chardevs, ramfs/tmpfs/shmfs and
  		 * romfs/cramfs */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1048
  		vm_flags |= VM_MAYSHARE | (capabilities & BDI_CAP_VMFLAGS);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1049
  		if (flags & MAP_SHARED)
3c7b20454   Bernd Schmidt   nommu: allow priv...
1050
  			vm_flags |= VM_SHARED;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1051
1052
1053
1054
1055
1056
  	}
  
  	/* refuse to let anyone share private mappings with this process if
  	 * it's being traced - otherwise breakpoints set in it may interfere
  	 * with another untraced process
  	 */
fa8e26ccd   Roland McGrath   tracehook: traceh...
1057
  	if ((flags & MAP_PRIVATE) && tracehook_expect_breakpoints(current))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1058
1059
1060
1061
1062
1063
  		vm_flags &= ~VM_MAYSHARE;
  
  	return vm_flags;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1064
1065
   * set up a shared mapping on a file (the driver or filesystem provides and
   * pins the storage)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1066
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1067
  static int do_mmap_shared_file(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1068
1069
1070
1071
  {
  	int ret;
  
  	ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1072
1073
  	if (ret == 0) {
  		vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1074
  		return 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1075
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1076
1077
  	if (ret != -ENOSYS)
  		return ret;
3fa30460e   David Howells   nommu: fix an inc...
1078
1079
1080
  	/* getting -ENOSYS indicates that direct mmap isn't possible (as
  	 * opposed to tried but failed) so we can only give a suitable error as
  	 * it's not possible to make a private copy if MAP_SHARED was given */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1081
1082
1083
1084
1085
1086
  	return -ENODEV;
  }
  
  /*
   * set up a private mapping or an anonymous shared mapping
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1087
1088
  static int do_mmap_private(struct vm_area_struct *vma,
  			   struct vm_region *region,
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1089
1090
  			   unsigned long len,
  			   unsigned long capabilities)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1091
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1092
  	struct page *pages;
f67d9b157   Bob Liu   nommu: add page a...
1093
  	unsigned long total, point, n;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1094
  	void *base;
8feae1311   David Howells   NOMMU: Make VMAs ...
1095
  	int ret, order;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1096
1097
1098
1099
1100
  
  	/* invoke the file's mapping function so that it can keep track of
  	 * shared mappings on devices or memory
  	 * - VM_MAYSHARE will be set if it may attempt to share
  	 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1101
  	if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1102
  		ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1103
  		if (ret == 0) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1104
  			/* shouldn't return success if we're not sharing */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1105
1106
  			BUG_ON(!(vma->vm_flags & VM_MAYSHARE));
  			vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1107
  			return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1108
  		}
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1109
1110
  		if (ret != -ENOSYS)
  			return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1111
1112
1113
1114
1115
  
  		/* getting an ENOSYS error indicates that direct mmap isn't
  		 * possible (as opposed to tried but failed) so we'll try to
  		 * make a private copy of the data and map that instead */
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1116

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1117
1118
1119
1120
  	/* allocate some memory to hold the mapping
  	 * - note that this may not return a page-aligned address if the object
  	 *   we're allocating is smaller than a page
  	 */
f67d9b157   Bob Liu   nommu: add page a...
1121
  	order = get_order(len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1122
1123
1124
1125
  	kdebug("alloc order %d for %lx", order, len);
  
  	pages = alloc_pages(GFP_KERNEL, order);
  	if (!pages)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1126
  		goto enomem;
8feae1311   David Howells   NOMMU: Make VMAs ...
1127
  	total = 1 << order;
33e5d7697   David Howells   nommu: fix a numb...
1128
  	atomic_long_add(total, &mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
1129

f67d9b157   Bob Liu   nommu: add page a...
1130
  	point = len >> PAGE_SHIFT;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1131
1132
1133
1134
1135
1136
1137
1138
  
  	/* we allocated a power-of-2 sized page set, so we may want to trim off
  	 * the excess */
  	if (sysctl_nr_trim_pages && total - point >= sysctl_nr_trim_pages) {
  		while (total > point) {
  			order = ilog2(total - point);
  			n = 1 << order;
  			kdebug("shave %lu/%lu @%lu", n, total - point, total);
33e5d7697   David Howells   nommu: fix a numb...
1139
  			atomic_long_sub(n, &mmap_pages_allocated);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1140
1141
1142
1143
  			total -= n;
  			set_page_refcounted(pages + total);
  			__free_pages(pages + total, order);
  		}
8feae1311   David Howells   NOMMU: Make VMAs ...
1144
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1145
1146
  	for (point = 1; point < total; point++)
  		set_page_refcounted(&pages[point]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1147

8feae1311   David Howells   NOMMU: Make VMAs ...
1148
1149
1150
  	base = page_address(pages);
  	region->vm_flags = vma->vm_flags |= VM_MAPPED_COPY;
  	region->vm_start = (unsigned long) base;
f67d9b157   Bob Liu   nommu: add page a...
1151
  	region->vm_end   = region->vm_start + len;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1152
  	region->vm_top   = region->vm_start + (total << PAGE_SHIFT);
8feae1311   David Howells   NOMMU: Make VMAs ...
1153
1154
1155
  
  	vma->vm_start = region->vm_start;
  	vma->vm_end   = region->vm_start + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
  
  	if (vma->vm_file) {
  		/* read the contents of a file into the copy */
  		mm_segment_t old_fs;
  		loff_t fpos;
  
  		fpos = vma->vm_pgoff;
  		fpos <<= PAGE_SHIFT;
  
  		old_fs = get_fs();
  		set_fs(KERNEL_DS);
f67d9b157   Bob Liu   nommu: add page a...
1167
  		ret = vma->vm_file->f_op->read(vma->vm_file, base, len, &fpos);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1168
1169
1170
1171
1172
1173
  		set_fs(old_fs);
  
  		if (ret < 0)
  			goto error_free;
  
  		/* clear the last little bit */
f67d9b157   Bob Liu   nommu: add page a...
1174
1175
  		if (ret < len)
  			memset(base + ret, 0, len - ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1176

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1177
1178
1179
1180
1181
  	}
  
  	return 0;
  
  error_free:
7223bb4a8   Namhyung Kim   mm: nommu: fix a ...
1182
  	free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
1183
1184
  	region->vm_start = vma->vm_start = 0;
  	region->vm_end   = vma->vm_end = 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1185
  	region->vm_top   = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1186
1187
1188
  	return ret;
  
  enomem:
05ae6fa31   Greg Ungerer   uclinux: add proc...
1189
1190
1191
  	printk("Allocation of length %lu from process %d (%s) failed
  ",
  	       len, current->pid, current->comm);
7bf02ea22   David Rientjes   arch, mm: filter ...
1192
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
  	return -ENOMEM;
  }
  
  /*
   * handle mapping creation for uClinux
   */
  unsigned long do_mmap_pgoff(struct file *file,
  			    unsigned long addr,
  			    unsigned long len,
  			    unsigned long prot,
  			    unsigned long flags,
  			    unsigned long pgoff)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1206
1207
  	struct vm_area_struct *vma;
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1208
  	struct rb_node *rb;
8feae1311   David Howells   NOMMU: Make VMAs ...
1209
  	unsigned long capabilities, vm_flags, result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1210
  	int ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1211
  	kenter(",%lx,%lx,%lx,%lx,%lx", addr, len, prot, flags, pgoff);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1212
1213
1214
1215
  	/* decide whether we should attempt the mapping, and if so what sort of
  	 * mapping */
  	ret = validate_mmap_request(file, addr, len, prot, flags, pgoff,
  				    &capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1216
1217
  	if (ret < 0) {
  		kleave(" = %d [val]", ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1218
  		return ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1219
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1220

06aab5a30   David Howells   NOMMU: Ignore mma...
1221
1222
  	/* we ignore the address hint */
  	addr = 0;
f67d9b157   Bob Liu   nommu: add page a...
1223
  	len = PAGE_ALIGN(len);
06aab5a30   David Howells   NOMMU: Ignore mma...
1224

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1225
1226
1227
  	/* we've determined that we can make the mapping, now translate what we
  	 * now know into VMA flags */
  	vm_flags = determine_vm_flags(file, prot, flags, capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1228
1229
1230
1231
1232
1233
1234
1235
  	/* we're going to need to record the mapping */
  	region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		goto error_getting_region;
  
  	vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
  	if (!vma)
  		goto error_getting_vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1236

1e2ae599d   David Howells   nommu: struct vm_...
1237
  	region->vm_usage = 1;
8feae1311   David Howells   NOMMU: Make VMAs ...
1238
1239
  	region->vm_flags = vm_flags;
  	region->vm_pgoff = pgoff;
5beb49305   Rik van Riel   mm: change anon_v...
1240
  	INIT_LIST_HEAD(&vma->anon_vma_chain);
8feae1311   David Howells   NOMMU: Make VMAs ...
1241
1242
  	vma->vm_flags = vm_flags;
  	vma->vm_pgoff = pgoff;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1243

8feae1311   David Howells   NOMMU: Make VMAs ...
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
  	if (file) {
  		region->vm_file = file;
  		get_file(file);
  		vma->vm_file = file;
  		get_file(file);
  		if (vm_flags & VM_EXECUTABLE) {
  			added_exe_file_vma(current->mm);
  			vma->vm_mm = current->mm;
  		}
  	}
  
  	down_write(&nommu_region_sem);
  
  	/* if we want to share, we need to check for regions created by other
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1258
  	 * mmap() calls that overlap with our proposed mapping
8feae1311   David Howells   NOMMU: Make VMAs ...
1259
  	 * - we can only share with a superset match on most regular files
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1260
1261
1262
1263
1264
1265
  	 * - shared mappings on character devices and memory backed files are
  	 *   permitted to overlap inexactly as far as we are concerned for in
  	 *   these cases, sharing is handled in the driver or filesystem rather
  	 *   than here
  	 */
  	if (vm_flags & VM_MAYSHARE) {
8feae1311   David Howells   NOMMU: Make VMAs ...
1266
1267
  		struct vm_region *pregion;
  		unsigned long pglen, rpglen, pgend, rpgend, start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1268

8feae1311   David Howells   NOMMU: Make VMAs ...
1269
1270
  		pglen = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
  		pgend = pgoff + pglen;
165b23927   David Howells   [PATCH] NOMMU: ma...
1271

8feae1311   David Howells   NOMMU: Make VMAs ...
1272
1273
  		for (rb = rb_first(&nommu_region_tree); rb; rb = rb_next(rb)) {
  			pregion = rb_entry(rb, struct vm_region, vm_rb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1274

8feae1311   David Howells   NOMMU: Make VMAs ...
1275
  			if (!(pregion->vm_flags & VM_MAYSHARE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1276
1277
1278
  				continue;
  
  			/* search for overlapping mappings on the same file */
8feae1311   David Howells   NOMMU: Make VMAs ...
1279
1280
  			if (pregion->vm_file->f_path.dentry->d_inode !=
  			    file->f_path.dentry->d_inode)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1281
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1282
  			if (pregion->vm_pgoff >= pgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1283
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1284
1285
1286
1287
  			rpglen = pregion->vm_end - pregion->vm_start;
  			rpglen = (rpglen + PAGE_SIZE - 1) >> PAGE_SHIFT;
  			rpgend = pregion->vm_pgoff + rpglen;
  			if (pgoff >= rpgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1288
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1289
1290
1291
1292
1293
  			/* handle inexactly overlapping matches between
  			 * mappings */
  			if ((pregion->vm_pgoff != pgoff || rpglen != pglen) &&
  			    !(pgoff >= pregion->vm_pgoff && pgend <= rpgend)) {
  				/* new mapping is not a subset of the region */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1294
1295
1296
1297
  				if (!(capabilities & BDI_CAP_MAP_DIRECT))
  					goto sharing_violation;
  				continue;
  			}
8feae1311   David Howells   NOMMU: Make VMAs ...
1298
  			/* we've found a region we can share */
1e2ae599d   David Howells   nommu: struct vm_...
1299
  			pregion->vm_usage++;
8feae1311   David Howells   NOMMU: Make VMAs ...
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
  			vma->vm_region = pregion;
  			start = pregion->vm_start;
  			start += (pgoff - pregion->vm_pgoff) << PAGE_SHIFT;
  			vma->vm_start = start;
  			vma->vm_end = start + len;
  
  			if (pregion->vm_flags & VM_MAPPED_COPY) {
  				kdebug("share copy");
  				vma->vm_flags |= VM_MAPPED_COPY;
  			} else {
  				kdebug("share mmap");
  				ret = do_mmap_shared_file(vma);
  				if (ret < 0) {
  					vma->vm_region = NULL;
  					vma->vm_start = 0;
  					vma->vm_end = 0;
1e2ae599d   David Howells   nommu: struct vm_...
1316
  					pregion->vm_usage--;
8feae1311   David Howells   NOMMU: Make VMAs ...
1317
1318
1319
1320
1321
1322
1323
1324
1325
  					pregion = NULL;
  					goto error_just_free;
  				}
  			}
  			fput(region->vm_file);
  			kmem_cache_free(vm_region_jar, region);
  			region = pregion;
  			result = start;
  			goto share;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1326
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1327
1328
1329
1330
  		/* obtain the address at which to make a shared mapping
  		 * - this is the hook for quasi-memory character devices to
  		 *   tell us the location of a shared mapping
  		 */
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1331
  		if (capabilities & BDI_CAP_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1332
1333
  			addr = file->f_op->get_unmapped_area(file, addr, len,
  							     pgoff, flags);
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1334
  			if (IS_ERR_VALUE(addr)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1335
  				ret = addr;
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1336
  				if (ret != -ENOSYS)
8feae1311   David Howells   NOMMU: Make VMAs ...
1337
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1338
1339
1340
1341
  
  				/* the driver refused to tell us where to site
  				 * the mapping so we'll have to attempt to copy
  				 * it */
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1342
  				ret = -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1343
  				if (!(capabilities & BDI_CAP_MAP_COPY))
8feae1311   David Howells   NOMMU: Make VMAs ...
1344
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1345
1346
  
  				capabilities &= ~BDI_CAP_MAP_DIRECT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1347
1348
1349
  			} else {
  				vma->vm_start = region->vm_start = addr;
  				vma->vm_end = region->vm_end = addr + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1350
1351
1352
  			}
  		}
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1353
  	vma->vm_region = region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1354

645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1355
1356
1357
  	/* set up the mapping
  	 * - the region is filled in if BDI_CAP_MAP_DIRECT is still set
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1358
  	if (file && vma->vm_flags & VM_SHARED)
8feae1311   David Howells   NOMMU: Make VMAs ...
1359
  		ret = do_mmap_shared_file(vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1360
  	else
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1361
  		ret = do_mmap_private(vma, region, len, capabilities);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1362
  	if (ret < 0)
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1363
1364
  		goto error_just_free;
  	add_nommu_region(region);
8feae1311   David Howells   NOMMU: Make VMAs ...
1365

ea6376395   Jie Zhang   nommu: fix malloc...
1366
1367
1368
1369
  	/* clear anonymous mappings that don't ask for uninitialized data */
  	if (!vma->vm_file && !(flags & MAP_UNINITIALIZED))
  		memset((void *)region->vm_start, 0,
  		       region->vm_end - region->vm_start);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1370
  	/* okay... we have a mapping; now we have to register it */
8feae1311   David Howells   NOMMU: Make VMAs ...
1371
  	result = vma->vm_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1372

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1373
  	current->mm->total_vm += len >> PAGE_SHIFT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1374
1375
  share:
  	add_vma_to_mm(current->mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1376

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1377
1378
1379
1380
1381
1382
  	/* we flush the region from the icache only when the first executable
  	 * mapping of it is made  */
  	if (vma->vm_flags & VM_EXEC && !region->vm_icache_flushed) {
  		flush_icache_range(region->vm_start, region->vm_end);
  		region->vm_icache_flushed = true;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1383

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1384
  	up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1385

8feae1311   David Howells   NOMMU: Make VMAs ...
1386
1387
  	kleave(" = %lx", result);
  	return result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1388

8feae1311   David Howells   NOMMU: Make VMAs ...
1389
1390
1391
  error_just_free:
  	up_write(&nommu_region_sem);
  error:
89a864027   David Howells   NOMMU: Don't pass...
1392
1393
  	if (region->vm_file)
  		fput(region->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1394
  	kmem_cache_free(vm_region_jar, region);
89a864027   David Howells   NOMMU: Don't pass...
1395
1396
  	if (vma->vm_file)
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
  	if (vma->vm_flags & VM_EXECUTABLE)
  		removed_exe_file_vma(vma->vm_mm);
  	kmem_cache_free(vm_area_cachep, vma);
  	kleave(" = %d", ret);
  	return ret;
  
  sharing_violation:
  	up_write(&nommu_region_sem);
  	printk(KERN_WARNING "Attempt to share mismatched mappings
  ");
  	ret = -EINVAL;
  	goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1409

8feae1311   David Howells   NOMMU: Make VMAs ...
1410
1411
1412
1413
1414
  error_getting_vma:
  	kmem_cache_free(vm_region_jar, region);
  	printk(KERN_WARNING "Allocation of vma for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1415
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1416
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1417
  	return -ENOMEM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1418
1419
1420
1421
  error_getting_region:
  	printk(KERN_WARNING "Allocation of vm region for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1422
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1423
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1424
1425
  	return -ENOMEM;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1426
  EXPORT_SYMBOL(do_mmap_pgoff);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1427

66f0dc481   Hugh Dickins   mm: move sys_mmap...
1428
1429
1430
1431
1432
1433
  /*
   * mmap_pgoff system call
   * - unless MAP_ANONYMOUS is given, fd is looked up with fget(); a failed
   *   lookup yields -EBADF
   * - MAP_EXECUTABLE and MAP_DENYWRITE are stripped from flags before the
   *   request is passed to do_mmap_pgoff() with the caller's mmap_sem held
   *   for writing
   */
  SYSCALL_DEFINE6(mmap_pgoff, unsigned long, addr, unsigned long, len,
  		unsigned long, prot, unsigned long, flags,
  		unsigned long, fd, unsigned long, pgoff)
  {
  	struct mm_struct *mm = current->mm;
  	struct file *filp = NULL;
  	unsigned long result;
  
  	audit_mmap_fd(fd, flags);
  
  	/* a file reference is only needed for non-anonymous mappings */
  	if (!(flags & MAP_ANONYMOUS)) {
  		filp = fget(fd);
  		if (!filp)
  			return -EBADF;
  	}
  
  	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);
  
  	down_write(&mm->mmap_sem);
  	result = do_mmap_pgoff(filp, addr, len, prot, flags, pgoff);
  	up_write(&mm->mmap_sem);
  
  	/* drop the reference taken by fget() above */
  	if (filp)
  		fput(filp);
  
  	return result;
  }
a4679373c   Christoph Hellwig   Add generic sys_o...
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
  #ifdef __ARCH_WANT_SYS_OLD_MMAP
  /* argument block that old_mmap() reads from userspace in one go */
  struct mmap_arg_struct {
  	unsigned long addr;
  	unsigned long len;
  	unsigned long prot;
  	unsigned long flags;
  	unsigned long fd;
  	unsigned long offset;
  };
  
  /*
   * old-style mmap system call
   * - copies the argument block from userspace (-EFAULT if that fails)
   * - the byte offset must be page aligned (-EINVAL otherwise) and is converted
   *   to a page offset before being handed to sys_mmap_pgoff()
   */
  SYSCALL_DEFINE1(old_mmap, struct mmap_arg_struct __user *, arg)
  {
  	struct mmap_arg_struct args;
  
  	if (copy_from_user(&args, arg, sizeof(args)) != 0)
  		return -EFAULT;
  
  	if ((args.offset & ~PAGE_MASK) != 0)
  		return -EINVAL;
  
  	return sys_mmap_pgoff(args.addr, args.len, args.prot, args.flags,
  			      args.fd, args.offset >> PAGE_SHIFT);
  }
  #endif /* __ARCH_WANT_SYS_OLD_MMAP */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1475
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1476
1477
   * split a vma into two pieces at address 'addr', a new vma is allocated either
   * for the first part or the tail.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1478
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1479
1480
  int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
  	      unsigned long addr, int new_below)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1481
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1482
1483
1484
  	struct vm_area_struct *new;
  	struct vm_region *region;
  	unsigned long npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1485

8feae1311   David Howells   NOMMU: Make VMAs ...
1486
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1487

779c10232   David Howells   nommu: remove a s...
1488
1489
1490
  	/* we're only permitted to split anonymous regions (these should have
  	 * only a single usage on the region) */
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
1491
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1492

8feae1311   David Howells   NOMMU: Make VMAs ...
1493
1494
  	if (mm->map_count >= sysctl_max_map_count)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1495

8feae1311   David Howells   NOMMU: Make VMAs ...
1496
1497
1498
  	region = kmem_cache_alloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1499

8feae1311   David Howells   NOMMU: Make VMAs ...
1500
1501
1502
1503
1504
1505
1506
1507
1508
1509
1510
1511
1512
1513
  	new = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
  	if (!new) {
  		kmem_cache_free(vm_region_jar, region);
  		return -ENOMEM;
  	}
  
  	/* most fields are the same, copy all, and then fixup */
  	*new = *vma;
  	*region = *vma->vm_region;
  	new->vm_region = region;
  
  	npages = (addr - vma->vm_start) >> PAGE_SHIFT;
  
  	if (new_below) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1514
  		region->vm_top = region->vm_end = new->vm_end = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1515
1516
1517
  	} else {
  		region->vm_start = new->vm_start = addr;
  		region->vm_pgoff = new->vm_pgoff += npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1518
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
1530
  
  	if (new->vm_ops && new->vm_ops->open)
  		new->vm_ops->open(new);
  
  	delete_vma_from_mm(vma);
  	down_write(&nommu_region_sem);
  	delete_nommu_region(vma->vm_region);
  	if (new_below) {
  		vma->vm_region->vm_start = vma->vm_start = addr;
  		vma->vm_region->vm_pgoff = vma->vm_pgoff += npages;
  	} else {
  		vma->vm_region->vm_end = vma->vm_end = addr;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1531
  		vma->vm_region->vm_top = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1532
1533
1534
1535
1536
1537
1538
  	}
  	add_nommu_region(vma->vm_region);
  	add_nommu_region(new->vm_region);
  	up_write(&nommu_region_sem);
  	add_vma_to_mm(mm, vma);
  	add_vma_to_mm(mm, new);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1539
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1540
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1541
1542
   * shrink a VMA by removing the specified chunk from either the beginning or
   * the end
3034097a5   David Howells   [PATCH] NOMMU: Or...
1543
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1544
1545
1546
  static int shrink_vma(struct mm_struct *mm,
  		      struct vm_area_struct *vma,
  		      unsigned long from, unsigned long to)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1547
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1548
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1549

8feae1311   David Howells   NOMMU: Make VMAs ...
1550
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1551

8feae1311   David Howells   NOMMU: Make VMAs ...
1552
1553
1554
1555
1556
1557
1558
1559
  	/* adjust the VMA's pointers, which may reposition it in the MM's tree
  	 * and list */
  	delete_vma_from_mm(vma);
  	if (from > vma->vm_start)
  		vma->vm_end = from;
  	else
  		vma->vm_start = to;
  	add_vma_to_mm(mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1560

8feae1311   David Howells   NOMMU: Make VMAs ...
1561
1562
  	/* cut the backing region down to size */
  	region = vma->vm_region;
1e2ae599d   David Howells   nommu: struct vm_...
1563
  	BUG_ON(region->vm_usage != 1);
8feae1311   David Howells   NOMMU: Make VMAs ...
1564
1565
1566
  
  	down_write(&nommu_region_sem);
  	delete_nommu_region(region);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1567
1568
1569
1570
  	if (from > region->vm_start) {
  		to = region->vm_top;
  		region->vm_top = region->vm_end = from;
  	} else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1571
  		region->vm_start = to;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1572
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1573
1574
1575
1576
1577
1578
  	add_nommu_region(region);
  	up_write(&nommu_region_sem);
  
  	free_page_series(from, to);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1579

8feae1311   David Howells   NOMMU: Make VMAs ...
1580
1581
1582
1583
1584
1585
1586
1587
  /*
   * release a mapping
   * - under NOMMU conditions the chunk to be unmapped must be backed by a single
   *   VMA, though it need not cover the whole VMA
   * - len is rounded up to a whole number of pages; a zero length is rejected
   *   with -EINVAL
   * - a file-backed VMA can only be released whole; an anonymous VMA may also
   *   be trimmed at either end, or split first when the chunk lies in its
   *   middle
   * - returns 0 on success or a negative error code
   */
  int do_munmap(struct mm_struct *mm, unsigned long start, size_t len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end;
  	int ret;
  
  	kenter(",%lx,%zx", start, len);
  
  	len = PAGE_ALIGN(len);
  	if (len == 0)
  		return -EINVAL;
  
  	end = start + len;
  
  	/* find the first potentially overlapping VMA */
  	vma = find_vma(mm, start);
  	if (!vma) {
  		/* only warn about the first few bogus requests */
  		static int limit = 0;
  		if (limit < 5) {
  			printk(KERN_WARNING
  			       "munmap of memory not mmapped by process %d (%s): 0x%lx-0x%lx\n",
  			       current->pid, current->comm,
  			       start, start + len - 1);
  			limit++;
  		}
  		return -EINVAL;
  	}
  
  	/* we're allowed to split an anonymous VMA but not a file-backed one */
  	if (vma->vm_file) {
  		/* walk forward from the VMA found: give up as soon as one
  		 * begins below start, and accept the one whose end matches */
  		do {
  			if (start > vma->vm_start) {
  				kleave(" = -EINVAL [miss]");
  				return -EINVAL;
  			}
  			if (end == vma->vm_end)
  				goto erase_whole_vma;
  			vma = vma->vm_next;
  		} while (vma);
  		kleave(" = -EINVAL [split file]");
  		return -EINVAL;
  	} else {
  		/* the chunk must be a subset of the VMA found */
  		if (start == vma->vm_start && end == vma->vm_end)
  			goto erase_whole_vma;
  		if (start < vma->vm_start || end > vma->vm_end) {
  			kleave(" = -EINVAL [superset]");
  			return -EINVAL;
  		}
  		if (start & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned start]");
  			return -EINVAL;
  		}
  		if (end != vma->vm_end && end & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned split]");
  			return -EINVAL;
  		}
  		/* a chunk strictly inside the VMA needs the part below it
  		 * split off first, leaving a VMA that begins at start */
  		if (start != vma->vm_start && end != vma->vm_end) {
  			ret = split_vma(mm, vma, start, 1);
  			if (ret < 0) {
  				kleave(" = %d [split]", ret);
  				return ret;
  			}
  		}
  		return shrink_vma(mm, vma, start, end);
  	}
  
  erase_whole_vma:
  	delete_vma_from_mm(vma);
  	delete_vma(mm, vma);
  	kleave(" = 0");
  	return 0;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1659
  EXPORT_SYMBOL(do_munmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1660

6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1661
  /*
   * munmap system call: run do_munmap() on the caller's mm with its mmap_sem
   * held for writing
   */
  SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
  {
  	struct mm_struct *mm = current->mm;
  	int err;
  
  	down_write(&mm->mmap_sem);
  	err = do_munmap(mm, addr, len);
  	up_write(&mm->mmap_sem);
  
  	return err;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1673
   * release all the mappings made in a process's VM space
3034097a5   David Howells   [PATCH] NOMMU: Or...
1674
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1675
  void exit_mmap(struct mm_struct *mm)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1676
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1677
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1678

8feae1311   David Howells   NOMMU: Make VMAs ...
1679
1680
  	if (!mm)
  		return;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1681

8feae1311   David Howells   NOMMU: Make VMAs ...
1682
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1683

8feae1311   David Howells   NOMMU: Make VMAs ...
1684
  	mm->total_vm = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1685

8feae1311   David Howells   NOMMU: Make VMAs ...
1686
1687
1688
1689
  	while ((vma = mm->mmap)) {
  		mm->mmap = vma->vm_next;
  		delete_vma_from_mm(vma);
  		delete_vma(mm, vma);
04c349615   Steven J. Magnani   nommu: yield CPU ...
1690
  		cond_resched();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1691
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1692
1693
  
  	kleave("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1694
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1695
1696
1697
1698
1699
1700
  /*
   * stub: both arguments are ignored and the call always fails with -ENOMEM
   */
  unsigned long do_brk(unsigned long addr, unsigned long len)
  {
  	return (unsigned long) -ENOMEM;
  }
  
  /*
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1701
1702
   * expand (or shrink) an existing mapping, potentially moving it at the same
   * time (controlled by the MREMAP_MAYMOVE flag and available VM space)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1703
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1704
   * under NOMMU conditions, we only permit changing a mapping's size, and only
8feae1311   David Howells   NOMMU: Make VMAs ...
1705
1706
   * as long as it stays within the region allocated by do_mmap_private() and the
   * block is not shareable
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1707
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1708
   * MREMAP_FIXED is not supported under NOMMU conditions
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1709
1710
1711
1712
1713
   */
  unsigned long do_mremap(unsigned long addr,
  			unsigned long old_len, unsigned long new_len,
  			unsigned long flags, unsigned long new_addr)
  {
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1714
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1715
1716
  
  	/* insanity checks first */
f67d9b157   Bob Liu   nommu: add page a...
1717
1718
  	old_len = PAGE_ALIGN(old_len);
  	new_len = PAGE_ALIGN(new_len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1719
  	if (old_len == 0 || new_len == 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1720
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1721
1722
  	if (addr & ~PAGE_MASK)
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1723
1724
  	if (flags & MREMAP_FIXED && new_addr != addr)
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1725
  	vma = find_vma_exact(current->mm, addr, old_len);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1726
1727
  	if (!vma)
  		return (unsigned long) -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1728

6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1729
  	if (vma->vm_end != vma->vm_start + old_len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1730
  		return (unsigned long) -EFAULT;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1731
  	if (vma->vm_flags & VM_MAYSHARE)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1732
  		return (unsigned long) -EPERM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1733
  	if (new_len > vma->vm_region->vm_end - vma->vm_region->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1734
1735
1736
  		return (unsigned long) -ENOMEM;
  
  	/* all checks complete - do it */
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1737
  	vma->vm_end = vma->vm_start + new_len;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1738
1739
  	return vma->vm_start;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1740
  EXPORT_SYMBOL(do_mremap);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1741

6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1742
1743
1744
  /*
   * mremap system call: run do_mremap() with the caller's mmap_sem held for
   * writing
   */
  SYSCALL_DEFINE5(mremap, unsigned long, addr, unsigned long, old_len,
  		unsigned long, new_len, unsigned long, flags,
  		unsigned long, new_addr)
  {
  	struct mm_struct *mm = current->mm;
  	unsigned long result;
  
  	down_write(&mm->mmap_sem);
  	result = do_mremap(addr, old_len, new_len, flags, new_addr);
  	up_write(&mm->mmap_sem);
  
  	return result;
  }
6aab341e0   Linus Torvalds   mm: re-architect ...
1753
  /*
   * stub: no page is ever looked up; the arguments are ignored and NULL is
   * always returned
   */
  struct page *follow_page(struct vm_area_struct *vma, unsigned long address,
  			 unsigned int foll_flags)
  {
  	return NULL;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1758
1759
1760
  /*
   * stand-in for remap_pfn_range()
   * - the from, to, size and prot arguments are not used
   * - the only effect is to move the start of the VMA to the address obtained
   *   by shifting its page offset left by PAGE_SHIFT
   * - always returns 0
   *
   * NOTE(review): vm_end is left untouched here, whereas remap_vmalloc_range()
   * in this file recomputes it - confirm callers cope with the VMA's end not
   * following its start
   */
  int remap_pfn_range(struct vm_area_struct *vma, unsigned long from,
  		unsigned long to, unsigned long size, pgprot_t prot)
  {
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
1761
1762
  	/* reposition the VMA according to its page offset */
  	vma->vm_start = vma->vm_pgoff << PAGE_SHIFT;
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1763
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1764
  EXPORT_SYMBOL(remap_pfn_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1765

f905bc447   Paul Mundt   nommu: add new vm...
1766
1767
1768
1769
1770
1771
1772
1773
1774
1775
1776
1777
1778
1779
  /*
   * reposition a VMA onto the memory at addr plus pgoff pages
   * - the VMA keeps its length; only its start and end addresses change
   * - returns -EINVAL if VM_USERMAP is not set in the VMA's flags, otherwise 0
   */
  int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
  			unsigned long pgoff)
  {
  	/* keep the full width of the address difference; narrowing it to
  	 * unsigned int would truncate the length of a very large mapping */
  	unsigned long size = vma->vm_end - vma->vm_start;
  
  	if (!(vma->vm_flags & VM_USERMAP))
  		return -EINVAL;
  
  	vma->vm_start = (unsigned long)(addr + (pgoff << PAGE_SHIFT));
  	vma->vm_end = vma->vm_start + size;
  
  	return 0;
  }
  EXPORT_SYMBOL(remap_vmalloc_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1780
1781
1782
1783
1784
  /*
   * stub: no address is ever chosen; the arguments are ignored and the call
   * always fails with -ENOMEM
   */
  unsigned long arch_get_unmapped_area(struct file *file, unsigned long addr,
  				     unsigned long len, unsigned long pgoff,
  				     unsigned long flags)
  {
  	return (unsigned long) -ENOMEM;
  }
1363c3cd8   Wolfgang Wander   [PATCH] Avoiding ...
1785
  /*
   * stub: deliberately empty, both arguments are ignored
   */
  void arch_unmap_area(struct mm_struct *mm, unsigned long addr)
  {
  	/* nothing to do */
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1788
1789
1790
1791
1792
  /*
   * stub: deliberately empty, all arguments are ignored
   */
  void unmap_mapping_range(struct address_space *mapping,
  			 const loff_t holebegin, const loff_t holelen,
  			 int even_cows)
  {
  	/* nothing to do */
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1793
  EXPORT_SYMBOL(unmap_mapping_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1794
1795
1796
1797
1798
1799
1800
1801
1802
1803
1804
1805
1806
1807
1808
1809
1810
  
  /*
   * Check that a process has enough memory to allocate a new virtual
   * mapping. 0 means there is enough memory for the allocation to
   * succeed and -ENOMEM implies there is not.
   *
   * We currently support three overcommit policies, which are set via the
   * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting
   *
   * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
   * Additional code 2002 Jul 20 by Robert Love.
   *
   * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
   *
   * Note this is a helper function intended to be used by LSMs which
   * wish to use this logic.
   */
34b4e4aa3   Alan Cox   fix NULL pointer ...
1811
  int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1812
1813
1814
1815
1816
1817
1818
1819
1820
1821
1822
1823
1824
  {
  	unsigned long free, allowed;
  
  	vm_acct_memory(pages);
  
  	/*
  	 * Sometimes we want to use more memory than we have
  	 */
  	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
  		return 0;
  
  	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
  		unsigned long n;
347ce434d   Christoph Lameter   [PATCH] zoned vm ...
1825
  		free = global_page_state(NR_FILE_PAGES);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1826
1827
1828
1829
1830
1831
1832
1833
  		free += nr_swap_pages;
  
  		/*
  		 * Any slabs which are created with the
  		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
  		 * which are reclaimable, under pressure.  The dentry
  		 * cache and most inode caches should fall into this
  		 */
972d1a7b1   Christoph Lameter   [PATCH] ZVC: Supp...
1834
  		free += global_page_state(NR_SLAB_RECLAIMABLE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1835
1836
1837
1838
1839
1840
1841
1842
1843
1844
1845
1846
1847
1848
1849
  
  		/*
  		 * Leave the last 3% for root
  		 */
  		if (!cap_sys_admin)
  			free -= free / 32;
  
  		if (free > pages)
  			return 0;
  
  		/*
  		 * nr_free_pages() is very expensive on large systems,
  		 * only call if we're about to fail.
  		 */
  		n = nr_free_pages();
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1850
1851
1852
1853
1854
1855
1856
1857
1858
1859
1860
1861
  
  		/*
  		 * Leave reserved pages. The pages are not for anonymous pages.
  		 */
  		if (n <= totalreserve_pages)
  			goto error;
  		else
  			n -= totalreserve_pages;
  
  		/*
  		 * Leave the last 3% for root
  		 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1862
1863
1864
1865
1866
1867
  		if (!cap_sys_admin)
  			n -= n / 32;
  		free += n;
  
  		if (free > pages)
  			return 0;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1868
1869
  
  		goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1870
1871
1872
1873
1874
1875
1876
1877
1878
1879
1880
1881
  	}
  
  	allowed = totalram_pages * sysctl_overcommit_ratio / 100;
  	/*
  	 * Leave the last 3% for root
  	 */
  	if (!cap_sys_admin)
  		allowed -= allowed / 32;
  	allowed += total_swap_pages;
  
  	/* Don't let a single process grow too big:
  	   leave 3% of the size of this process for other processes */
731572d39   Alan Cox   nfsd: fix vm over...
1882
1883
  	if (mm)
  		allowed -= mm->total_vm / 32;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1884

00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1885
  	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1886
  		return 0;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1887

d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1888
  error:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1889
1890
1891
1892
  	vm_unacct_memory(pages);
  
  	return -ENOMEM;
  }
cae5d3903   Stephen Wilson   mm: arch: rename ...
1893
  /*
   * stub: the address is ignored and 0 is always returned
   */
  int in_gate_area_no_mm(unsigned long addr)
  {
  	return 0;
  }
b0e15190e   David Howells   [PATCH] NOMMU: Ma...
1897

d0217ac04   Nick Piggin   mm: fault feedbac...
1898
  /*
   * stub: reaching this function is treated as a bug - BUG() is invoked
   * unconditionally and the return statement only follows it
   */
  int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();
  	return 0;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1903
  EXPORT_SYMBOL(filemap_fault);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1904

f55f199b7   Mike Frysinger   NOMMU: implement ...
1905
1906
  static int __access_remote_vm(struct task_struct *tsk, struct mm_struct *mm,
  		unsigned long addr, void *buf, int len, int write)
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1907
  {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1908
  	struct vm_area_struct *vma;
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1909
1910
1911
1912
  
  	down_read(&mm->mmap_sem);
  
  	/* the access must start within one of the target process's mappings */
0159b141d   David Howells   [PATCH] NOMMU: Us...
1913
1914
  	vma = find_vma(mm, addr);
  	if (vma) {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1915
1916
1917
1918
1919
  		/* don't overrun this mapping */
  		if (addr + len >= vma->vm_end)
  			len = vma->vm_end - addr;
  
  		/* only read or write mappings where it is permitted */
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1920
  		if (write && vma->vm_flags & VM_MAYWRITE)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1921
1922
  			copy_to_user_page(vma, NULL, addr,
  					 (void *) addr, buf, len);
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1923
  		else if (!write && vma->vm_flags & VM_MAYREAD)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1924
1925
  			copy_from_user_page(vma, NULL, addr,
  					    buf, (void *) addr, len);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1926
1927
1928
1929
1930
1931
1932
  		else
  			len = 0;
  	} else {
  		len = 0;
  	}
  
  	up_read(&mm->mmap_sem);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1933
1934
1935
1936
1937
1938
1939
1940
1941
1942
1943
1944
1945
1946
1947
1948
1949
1950
1951
1952
1953
1954
1955
1956
1957
1958
1959
1960
1961
1962
1963
1964
1965
1966
1967
1968
  
  	return len;
  }
  
  /**
   * access_remote_vm - access another process' address space
   * @mm:		the mm_struct of the target address space
   * @addr:	start address to access
   * @buf:	source or destination buffer
   * @len:	number of bytes to transfer
   * @write:	whether the access is a write
   *
   * The caller must hold a reference on @mm.
   *
   * Returns whatever __access_remote_vm() returns for the same arguments, with
   * no task supplied.
   */
  int access_remote_vm(struct mm_struct *mm, unsigned long addr,
  		void *buf, int len, int write)
  {
  	int done;
  
  	done = __access_remote_vm(NULL, mm, addr, buf, len, write);
  	return done;
  }
  
  /*
   * Access another process' address space.
   * - source/target buffer must be kernel space
   * - returns 0 if addr + len wraps around or the task has no mm to take a
   *   reference on; otherwise returns the result of __access_remote_vm()
   */
  int access_process_vm(struct task_struct *tsk, unsigned long addr, void *buf, int len, int write)
  {
  	struct mm_struct *mm;
  	int done;
  
  	/* refuse a range that wraps around the end of the address space */
  	if (addr + len < addr)
  		return 0;
  
  	mm = get_task_mm(tsk);
  	if (!mm)
  		return 0;
  
  	done = __access_remote_vm(tsk, mm, addr, buf, len, write);
  
  	/* drop the reference taken by get_task_mm() */
  	mmput(mm);
  
  	return done;
  }
7e6608724   David Howells   nommu: fix shared...
1972
1973
1974
1975
1976
1977
1978
1979
1980
1981
1982
1983
1984
1985
1986
1987
1988
1989
1990
1991
1992
1993
1994
1995
1996
1997
1998
1999
2000
2001
2002
2003
2004
2005
2006
2007
2008
2009
2010
2011
2012
2013
2014
2015
2016
2017
2018
2019
2020
2021
2022
2023
2024
2025
2026
2027
2028
2029
2030
2031
2032
2033
  
  /**
   * nommu_shrink_inode_mappings - Shrink the shared mappings on an inode
   * @inode: The inode to check
   * @size: The current filesize of the inode
   * @newsize: The proposed filesize of the inode
   *
   * Check the shared mappings on an inode on behalf of a shrinking truncate to
   * make sure that any outstanding VMAs aren't broken, and then shrink the
   * vm_regions that extend beyond the new size so that do_mmap_pgoff() doesn't
   * automatically grant mappings that are too large.
   *
   * Returns 0 on success, or -ETXTBSY if a shared VMA overlaps the range that
   * is being truncated away.
   */
  int nommu_shrink_inode_mappings(struct inode *inode, size_t size,
  				size_t newsize)
  {
  	struct address_space *mapping = inode->i_mapping;
  	struct vm_area_struct *vma;
  	struct prio_tree_iter iter;
  	struct vm_region *region;
  	pgoff_t low, high;
  	size_t r_size, r_top;
  	int ret = 0;
  
  	/* page range of the dead zone: from the new EOF to the old one */
  	low = newsize >> PAGE_SHIFT;
  	high = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
  
  	down_write(&nommu_region_sem);
  
  	/* search for VMAs that fall within the dead zone */
  	vma_prio_tree_foreach(vma, &iter, &mapping->i_mmap, low, high) {
  		/* found one - only interested if it's shared out of the page
  		 * cache */
  		if (vma->vm_flags & VM_SHARED) {
  			/* not quite true, but near enough */
  			ret = -ETXTBSY;
  			goto unlock;
  		}
  	}
  
  	/* reduce any regions that overlap the dead zone - if in existence,
  	 * these will be pointed to by VMAs that don't overlap the dead zone
  	 *
  	 * we don't check for any regions that start beyond the EOF as there
  	 * shouldn't be any
  	 */
  	vma_prio_tree_foreach(vma, &iter, &mapping->i_mmap, 0, ULONG_MAX) {
  		if (vma->vm_flags & VM_SHARED) {
  			region = vma->vm_region;
  			r_size = region->vm_top - region->vm_start;
  			r_top = (region->vm_pgoff << PAGE_SHIFT) + r_size;
  
  			/* pull the top of the region back to the new EOF and
  			 * keep vm_end from exceeding it */
  			if (r_top > newsize) {
  				region->vm_top -= r_top - newsize;
  				if (region->vm_end > region->vm_top)
  					region->vm_end = region->vm_top;
  			}
  		}
  	}
  
  unlock:
  	up_write(&nommu_region_sem);
  	return ret;
  }