Blame view

mm/nommu.c 53.7 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
  /*
   *  linux/mm/nommu.c
   *
   *  Replacement code for mm functions to support CPU's that don't
   *  have any form of memory management unit (thus no virtual memory).
   *
   *  See Documentation/nommu-mmap.txt
   *
8feae1311   David Howells   NOMMU: Make VMAs ...
9
   *  Copyright (c) 2004-2008 David Howells <dhowells@redhat.com>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
12
   *  Copyright (c) 2000-2003 David McCullough <davidm@snapgear.com>
   *  Copyright (c) 2000-2001 D Jeff Dionne <jeff@uClinux.org>
   *  Copyright (c) 2002      Greg Ungerer <gerg@snapgear.com>
29c185e5c   Paul Mundt   nommu: Provide st...
13
   *  Copyright (c) 2007-2010 Paul Mundt <lethal@linux-sh.org>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
14
   */
b1de0d139   Mitchel Humpherys   mm: convert some ...
15
  #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
b95f1b31b   Paul Gortmaker   mm: Map most file...
16
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
17
  #include <linux/mm.h>
615d6e875   Davidlohr Bueso   mm: per-thread vm...
18
  #include <linux/vmacache.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
22
23
24
25
  #include <linux/mman.h>
  #include <linux/swap.h>
  #include <linux/file.h>
  #include <linux/highmem.h>
  #include <linux/pagemap.h>
  #include <linux/slab.h>
  #include <linux/vmalloc.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
26
27
  #include <linux/blkdev.h>
  #include <linux/backing-dev.h>
3b32123d7   Gideon Israel Dsouza   mm: use macros fr...
28
  #include <linux/compiler.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
29
30
31
32
  #include <linux/mount.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
120a795da   Al Viro   audit mmap
33
  #include <linux/audit.h>
cf4aebc29   Clark Williams   sched: Move sched...
34
  #include <linux/sched/sysctl.h>
b1de0d139   Mitchel Humpherys   mm: convert some ...
35
  #include <linux/printk.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
36
37
38
39
  
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
  #include <asm/tlbflush.h>
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
40
  #include <asm/mmu_context.h>
8feae1311   David Howells   NOMMU: Make VMAs ...
41
  #include "internal.h"
8feae1311   David Howells   NOMMU: Make VMAs ...
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
  /*
   * Function entry/exit/debug tracing helpers.
   *
   * Change "#if 0" to "#if 1" to route the messages through printk();
   * otherwise they are handed to no_printk() instead.  Each format string
   * is terminated with an escaped newline so that the literal stays on a
   * single source line.
   */
  #if 0
  #define kenter(FMT, ...) \
  	printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	printk(KERN_DEBUG "xxx" FMT"yyy\n", ##__VA_ARGS__)
  #else
  #define kenter(FMT, ...) \
  	no_printk(KERN_DEBUG "==> %s("FMT")\n", __func__, ##__VA_ARGS__)
  #define kleave(FMT, ...) \
  	no_printk(KERN_DEBUG "<== %s()"FMT"\n", __func__, ##__VA_ARGS__)
  #define kdebug(FMT, ...) \
  	no_printk(KERN_DEBUG FMT"\n", ##__VA_ARGS__)
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
63
64
  
  void *high_memory;
944b68749   Arnd Bergmann   mm: export "high_...
65
  EXPORT_SYMBOL(high_memory);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
66
67
  struct page *mem_map;
  unsigned long max_mapnr;
5b8bf3072   gchen gchen   mm/nommu.c: expor...
68
  EXPORT_SYMBOL(max_mapnr);
4266c97a3   Hugh Dickins   nommu: fix two bu...
69
  unsigned long highest_memmap_pfn;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
70
  struct percpu_counter vm_committed_as;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
71
72
  int sysctl_overcommit_memory = OVERCOMMIT_GUESS; /* heuristic overcommit */
  int sysctl_overcommit_ratio = 50; /* default is 50% */
49f0ce5f9   Jerome Marchand   mm: add overcommi...
73
  unsigned long sysctl_overcommit_kbytes __read_mostly;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
74
  int sysctl_max_map_count = DEFAULT_MAX_MAP_COUNT;
fc4d5c292   David Howells   nommu: make the i...
75
  int sysctl_nr_trim_pages = CONFIG_NOMMU_INITIAL_TRIM_EXCESS;
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
76
  unsigned long sysctl_user_reserve_kbytes __read_mostly = 1UL << 17; /* 128MB */
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
77
  unsigned long sysctl_admin_reserve_kbytes __read_mostly = 1UL << 13; /* 8MB */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
78
  int heap_stack_gap = 0;
33e5d7697   David Howells   nommu: fix a numb...
79
  atomic_long_t mmap_pages_allocated;
8feae1311   David Howells   NOMMU: Make VMAs ...
80

997071bcb   K. Y. Srinivasan   mm: export a func...
81
82
83
84
85
86
87
88
89
90
91
92
93
94
  /*
   * The global memory commitment made in the system can be a metric
   * that can be used to drive ballooning decisions when Linux is hosted
   * as a guest. On Hyper-V, the host implements a policy engine for dynamically
   * balancing memory across competing virtual machines that are hosted.
   * Several metrics drive this policy engine including the guest reported
   * memory commitment.
   */
  unsigned long vm_memory_committed(void)
  {
  	unsigned long committed;

  	/* snapshot of the global vm_committed_as per-CPU counter */
  	committed = percpu_counter_read_positive(&vm_committed_as);

  	return committed;
  }
  
  EXPORT_SYMBOL_GPL(vm_memory_committed);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
95
  EXPORT_SYMBOL(mem_map);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
96

8feae1311   David Howells   NOMMU: Make VMAs ...
97
98
99
100
  /* list of mapped, potentially shareable regions */
  /* slab cache for struct vm_region; created in mmap_init() */
  static struct kmem_cache *vm_region_jar;
  /* rb-tree of regions, ordered by vm_start (see add_nommu_region()) */
  struct rb_root nommu_region_tree = RB_ROOT;
  /* rw-semaphore; taken for writing around __put_nommu_region() */
  DECLARE_RWSEM(nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
101

f0f37e2f7   Alexey Dobriyan   const: mark struc...
102
  /* VM operations table for generic file mappings; no callbacks are set here */
  const struct vm_operations_struct generic_file_vm_ops = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
103
104
105
  };
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
106
107
108
109
110
111
112
113
   * Return the total memory allocated for this pointer, not
   * just what the caller asked for.
   *
   * Doesn't have to be accurate, i.e. may have races.
   */
  unsigned int kobjsize(const void *objp)
  {
  	struct page *page;
4016a1390   Michael Hennerich   mm/nommu.c: retur...
114
115
116
117
  	/*
  	 * If the object we have should not have ksize performed on it,
  	 * return size of 0
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
118
  	if (!objp || !virt_addr_valid(objp))
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
119
120
121
  		return 0;
  
  	page = virt_to_head_page(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
122
123
124
125
126
  
  	/*
  	 * If the allocator sets PageSlab, we know the pointer came from
  	 * kmalloc().
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
127
128
  	if (PageSlab(page))
  		return ksize(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
129
  	/*
ab2e83ead   Paul Mundt   NOMMU: Teach kobj...
130
131
132
133
134
135
136
137
138
139
140
141
142
143
  	 * If it's not a compound page, see if we have a matching VMA
  	 * region. This test is intentionally done in reverse order,
  	 * so if there's no VMA, we still fall through and hand back
  	 * PAGE_SIZE for 0-order pages.
  	 */
  	if (!PageCompound(page)) {
  		struct vm_area_struct *vma;
  
  		vma = find_vma(current->mm, (unsigned long)objp);
  		if (vma)
  			return vma->vm_end - vma->vm_start;
  	}
  
  	/*
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
144
  	 * The ksize() function is only guaranteed to work for pointers
5a1603be5   Paul Mundt   nommu: Correct ko...
145
  	 * returned by kmalloc(). So handle arbitrary pointers here.
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
146
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
147
  	return PAGE_SIZE << compound_order(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
148
  }
28a35716d   Michel Lespinasse   mm: use long type...
149
150
151
152
  long __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		      unsigned long start, unsigned long nr_pages,
  		      unsigned int foll_flags, struct page **pages,
  		      struct vm_area_struct **vmas, int *nonblocking)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
153
  {
910e46da4   Sonic Zhang   [PATCH] Check if ...
154
  	struct vm_area_struct *vma;
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
155
156
157
158
  	unsigned long vm_flags;
  	int i;
  
  	/* calculate required read or write permissions.
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
159
  	 * If FOLL_FORCE is set, we only require the "MAY" flags.
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
160
  	 */
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
161
162
163
164
  	vm_flags  = (foll_flags & FOLL_WRITE) ?
  			(VM_WRITE | VM_MAYWRITE) : (VM_READ | VM_MAYREAD);
  	vm_flags &= (foll_flags & FOLL_FORCE) ?
  			(VM_MAYREAD | VM_MAYWRITE) : (VM_READ | VM_WRITE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
165

9d73777e5   Peter Zijlstra   clarify get_user_...
166
  	for (i = 0; i < nr_pages; i++) {
7561e8ca0   David Howells   NOMMU: Revert 'no...
167
  		vma = find_vma(mm, start);
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
168
169
170
171
  		if (!vma)
  			goto finish_or_fault;
  
  		/* protect what we can, including chardevs */
1c3aff1ce   Hugh Dickins   mm: remove unused...
172
173
  		if ((vma->vm_flags & (VM_IO | VM_PFNMAP)) ||
  		    !(vm_flags & vma->vm_flags))
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
174
  			goto finish_or_fault;
910e46da4   Sonic Zhang   [PATCH] Check if ...
175

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
176
177
178
179
180
181
  		if (pages) {
  			pages[i] = virt_to_page(start);
  			if (pages[i])
  				page_cache_get(pages[i]);
  		}
  		if (vmas)
910e46da4   Sonic Zhang   [PATCH] Check if ...
182
  			vmas[i] = vma;
e1ee65d85   David Howells   NOMMU: Fix __get_...
183
  		start = (start + PAGE_SIZE) & PAGE_MASK;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
184
  	}
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
185
186
187
188
189
  
  	return i;
  
  finish_or_fault:
  	return i ? : -EFAULT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
190
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
191

b291f0003   Nick Piggin   mlock: mlocked pa...
192
193
194
195
196
197
198
  /*
   * get a list of pages in an address range belonging to the specified process
   * and indicate the VMA that covers each page
   * - this is potentially dodgy as we may end incrementing the page count of a
   *   slab page or a secondary page from a compound page
   * - don't permit access to VMAs that don't support it, such as I/O mappings
   */
28a35716d   Michel Lespinasse   mm: use long type...
199
200
201
202
  long get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		    unsigned long start, unsigned long nr_pages,
  		    int write, int force, struct page **pages,
  		    struct vm_area_struct **vmas)
b291f0003   Nick Piggin   mlock: mlocked pa...
203
204
205
206
  {
  	int flags = 0;
  
  	if (write)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
207
  		flags |= FOLL_WRITE;
b291f0003   Nick Piggin   mlock: mlocked pa...
208
  	if (force)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
209
  		flags |= FOLL_FORCE;
b291f0003   Nick Piggin   mlock: mlocked pa...
210

53a7706d5   Michel Lespinasse   mlock: do not hol...
211
212
  	return __get_user_pages(tsk, mm, start, nr_pages, flags, pages, vmas,
  				NULL);
b291f0003   Nick Piggin   mlock: mlocked pa...
213
  }
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
214
  EXPORT_SYMBOL(get_user_pages);
f0818f472   Andrea Arcangeli   mm: gup: add get_...
215
216
217
218
219
220
221
222
223
  long get_user_pages_locked(struct task_struct *tsk, struct mm_struct *mm,
  			   unsigned long start, unsigned long nr_pages,
  			   int write, int force, struct page **pages,
  			   int *locked)
  {
  	long pinned;

  	/* @locked is not consulted here; no VMA array is requested */
  	pinned = get_user_pages(tsk, mm, start, nr_pages, write, force,
  				pages, NULL);

  	return pinned;
  }
  EXPORT_SYMBOL(get_user_pages_locked);
0fd71a56f   Andrea Arcangeli   mm: gup: add __ge...
224
225
226
227
  long __get_user_pages_unlocked(struct task_struct *tsk, struct mm_struct *mm,
  			       unsigned long start, unsigned long nr_pages,
  			       int write, int force, struct page **pages,
  			       unsigned int gup_flags)
f0818f472   Andrea Arcangeli   mm: gup: add get_...
228
229
230
231
232
233
234
235
  {
  	long ret;
  	down_read(&mm->mmap_sem);
  	ret = get_user_pages(tsk, mm, start, nr_pages, write, force,
  			     pages, NULL);
  	up_read(&mm->mmap_sem);
  	return ret;
  }
0fd71a56f   Andrea Arcangeli   mm: gup: add __ge...
236
237
238
239
240
241
242
243
244
  EXPORT_SYMBOL(__get_user_pages_unlocked);
  
  long get_user_pages_unlocked(struct task_struct *tsk, struct mm_struct *mm,
  			     unsigned long start, unsigned long nr_pages,
  			     int write, int force, struct page **pages)
  {
  	/* no additional gup flags are supplied by this wrapper */
  	const unsigned int extra_flags = 0;

  	return __get_user_pages_unlocked(tsk, mm, start, nr_pages, write,
  					 force, pages, extra_flags);
  }
f0818f472   Andrea Arcangeli   mm: gup: add get_...
245
  EXPORT_SYMBOL(get_user_pages_unlocked);
dfc2f91ac   Paul Mundt   nommu: provide fo...
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
  /**
   * follow_pfn - look up PFN at a user virtual address
   * @vma: memory mapping
   * @address: user virtual address
   * @pfn: location to store found PFN
   *
   * Only IO mappings and raw PFN mappings are allowed.
   *
   * Returns zero and the pfn at @pfn on success, -ve otherwise.
   */
  int follow_pfn(struct vm_area_struct *vma, unsigned long address,
  	unsigned long *pfn)
  {
  	/* only IO and raw-PFN mappings may be translated */
  	if (vma->vm_flags & (VM_IO | VM_PFNMAP)) {
  		/* the PFN is simply the address's page number */
  		*pfn = address >> PAGE_SHIFT;
  		return 0;
  	}

  	return -EINVAL;
  }
  EXPORT_SYMBOL(follow_pfn);
f1c4069e1   Joonsoo Kim   mm, vmalloc: expo...
266
  LIST_HEAD(vmap_area_list);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
267

b3bdda02a   Christoph Lameter   vmalloc: add cons...
268
  /*
   * Release memory obtained from the vmalloc family.  In this file
   * __vmalloc() allocates with kmalloc(), so freeing is a plain kfree().
   */
  void vfree(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
269
270
271
  {
  	kfree(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
272
  EXPORT_SYMBOL(vfree);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
273

dd0fc66fb   Al Viro   [PATCH] gfp flags...
274
  void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
  {
  	gfp_t kmalloc_flags;

  	/*
  	 * kmalloc() returns only a logical address, so __GFP_HIGHMEM cannot
  	 * be passed to it: strip that bit and add __GFP_COMP.  @prot is not
  	 * used.
  	 */
  	kmalloc_flags = (gfp_mask | __GFP_COMP) & ~__GFP_HIGHMEM;

  	return kmalloc(size, kmalloc_flags);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
282
  EXPORT_SYMBOL(__vmalloc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
283

f905bc447   Paul Mundt   nommu: add new vm...
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
  void *vmalloc_user(unsigned long size)
  {
  	struct vm_area_struct *vma;
  	void *mem;

  	mem = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	if (!mem)
  		return mem;

  	/* tag the VMA covering the new buffer (if any) as user-mappable */
  	down_write(&current->mm->mmap_sem);
  	vma = find_vma(current->mm, (unsigned long)mem);
  	if (vma)
  		vma->vm_flags |= VM_USERMAP;
  	up_write(&current->mm->mmap_sem);

  	return mem;
  }
  EXPORT_SYMBOL(vmalloc_user);
b3bdda02a   Christoph Lameter   vmalloc: add cons...
303
  /* Translate @addr to its struct page directly via virt_to_page(). */
  struct page *vmalloc_to_page(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
304
305
306
  {
  	return virt_to_page(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
307
  EXPORT_SYMBOL(vmalloc_to_page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
308

b3bdda02a   Christoph Lameter   vmalloc: add cons...
309
  unsigned long vmalloc_to_pfn(const void *addr)
  {
  	/* address -> struct page -> page frame number */
  	struct page *page = virt_to_page(addr);

  	return page_to_pfn(page);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
313
  EXPORT_SYMBOL(vmalloc_to_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
314
315
316
  
  /*
   * Copy @count bytes from @addr into @buf and return the number copied.
   * @count is trimmed if @buf + @count would wrap the address space.
   */
  long vread(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dst = (unsigned long) buf;

  	/* Don't allow overflow */
  	if (dst + count < count)
  		count = -dst;

  	memcpy(buf, addr, count);

  	return count;
  }
  
  /*
   * Copy @count bytes from @buf into @addr and return the number copied.
   * @count is trimmed if @addr + @count would wrap the address space.
   */
  long vwrite(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dst = (unsigned long) addr;

  	/* Don't allow overflow */
  	if (dst + count < count)
  		count = -dst;

  	memcpy(addr, buf, count);

  	return count;
  }
  
  /*
   *	vmalloc  -  allocate virtually contiguous memory
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *
c1c8897f8   Michael Opdenacker   Spelling fix: "co...
342
   *	For tight control over page level allocator and protection flags
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
343
344
345
346
347
348
   *	use __vmalloc() instead.
   */
  void *vmalloc(unsigned long size)
  {
         return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
  }
f61388822   Andrew Morton   [PATCH] nommu: im...
349
  EXPORT_SYMBOL(vmalloc);
e1ca7788d   Dave Young   mm: add vzalloc()...
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
  /*
   *	vzalloc - allocate virtually contiguous memory with zero fill
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *	The memory allocated is set to zero.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  void *vzalloc(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  }
  EXPORT_SYMBOL(vzalloc);
  
  /**
   * vmalloc_node - allocate memory on a specific node
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
f61388822   Andrew Morton   [PATCH] nommu: im...
380
381
382
383
  void *vmalloc_node(unsigned long size, int node)
  {
  	/* @node is ignored here: the request is forwarded to vmalloc() */
  	return vmalloc(size);
  }
9a14f653d   Paul Mundt   nommu: Fix up vma...
384
  EXPORT_SYMBOL(vmalloc_node);
e1ca7788d   Dave Young   mm: add vzalloc()...
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
  
  /**
   * vzalloc_node - allocate memory on a specific node with zero fill
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   * The memory allocated is set to zero.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
  void *vzalloc_node(unsigned long size, int node)
  {
  	/* @node is ignored here: the request is forwarded to vzalloc() */
  	return vzalloc(size);
  }
  EXPORT_SYMBOL(vzalloc_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
403

1af446edf   Paul Mundt   nommu: Provide vm...
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
  #ifndef PAGE_KERNEL_EXEC
  # define PAGE_KERNEL_EXEC PAGE_KERNEL
  #endif
  
  /**
   *	vmalloc_exec  -  allocate virtually contiguous, executable memory
   *	@size:		allocation size
   *
   *	Kernel-internal function to allocate enough pages to cover @size
   *	from the page level allocator and map them into contiguous and
   *	executable kernel virtual space.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  
  void *vmalloc_exec(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
424
425
  /**
   * vmalloc_32  -  allocate virtually contiguous memory (32bit addressable)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
426
427
428
429
430
431
432
433
434
   *	@size:		allocation size
   *
   *	Allocate enough 32bit PA addressable pages to cover @size from the
   *	page level allocator and map them into contiguous kernel virtual space.
   */
  void *vmalloc_32(unsigned long size)
  {
  	/* plain GFP_KERNEL: unlike vmalloc(), __GFP_HIGHMEM is not requested */
  	return __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
435
436
437
438
439
440
441
442
  EXPORT_SYMBOL(vmalloc_32);
  
  /**
   * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
   *	@size:		allocation size
   *
   * The resulting memory area is 32bit addressable and zeroed so it can be
   * mapped to userspace without leaking data.
f905bc447   Paul Mundt   nommu: add new vm...
443
444
445
   *
   * VM_USERMAP is set on the corresponding VMA so that subsequent calls to
   * remap_vmalloc_range() are permissible.
b50731732   Paul Mundt   nommu: vmalloc_32...
446
447
448
   */
  void *vmalloc_32_user(unsigned long size)
  {
f905bc447   Paul Mundt   nommu: add new vm...
449
450
451
452
453
  	/*
  	 * We'll have to sort out the ZONE_DMA bits for 64-bit,
  	 * but for now this can simply use vmalloc_user() directly.
  	 */
  	/* NOTE: no 32-bit addressing constraint is applied by this call */
  	return vmalloc_user(size);
b50731732   Paul Mundt   nommu: vmalloc_32...
454
455
  }
  EXPORT_SYMBOL(vmalloc_32_user);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
456
457
458
459
460
461
  
  /* Stub: not supported in this file; any call hits BUG(). */
  void *vmap(struct page **pages, unsigned int count, unsigned long flags, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
462
  EXPORT_SYMBOL(vmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
463

b3bdda02a   Christoph Lameter   vmalloc: add cons...
464
  /* Stub counterpart of vmap(): any call hits BUG(). */
  void vunmap(const void *addr)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
465
466
467
  {
  	BUG();
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
468
  EXPORT_SYMBOL(vunmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
469

eb6434d9e   Paul Mundt   nommu: Stub in vm...
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
  /* Stub: not supported in this file; any call hits BUG(). */
  void *vm_map_ram(struct page **pages, unsigned int count, int node, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL(vm_map_ram);
  
  /* Stub counterpart of vm_map_ram(): any call hits BUG(). */
  void vm_unmap_ram(const void *mem, unsigned int count)
  {
  	BUG();
  }
  EXPORT_SYMBOL(vm_unmap_ram);
  
  /* Intentionally empty: this implementation has nothing to do here. */
  void vm_unmap_aliases(void)
  {
  }
  EXPORT_SYMBOL_GPL(vm_unmap_aliases);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
487
  /*
1eeb66a1b   Christoph Hellwig   move die notifier...
488
489
490
   * Implement a stub for vmalloc_sync_all() if the architecture chose not to
   * have one.
   */
3b32123d7   Gideon Israel Dsouza   mm: use macros fr...
491
  void __weak vmalloc_sync_all(void)
1eeb66a1b   Christoph Hellwig   move die notifier...
492
493
  {
  	/* weak default: does nothing unless an architecture overrides it */
  }
29c185e5c   Paul Mundt   nommu: Provide st...
494
495
496
497
498
499
500
501
502
503
504
505
  /**
   *	alloc_vm_area - allocate a range of kernel address space
   *	@size:		size of the area
   *
   *	Returns:	NULL on failure, vm_struct on success
   *
   *	This function reserves a range of kernel address space, and
   *	allocates pagetables to map that range.  No actual mappings
   *	are created.  If the kernel address space is not shared
   *	between processes, it syncs the pagetable across all
   *	processes.
   */
cd12909cb   David Vrabel   xen: map foreign ...
506
  /*
   * NOTE: in this file the function is only a stub; it hits BUG() on any
   * call and neither @size nor @ptes is examined.
   */
  struct vm_struct *alloc_vm_area(size_t size, pte_t **ptes)
29c185e5c   Paul Mundt   nommu: Provide st...
507
508
509
510
511
512
513
514
515
516
517
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL_GPL(alloc_vm_area);
  
  /* Stub counterpart of alloc_vm_area(): any call hits BUG(). */
  void free_vm_area(struct vm_struct *area)
  {
  	BUG();
  }
  EXPORT_SYMBOL_GPL(free_vm_area);
b50731732   Paul Mundt   nommu: vmalloc_32...
518
519
520
521
522
523
  /* Stub: inserting a page into a VMA is not supported; always -EINVAL. */
  int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
  		   struct page *page)
  {
  	return -EINVAL;
  }
  EXPORT_SYMBOL(vm_insert_page);
1eeb66a1b   Christoph Hellwig   move die notifier...
524
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
525
526
527
528
529
530
   *  sys_brk() for the most part doesn't need the global kernel
   *  lock, except when an application is doing something nasty
   *  like trying to un-brk an area that has already been mapped
   *  to a regular file.  in this case, the unmapping will need
   *  to invoke file system routines that need the global lock.
   */
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
531
  SYSCALL_DEFINE1(brk, unsigned long, brk)
  {
  	struct mm_struct *mm = current->mm;
  	bool outside_heap;

  	/*
  	 * Requests outside [start_brk, context.end_brk], and requests that
  	 * would not move the break, just report the current break.
  	 */
  	outside_heap = brk < mm->start_brk || brk > mm->context.end_brk;
  	if (outside_heap || mm->brk == brk)
  		return mm->brk;

  	/*
  	 * Always allow shrinking brk; only a growing break needs the
  	 * icache flushed over the newly exposed range.
  	 */
  	if (brk > mm->brk)
  		flush_icache_range(mm->brk, brk);

  	/*
  	 * Ok, looks good - let it rip.
  	 */
  	mm->brk = brk;
  	return brk;
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
555
556
557
558
  /*
   * initialise the VMA and region record slabs
   */
  void __init mmap_init(void)
  {
  	/* set up the committed-memory counter, starting from zero */
  	int err = percpu_counter_init(&vm_committed_as, 0, GFP_KERNEL);

  	VM_BUG_ON(err);

  	/* slab cache backing struct vm_region allocations */
  	vm_region_jar = KMEM_CACHE(vm_region, SLAB_PANIC);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
565

3034097a5   David Howells   [PATCH] NOMMU: Or...
566
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
567
568
   * validate the region tree
   * - the caller must hold the region lock
3034097a5   David Howells   [PATCH] NOMMU: Or...
569
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
570
571
  #ifdef CONFIG_DEBUG_NOMMU_REGIONS
  static noinline void validate_nommu_regions(void)
  {
  	struct vm_region *prev, *cur;
  	struct rb_node *node;

  	node = rb_first(&nommu_region_tree);
  	if (!node)
  		return;

  	/* the first region only has to be internally consistent */
  	prev = rb_entry(node, struct vm_region, vm_rb);
  	BUG_ON(unlikely(prev->vm_end <= prev->vm_start));
  	BUG_ON(unlikely(prev->vm_top < prev->vm_end));

  	/* every later region must also start at or above its predecessor's top */
  	for (node = rb_next(node); node; node = rb_next(node)) {
  		cur = rb_entry(node, struct vm_region, vm_rb);

  		BUG_ON(unlikely(cur->vm_end <= cur->vm_start));
  		BUG_ON(unlikely(cur->vm_top < cur->vm_end));
  		BUG_ON(unlikely(cur->vm_start < prev->vm_top));

  		prev = cur;
  	}
  }
  #else
  /* validation compiled out: nothing to check */
  static void validate_nommu_regions(void)
  {
  }
  #endif
3034097a5   David Howells   [PATCH] NOMMU: Or...
599
600
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
601
   * add a region into the global tree
3034097a5   David Howells   [PATCH] NOMMU: Or...
602
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
603
  static void add_nommu_region(struct vm_region *region)
3034097a5   David Howells   [PATCH] NOMMU: Or...
604
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
605
606
  	struct vm_region *pregion;
  	struct rb_node **p, *parent;
3034097a5   David Howells   [PATCH] NOMMU: Or...
607

8feae1311   David Howells   NOMMU: Make VMAs ...
608
  	validate_nommu_regions();
8feae1311   David Howells   NOMMU: Make VMAs ...
609
610
611
612
613
614
615
616
617
618
619
620
621
  	parent = NULL;
  	p = &nommu_region_tree.rb_node;
  	while (*p) {
  		parent = *p;
  		pregion = rb_entry(parent, struct vm_region, vm_rb);
  		if (region->vm_start < pregion->vm_start)
  			p = &(*p)->rb_left;
  		else if (region->vm_start > pregion->vm_start)
  			p = &(*p)->rb_right;
  		else if (pregion == region)
  			return;
  		else
  			BUG();
3034097a5   David Howells   [PATCH] NOMMU: Or...
622
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
623
624
  	rb_link_node(&region->vm_rb, parent, p);
  	rb_insert_color(&region->vm_rb, &nommu_region_tree);
3034097a5   David Howells   [PATCH] NOMMU: Or...
625

8feae1311   David Howells   NOMMU: Make VMAs ...
626
  	validate_nommu_regions();
3034097a5   David Howells   [PATCH] NOMMU: Or...
627
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
628
629
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
630
   * delete a region from the global tree
930e652a2   David Howells   [PATCH] NOMMU: Ma...
631
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
632
  static void delete_nommu_region(struct vm_region *region)
930e652a2   David Howells   [PATCH] NOMMU: Ma...
633
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
634
  	/* removing from an empty tree is a bug */
  	BUG_ON(!nommu_region_tree.rb_node);
930e652a2   David Howells   [PATCH] NOMMU: Ma...
635

8feae1311   David Howells   NOMMU: Make VMAs ...
636
637
638
  	/* check tree consistency both before and after the erase */
  	validate_nommu_regions();
  	rb_erase(&region->vm_rb, &nommu_region_tree);
  	validate_nommu_regions();
57c8f63e8   Greg Ungerer   nommu: stub expan...
639
  }
930e652a2   David Howells   [PATCH] NOMMU: Ma...
640
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
641
   * free a contiguous series of pages
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
642
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
643
  static void free_page_series(unsigned long from, unsigned long to)
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
644
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
645
646
647
648
  	for (; from < to; from += PAGE_SIZE) {
  		struct page *page = virt_to_page(from);
  
  		kdebug("- free %lx", from);
33e5d7697   David Howells   nommu: fix a numb...
649
  		atomic_long_dec(&mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
650
  		if (page_count(page) != 1)
33e5d7697   David Howells   nommu: fix a numb...
651
652
  			kdebug("free page %p: refcount not one: %d",
  			       page, page_count(page));
8feae1311   David Howells   NOMMU: Make VMAs ...
653
  		put_page(page);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
654
  	}
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
655
656
657
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
658
   * release a reference to a region
33e5d7697   David Howells   nommu: fix a numb...
659
   * - the caller must hold the region semaphore for writing, which this releases
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
660
   * - the region may not have been added to the tree yet, in which case vm_top
8feae1311   David Howells   NOMMU: Make VMAs ...
661
   *   will equal vm_start
3034097a5   David Howells   [PATCH] NOMMU: Or...
662
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
663
664
  static void __put_nommu_region(struct vm_region *region)
  	__releases(nommu_region_sem)
  {
  	kenter("%p{%d}", region, region->vm_usage);

  	BUG_ON(!nommu_region_tree.rb_node);

  	/* other users remain: just drop the semaphore and leave */
  	region->vm_usage--;
  	if (region->vm_usage != 0) {
  		up_write(&nommu_region_sem);
  		return;
  	}

  	/* last user: unlink from the tree if the region was ever added */
  	if (region->vm_top > region->vm_start)
  		delete_nommu_region(region);
  	up_write(&nommu_region_sem);

  	if (region->vm_file)
  		fput(region->vm_file);

  	/* IO memory and memory shared directly out of the pagecache
  	 * from ramfs/tmpfs mustn't be released here */
  	if (region->vm_flags & VM_MAPPED_COPY) {
  		kdebug("free series");
  		free_page_series(region->vm_start, region->vm_top);
  	}

  	kmem_cache_free(vm_region_jar, region);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
689

8feae1311   David Howells   NOMMU: Make VMAs ...
690
691
692
693
694
695
696
  /*
   * Drop one reference to a region on behalf of a caller that does not hold
   * nommu_region_sem: take the semaphore for writing, then hand over to
   * __put_nommu_region(), which releases it again.
   */
  static void put_nommu_region(struct vm_region *region)
  {
  	down_write(&nommu_region_sem);
  	__put_nommu_region(region);
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
698
  /*
   * Apply the protection @flags to every page covered by a VMA.
   * - only does anything when CONFIG_MPU is set; otherwise the body is empty
   * - walks from the page containing vm_start up to vm_end calling
   *   protect_page() on each page, then calls update_protections() once
   */
  static void protect_vma(struct vm_area_struct *vma, unsigned long flags)
  {
  #ifdef CONFIG_MPU
  	struct mm_struct *mm = vma->vm_mm;
  	unsigned long start;

  	/* addresses are handled as unsigned long elsewhere in this file, so
  	 * keep the cursor unsigned rather than mixing a signed long into the
  	 * comparison against vm_end */
  	for (start = vma->vm_start & PAGE_MASK;
  	     start < vma->vm_end;
  	     start += PAGE_SIZE)
  		protect_page(mm, start, flags);

  	update_protections(mm);
  #endif
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
715
716
717
718
   * add a VMA into a process's mm_struct in the appropriate place in the list
   * and tree and add to the address space's page tree also if not an anonymous
   * page
   * - should be called with mm->mmap_sem held writelocked
3034097a5   David Howells   [PATCH] NOMMU: Or...
719
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
720
  static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
721
  {
6038def0d   Namhyung Kim   mm: nommu: sort m...
722
  	struct vm_area_struct *pvma, *prev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
723
  	struct address_space *mapping;
6038def0d   Namhyung Kim   mm: nommu: sort m...
724
  	struct rb_node **p, *parent, *rb_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
725
726
727
728
729
730
731
  
  	kenter(",%p", vma);
  
  	BUG_ON(!vma->vm_region);
  
  	mm->map_count++;
  	vma->vm_mm = mm;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
732

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
733
  	protect_vma(vma, vma->vm_flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
734
735
736
  	/* add the VMA to the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
737
  		i_mmap_lock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
738
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
739
  		vma_interval_tree_insert(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
740
  		flush_dcache_mmap_unlock(mapping);
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
741
  		i_mmap_unlock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
742
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
743
  	/* add the VMA to the tree */
6038def0d   Namhyung Kim   mm: nommu: sort m...
744
  	parent = rb_prev = NULL;
8feae1311   David Howells   NOMMU: Make VMAs ...
745
  	p = &mm->mm_rb.rb_node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
746
747
748
  	while (*p) {
  		parent = *p;
  		pvma = rb_entry(parent, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
749
750
751
  		/* sort by: start addr, end addr, VMA struct addr in that order
  		 * (the latter is necessary as we may get identical VMAs) */
  		if (vma->vm_start < pvma->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
752
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
753
754
  		else if (vma->vm_start > pvma->vm_start) {
  			rb_prev = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
755
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
756
  		} else if (vma->vm_end < pvma->vm_end)
8feae1311   David Howells   NOMMU: Make VMAs ...
757
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
758
759
  		else if (vma->vm_end > pvma->vm_end) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
760
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
761
  		} else if (vma < pvma)
8feae1311   David Howells   NOMMU: Make VMAs ...
762
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
763
764
  		else if (vma > pvma) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
765
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
766
  		} else
8feae1311   David Howells   NOMMU: Make VMAs ...
767
  			BUG();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
768
769
770
  	}
  
  	rb_link_node(&vma->vm_rb, parent, p);
8feae1311   David Howells   NOMMU: Make VMAs ...
771
772
773
  	rb_insert_color(&vma->vm_rb, &mm->mm_rb);
  
  	/* add VMA to the VMA list also */
6038def0d   Namhyung Kim   mm: nommu: sort m...
774
775
776
  	prev = NULL;
  	if (rb_prev)
  		prev = rb_entry(rb_prev, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
777

6038def0d   Namhyung Kim   mm: nommu: sort m...
778
  	__vma_link_list(mm, vma, prev, parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
779
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
780
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
781
   * delete a VMA from its owning mm_struct and address space
3034097a5   David Howells   [PATCH] NOMMU: Or...
782
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
783
  static void delete_vma_from_mm(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
784
  {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
785
  	int i;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
786
  	struct address_space *mapping;
8feae1311   David Howells   NOMMU: Make VMAs ...
787
  	struct mm_struct *mm = vma->vm_mm;
615d6e875   Davidlohr Bueso   mm: per-thread vm...
788
  	struct task_struct *curr = current;
8feae1311   David Howells   NOMMU: Make VMAs ...
789
790
  
  	kenter("%p", vma);
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
791
  	protect_vma(vma, 0);
8feae1311   David Howells   NOMMU: Make VMAs ...
792
  	mm->map_count--;
615d6e875   Davidlohr Bueso   mm: per-thread vm...
793
794
795
  	for (i = 0; i < VMACACHE_SIZE; i++) {
  		/* if the vma is cached, invalidate the entire cache */
  		if (curr->vmacache[i] == vma) {
e020d5bd8   Steven Miao   mm: nommu: per-th...
796
  			vmacache_invalidate(mm);
615d6e875   Davidlohr Bueso   mm: per-thread vm...
797
798
799
  			break;
  		}
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
800
801
802
803
  
  	/* remove the VMA from the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
804
  		i_mmap_lock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
805
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
806
  		vma_interval_tree_remove(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
807
  		flush_dcache_mmap_unlock(mapping);
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
808
  		i_mmap_unlock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
809
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
810
811
  	/* remove from the MM's tree and list */
  	rb_erase(&vma->vm_rb, &mm->mm_rb);
b951bf2c4   Namhyung Kim   mm: nommu: don't ...
812
813
814
815
816
817
818
819
  
  	if (vma->vm_prev)
  		vma->vm_prev->vm_next = vma->vm_next;
  	else
  		mm->mmap = vma->vm_next;
  
  	if (vma->vm_next)
  		vma->vm_next->vm_prev = vma->vm_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
820
821
822
823
824
825
826
827
828
829
  }
  
  /*
   * Tear down a VMA record:
   * - call the VMA's ->close() operation if it has one
   * - drop the VMA's reference on its file, if any
   * - drop the VMA's reference on its region
   * - return the VMA to vm_area_cachep
   * @mm is not used by the body.
   */
  static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
  {
  	kenter("%p", vma);

  	if (vma->vm_ops) {
  		if (vma->vm_ops->close)
  			vma->vm_ops->close(vma);
  	}

  	if (vma->vm_file)
  		fput(vma->vm_file);

  	put_nommu_region(vma->vm_region);
  	kmem_cache_free(vm_area_cachep, vma);
  }
  
  /*
   * look up the first VMA in which addr resides, NULL if none
   * - should be called with mm->mmap_sem at least held readlocked
   */
  struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *vma;
8feae1311   David Howells   NOMMU: Make VMAs ...
843
844
  
  	/* check the cache first */
615d6e875   Davidlohr Bueso   mm: per-thread vm...
845
846
  	vma = vmacache_find(mm, addr);
  	if (likely(vma))
8feae1311   David Howells   NOMMU: Make VMAs ...
847
  		return vma;
e922c4c53   Namhyung Kim   mm: nommu: find v...
848
  	/* trawl the list (there may be multiple mappings in which addr
8feae1311   David Howells   NOMMU: Make VMAs ...
849
  	 * resides) */
e922c4c53   Namhyung Kim   mm: nommu: find v...
850
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
8feae1311   David Howells   NOMMU: Make VMAs ...
851
852
853
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end > addr) {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
854
  			vmacache_update(addr, vma);
8feae1311   David Howells   NOMMU: Make VMAs ...
855
856
857
858
859
860
861
862
863
864
865
866
867
868
  			return vma;
  		}
  	}
  
  	return NULL;
  }
  EXPORT_SYMBOL(find_vma);
  
  /*
   * Look up the VMA containing addr.
   * - stack VMAs are never extended under NOMMU conditions, so this is a
   *   plain find_vma() lookup
   */
  struct vm_area_struct *find_extend_vma(struct mm_struct *mm, unsigned long addr)
  {
  	return find_vma(mm, addr);
  }
  
  /*
   * Stack expansion entry point.
   * - not supported under NOMMU conditions: both arguments are ignored and
   *   -ENOMEM is always returned
   */
  int expand_stack(struct vm_area_struct *vma, unsigned long address)
  {
  	return -ENOMEM;
  }
  
  /*
   * look up the first VMA exactly that exactly matches addr
   * - should be called with mm->mmap_sem at least held readlocked
   */
  static struct vm_area_struct *find_vma_exact(struct mm_struct *mm,
  					     unsigned long addr,
  					     unsigned long len)
  {
  	struct vm_area_struct *vma;
8feae1311   David Howells   NOMMU: Make VMAs ...
890
891
892
  	unsigned long end = addr + len;
  
  	/* check the cache first */
615d6e875   Davidlohr Bueso   mm: per-thread vm...
893
894
  	vma = vmacache_find_exact(mm, addr, end);
  	if (vma)
8feae1311   David Howells   NOMMU: Make VMAs ...
895
  		return vma;
e922c4c53   Namhyung Kim   mm: nommu: find v...
896
  	/* trawl the list (there may be multiple mappings in which addr
8feae1311   David Howells   NOMMU: Make VMAs ...
897
  	 * resides) */
e922c4c53   Namhyung Kim   mm: nommu: find v...
898
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
8feae1311   David Howells   NOMMU: Make VMAs ...
899
900
901
902
903
  		if (vma->vm_start < addr)
  			continue;
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end == end) {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
904
  			vmacache_update(addr, vma);
8feae1311   David Howells   NOMMU: Make VMAs ...
905
906
907
908
909
  			return vma;
  		}
  	}
  
  	return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
910
911
912
913
914
915
916
917
918
919
920
921
922
923
  }
  
  /*
   * determine whether a mapping should be permitted and, if so, what sort of
   * mapping we're capable of supporting
   */
  static int validate_mmap_request(struct file *file,
  				 unsigned long addr,
  				 unsigned long len,
  				 unsigned long prot,
  				 unsigned long flags,
  				 unsigned long pgoff,
  				 unsigned long *_capabilities)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
924
  	unsigned long capabilities, rlen;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
925
926
927
  	int ret;
  
  	/* do the simple checks first */
06aab5a30   David Howells   NOMMU: Ignore mma...
928
  	if (flags & MAP_FIXED) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
929
930
931
932
933
934
935
936
937
938
  		printk(KERN_DEBUG
  		       "%d: Can't do fixed-address/overlay mmap of RAM
  ",
  		       current->pid);
  		return -EINVAL;
  	}
  
  	if ((flags & MAP_TYPE) != MAP_PRIVATE &&
  	    (flags & MAP_TYPE) != MAP_SHARED)
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
939
  	if (!len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
940
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
941
  	/* Careful about overflows.. */
8feae1311   David Howells   NOMMU: Make VMAs ...
942
943
  	rlen = PAGE_ALIGN(len);
  	if (!rlen || rlen > TASK_SIZE)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
944
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
945
  	/* offset overflow? */
8feae1311   David Howells   NOMMU: Make VMAs ...
946
  	if ((pgoff + (rlen >> PAGE_SHIFT)) < pgoff)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
947
  		return -EOVERFLOW;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
948
949
  
  	if (file) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
950
  		/* files must support mmap */
72c2d5319   Al Viro   file->f_op is nev...
951
  		if (!file->f_op->mmap)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
952
953
954
955
956
957
  			return -ENODEV;
  
  		/* work out if what we've got could possibly be shared
  		 * - we support chardevs that provide their own "memory"
  		 * - we support files/blockdevs that are memory backed
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
958
959
960
  		if (file->f_op->mmap_capabilities) {
  			capabilities = file->f_op->mmap_capabilities(file);
  		} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
961
962
  			/* no explicit capabilities set, so assume some
  			 * defaults */
496ad9aa8   Al Viro   new helper: file_...
963
  			switch (file_inode(file)->i_mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
964
965
  			case S_IFREG:
  			case S_IFBLK:
b4caecd48   Christoph Hellwig   fs: introduce f_o...
966
  				capabilities = NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
967
968
969
970
  				break;
  
  			case S_IFCHR:
  				capabilities =
b4caecd48   Christoph Hellwig   fs: introduce f_o...
971
972
973
  					NOMMU_MAP_DIRECT |
  					NOMMU_MAP_READ |
  					NOMMU_MAP_WRITE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
974
975
976
977
978
979
980
981
982
983
  				break;
  
  			default:
  				return -EINVAL;
  			}
  		}
  
  		/* eliminate any capabilities that we can't support on this
  		 * device */
  		if (!file->f_op->get_unmapped_area)
b4caecd48   Christoph Hellwig   fs: introduce f_o...
984
  			capabilities &= ~NOMMU_MAP_DIRECT;
6e242a1ce   Al Viro   nommu: use __vfs_...
985
  		if (!(file->f_mode & FMODE_CAN_READ))
b4caecd48   Christoph Hellwig   fs: introduce f_o...
986
  			capabilities &= ~NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
987

28d7a6ae9   Graff Yang   nommu: check fd r...
988
989
990
  		/* The file shall have been opened with read permission. */
  		if (!(file->f_mode & FMODE_READ))
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
991
992
993
994
995
  		if (flags & MAP_SHARED) {
  			/* do checks for writing, appending and locking */
  			if ((prot & PROT_WRITE) &&
  			    !(file->f_mode & FMODE_WRITE))
  				return -EACCES;
496ad9aa8   Al Viro   new helper: file_...
996
  			if (IS_APPEND(file_inode(file)) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
997
998
  			    (file->f_mode & FMODE_WRITE))
  				return -EACCES;
d7a06983a   Jeff Layton   locks: fix locks_...
999
  			if (locks_verify_locked(file))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1000
  				return -EAGAIN;
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1001
  			if (!(capabilities & NOMMU_MAP_DIRECT))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1002
  				return -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1003
  			/* we mustn't privatise shared mappings */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1004
  			capabilities &= ~NOMMU_MAP_COPY;
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1005
  		} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1006
1007
  			/* we're going to read the file into private memory we
  			 * allocate */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1008
  			if (!(capabilities & NOMMU_MAP_COPY))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1009
1010
1011
1012
1013
  				return -ENODEV;
  
  			/* we don't permit a private writable mapping to be
  			 * shared with the backing device */
  			if (prot & PROT_WRITE)
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1014
  				capabilities &= ~NOMMU_MAP_DIRECT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1015
  		}
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1016
1017
1018
1019
  		if (capabilities & NOMMU_MAP_DIRECT) {
  			if (((prot & PROT_READ)  && !(capabilities & NOMMU_MAP_READ))  ||
  			    ((prot & PROT_WRITE) && !(capabilities & NOMMU_MAP_WRITE)) ||
  			    ((prot & PROT_EXEC)  && !(capabilities & NOMMU_MAP_EXEC))
3c7b20454   Bernd Schmidt   nommu: allow priv...
1020
  			    ) {
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1021
  				capabilities &= ~NOMMU_MAP_DIRECT;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1022
1023
1024
1025
1026
1027
1028
1029
  				if (flags & MAP_SHARED) {
  					printk(KERN_WARNING
  					       "MAP_SHARED not completely supported on !MMU
  ");
  					return -EINVAL;
  				}
  			}
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1030
1031
  		/* handle executable mappings and implied executable
  		 * mappings */
e9536ae72   Josef Sipek   [PATCH] struct pa...
1032
  		if (file->f_path.mnt->mnt_flags & MNT_NOEXEC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1033
1034
  			if (prot & PROT_EXEC)
  				return -EPERM;
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1035
  		} else if ((prot & PROT_READ) && !(prot & PROT_EXEC)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1036
1037
  			/* handle implication of PROT_EXEC by PROT_READ */
  			if (current->personality & READ_IMPLIES_EXEC) {
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1038
  				if (capabilities & NOMMU_MAP_EXEC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1039
1040
  					prot |= PROT_EXEC;
  			}
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1041
  		} else if ((prot & PROT_READ) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1042
  			 (prot & PROT_EXEC) &&
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1043
  			 !(capabilities & NOMMU_MAP_EXEC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1044
1045
  			 ) {
  			/* backing file is not executable, try to copy */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1046
  			capabilities &= ~NOMMU_MAP_DIRECT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1047
  		}
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1048
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1049
1050
1051
  		/* anonymous mappings are always memory backed and can be
  		 * privately mapped
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1052
  		capabilities = NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1053
1054
1055
1056
1057
1058
1059
1060
  
  		/* handle PROT_EXEC implication by PROT_READ */
  		if ((prot & PROT_READ) &&
  		    (current->personality & READ_IMPLIES_EXEC))
  			prot |= PROT_EXEC;
  	}
  
  	/* allow the security API to have its say */
e5467859f   Al Viro   split ->file_mmap...
1061
1062
1063
  	ret = security_mmap_addr(addr);
  	if (ret < 0)
  		return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
  
  	/* looks okay */
  	*_capabilities = capabilities;
  	return 0;
  }
  
  /*
   * we've determined that we can make the mapping, now translate what we
   * now know into VMA flags
   */
  static unsigned long determine_vm_flags(struct file *file,
  					unsigned long prot,
  					unsigned long flags,
  					unsigned long capabilities)
  {
  	unsigned long vm_flags;
  
  	vm_flags = calc_vm_prot_bits(prot) | calc_vm_flag_bits(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1082
  	/* vm_flags |= mm->def_flags; */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1083
  	if (!(capabilities & NOMMU_MAP_DIRECT)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1084
  		/* attempt to share read-only copies of mapped file chunks */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1085
  		vm_flags |= VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1086
1087
  		if (file && !(prot & PROT_WRITE))
  			vm_flags |= VM_MAYSHARE;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1088
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1089
1090
1091
  		/* overlay a shareable mapping on the backing device or inode
  		 * if possible - used for chardevs, ramfs/tmpfs/shmfs and
  		 * romfs/cramfs */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1092
  		vm_flags |= VM_MAYSHARE | (capabilities & NOMMU_VMFLAGS);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1093
  		if (flags & MAP_SHARED)
3c7b20454   Bernd Schmidt   nommu: allow priv...
1094
  			vm_flags |= VM_SHARED;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1095
1096
1097
1098
1099
1100
  	}
  
  	/* refuse to let anyone share private mappings with this process if
  	 * it's being traced - otherwise breakpoints set in it may interfere
  	 * with another untraced process
  	 */
a288eecce   Tejun Heo   ptrace: kill triv...
1101
  	if ((flags & MAP_PRIVATE) && current->ptrace)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1102
1103
1104
1105
1106
1107
  		vm_flags &= ~VM_MAYSHARE;
  
  	return vm_flags;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1108
1109
   * set up a shared mapping on a file (the driver or filesystem provides and
   * pins the storage)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1110
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1111
  static int do_mmap_shared_file(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1112
1113
1114
1115
  {
  	int ret;
  
  	ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1116
1117
  	if (ret == 0) {
  		vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1118
  		return 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1119
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1120
1121
  	if (ret != -ENOSYS)
  		return ret;
3fa30460e   David Howells   nommu: fix an inc...
1122
1123
1124
  	/* getting -ENOSYS indicates that direct mmap isn't possible (as
  	 * opposed to tried but failed) so we can only give a suitable error as
  	 * it's not possible to make a private copy if MAP_SHARED was given */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1125
1126
1127
1128
1129
1130
  	return -ENODEV;
  }
  
  /*
   * set up a private mapping or an anonymous shared mapping
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1131
1132
  static int do_mmap_private(struct vm_area_struct *vma,
  			   struct vm_region *region,
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1133
1134
  			   unsigned long len,
  			   unsigned long capabilities)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1135
  {
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1136
  	unsigned long total, point;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1137
  	void *base;
8feae1311   David Howells   NOMMU: Make VMAs ...
1138
  	int ret, order;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1139
1140
1141
1142
1143
  
  	/* invoke the file's mapping function so that it can keep track of
  	 * shared mappings on devices or memory
  	 * - VM_MAYSHARE will be set if it may attempt to share
  	 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1144
  	if (capabilities & NOMMU_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1145
  		ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1146
  		if (ret == 0) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1147
  			/* shouldn't return success if we're not sharing */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1148
1149
  			BUG_ON(!(vma->vm_flags & VM_MAYSHARE));
  			vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1150
  			return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1151
  		}
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1152
1153
  		if (ret != -ENOSYS)
  			return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1154
1155
1156
1157
1158
  
  		/* getting an ENOSYS error indicates that direct mmap isn't
  		 * possible (as opposed to tried but failed) so we'll try to
  		 * make a private copy of the data and map that instead */
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1159

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1160
1161
1162
1163
  	/* allocate some memory to hold the mapping
  	 * - note that this may not return a page-aligned address if the object
  	 *   we're allocating is smaller than a page
  	 */
f67d9b157   Bob Liu   nommu: add page a...
1164
  	order = get_order(len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1165
  	kdebug("alloc order %d for %lx", order, len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1166
  	total = 1 << order;
f67d9b157   Bob Liu   nommu: add page a...
1167
  	point = len >> PAGE_SHIFT;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1168

dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1169
  	/* we don't want to allocate a power-of-2 sized page set */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1170
  	if (sysctl_nr_trim_pages && total - point >= sysctl_nr_trim_pages) {
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1171
1172
  		total = point;
  		kdebug("try to alloc exact %lu pages", total);
8feae1311   David Howells   NOMMU: Make VMAs ...
1173
  	}
da616534e   Joonsoo Kim   mm/nommu: fix mem...
1174
  	base = alloc_pages_exact(total << PAGE_SHIFT, GFP_KERNEL);
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1175
1176
1177
1178
  	if (!base)
  		goto enomem;
  
  	atomic_long_add(total, &mmap_pages_allocated);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1179

8feae1311   David Howells   NOMMU: Make VMAs ...
1180
1181
  	region->vm_flags = vma->vm_flags |= VM_MAPPED_COPY;
  	region->vm_start = (unsigned long) base;
f67d9b157   Bob Liu   nommu: add page a...
1182
  	region->vm_end   = region->vm_start + len;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1183
  	region->vm_top   = region->vm_start + (total << PAGE_SHIFT);
8feae1311   David Howells   NOMMU: Make VMAs ...
1184
1185
1186
  
  	vma->vm_start = region->vm_start;
  	vma->vm_end   = region->vm_start + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
  
  	if (vma->vm_file) {
  		/* read the contents of a file into the copy */
  		mm_segment_t old_fs;
  		loff_t fpos;
  
  		fpos = vma->vm_pgoff;
  		fpos <<= PAGE_SHIFT;
  
  		old_fs = get_fs();
  		set_fs(KERNEL_DS);
6e242a1ce   Al Viro   nommu: use __vfs_...
1198
  		ret = __vfs_read(vma->vm_file, base, len, &fpos);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1199
1200
1201
1202
1203
1204
  		set_fs(old_fs);
  
  		if (ret < 0)
  			goto error_free;
  
  		/* clear the last little bit */
f67d9b157   Bob Liu   nommu: add page a...
1205
1206
  		if (ret < len)
  			memset(base + ret, 0, len - ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1207

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1208
1209
1210
1211
1212
  	}
  
  	return 0;
  
  error_free:
7223bb4a8   Namhyung Kim   mm: nommu: fix a ...
1213
  	free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
1214
1215
  	region->vm_start = vma->vm_start = 0;
  	region->vm_end   = vma->vm_end = 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1216
  	region->vm_top   = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1217
1218
1219
  	return ret;
  
  enomem:
b1de0d139   Mitchel Humpherys   mm: convert some ...
1220
1221
  	pr_err("Allocation of length %lu from process %d (%s) failed
  ",
05ae6fa31   Greg Ungerer   uclinux: add proc...
1222
  	       len, current->pid, current->comm);
7bf02ea22   David Rientjes   arch, mm: filter ...
1223
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1224
1225
1226
1227
1228
1229
  	return -ENOMEM;
  }
  
  /*
   * handle mapping creation for uClinux
   */
e3fc629d7   Al Viro   switch aio and sh...
1230
  unsigned long do_mmap_pgoff(struct file *file,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1231
1232
1233
1234
  			    unsigned long addr,
  			    unsigned long len,
  			    unsigned long prot,
  			    unsigned long flags,
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1235
  			    unsigned long pgoff,
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1236
  			    unsigned long *populate)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1237
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1238
1239
  	struct vm_area_struct *vma;
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1240
  	struct rb_node *rb;
8feae1311   David Howells   NOMMU: Make VMAs ...
1241
  	unsigned long capabilities, vm_flags, result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1242
  	int ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1243
  	kenter(",%lx,%lx,%lx,%lx,%lx", addr, len, prot, flags, pgoff);
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1244
  	*populate = 0;
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1245

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1246
1247
1248
1249
  	/* decide whether we should attempt the mapping, and if so what sort of
  	 * mapping */
  	ret = validate_mmap_request(file, addr, len, prot, flags, pgoff,
  				    &capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1250
1251
  	if (ret < 0) {
  		kleave(" = %d [val]", ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1252
  		return ret;
8feae1311   David Howells   NOMMU: Make VMAs ...
1253
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1254

06aab5a30   David Howells   NOMMU: Ignore mma...
1255
1256
  	/* we ignore the address hint */
  	addr = 0;
f67d9b157   Bob Liu   nommu: add page a...
1257
  	len = PAGE_ALIGN(len);
06aab5a30   David Howells   NOMMU: Ignore mma...
1258

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1259
1260
1261
  	/* we've determined that we can make the mapping, now translate what we
  	 * now know into VMA flags */
  	vm_flags = determine_vm_flags(file, prot, flags, capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1262
1263
1264
1265
1266
1267
1268
1269
  	/* we're going to need to record the mapping */
  	region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		goto error_getting_region;
  
  	vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
  	if (!vma)
  		goto error_getting_vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1270

1e2ae599d   David Howells   nommu: struct vm_...
1271
  	region->vm_usage = 1;
8feae1311   David Howells   NOMMU: Make VMAs ...
1272
1273
  	region->vm_flags = vm_flags;
  	region->vm_pgoff = pgoff;
5beb49305   Rik van Riel   mm: change anon_v...
1274
  	INIT_LIST_HEAD(&vma->anon_vma_chain);
8feae1311   David Howells   NOMMU: Make VMAs ...
1275
1276
  	vma->vm_flags = vm_flags;
  	vma->vm_pgoff = pgoff;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1277

8feae1311   David Howells   NOMMU: Make VMAs ...
1278
  	if (file) {
cb0942b81   Al Viro   make get_file() r...
1279
1280
  		region->vm_file = get_file(file);
  		vma->vm_file = get_file(file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1281
1282
1283
1284
1285
  	}
  
  	down_write(&nommu_region_sem);
  
  	/* if we want to share, we need to check for regions created by other
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1286
  	 * mmap() calls that overlap with our proposed mapping
8feae1311   David Howells   NOMMU: Make VMAs ...
1287
  	 * - we can only share with a superset match on most regular files
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1288
1289
1290
1291
1292
1293
  	 * - shared mappings on character devices and memory backed files are
  	 *   permitted to overlap inexactly as far as we are concerned for in
  	 *   these cases, sharing is handled in the driver or filesystem rather
  	 *   than here
  	 */
  	if (vm_flags & VM_MAYSHARE) {
8feae1311   David Howells   NOMMU: Make VMAs ...
1294
1295
  		struct vm_region *pregion;
  		unsigned long pglen, rpglen, pgend, rpgend, start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1296

8feae1311   David Howells   NOMMU: Make VMAs ...
1297
1298
  		pglen = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
  		pgend = pgoff + pglen;
165b23927   David Howells   [PATCH] NOMMU: ma...
1299

8feae1311   David Howells   NOMMU: Make VMAs ...
1300
1301
  		for (rb = rb_first(&nommu_region_tree); rb; rb = rb_next(rb)) {
  			pregion = rb_entry(rb, struct vm_region, vm_rb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1302

8feae1311   David Howells   NOMMU: Make VMAs ...
1303
  			if (!(pregion->vm_flags & VM_MAYSHARE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1304
1305
1306
  				continue;
  
  			/* search for overlapping mappings on the same file */
496ad9aa8   Al Viro   new helper: file_...
1307
1308
  			if (file_inode(pregion->vm_file) !=
  			    file_inode(file))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1309
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1310
  			if (pregion->vm_pgoff >= pgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1311
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1312
1313
1314
1315
  			rpglen = pregion->vm_end - pregion->vm_start;
  			rpglen = (rpglen + PAGE_SIZE - 1) >> PAGE_SHIFT;
  			rpgend = pregion->vm_pgoff + rpglen;
  			if (pgoff >= rpgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1316
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1317
1318
1319
1320
1321
  			/* handle inexactly overlapping matches between
  			 * mappings */
  			if ((pregion->vm_pgoff != pgoff || rpglen != pglen) &&
  			    !(pgoff >= pregion->vm_pgoff && pgend <= rpgend)) {
  				/* new mapping is not a subset of the region */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1322
  				if (!(capabilities & NOMMU_MAP_DIRECT))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1323
1324
1325
  					goto sharing_violation;
  				continue;
  			}
8feae1311   David Howells   NOMMU: Make VMAs ...
1326
  			/* we've found a region we can share */
1e2ae599d   David Howells   nommu: struct vm_...
1327
  			pregion->vm_usage++;
8feae1311   David Howells   NOMMU: Make VMAs ...
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
  			vma->vm_region = pregion;
  			start = pregion->vm_start;
  			start += (pgoff - pregion->vm_pgoff) << PAGE_SHIFT;
  			vma->vm_start = start;
  			vma->vm_end = start + len;
  
  			if (pregion->vm_flags & VM_MAPPED_COPY) {
  				kdebug("share copy");
  				vma->vm_flags |= VM_MAPPED_COPY;
  			} else {
  				kdebug("share mmap");
  				ret = do_mmap_shared_file(vma);
  				if (ret < 0) {
  					vma->vm_region = NULL;
  					vma->vm_start = 0;
  					vma->vm_end = 0;
1e2ae599d   David Howells   nommu: struct vm_...
1344
  					pregion->vm_usage--;
8feae1311   David Howells   NOMMU: Make VMAs ...
1345
1346
1347
1348
1349
1350
1351
1352
1353
  					pregion = NULL;
  					goto error_just_free;
  				}
  			}
  			fput(region->vm_file);
  			kmem_cache_free(vm_region_jar, region);
  			region = pregion;
  			result = start;
  			goto share;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1354
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1355
1356
1357
1358
  		/* obtain the address at which to make a shared mapping
  		 * - this is the hook for quasi-memory character devices to
  		 *   tell us the location of a shared mapping
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1359
  		if (capabilities & NOMMU_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1360
1361
  			addr = file->f_op->get_unmapped_area(file, addr, len,
  							     pgoff, flags);
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1362
  			if (IS_ERR_VALUE(addr)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1363
  				ret = addr;
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1364
  				if (ret != -ENOSYS)
8feae1311   David Howells   NOMMU: Make VMAs ...
1365
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1366
1367
1368
1369
  
  				/* the driver refused to tell us where to site
  				 * the mapping so we'll have to attempt to copy
  				 * it */
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1370
  				ret = -ENODEV;
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1371
  				if (!(capabilities & NOMMU_MAP_COPY))
8feae1311   David Howells   NOMMU: Make VMAs ...
1372
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1373

b4caecd48   Christoph Hellwig   fs: introduce f_o...
1374
  				capabilities &= ~NOMMU_MAP_DIRECT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1375
1376
1377
  			} else {
  				vma->vm_start = region->vm_start = addr;
  				vma->vm_end = region->vm_end = addr + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1378
1379
1380
  			}
  		}
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1381
  	vma->vm_region = region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1382

645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1383
  	/* set up the mapping
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1384
  	 * - the region is filled in if NOMMU_MAP_DIRECT is still set
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1385
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1386
  	if (file && vma->vm_flags & VM_SHARED)
8feae1311   David Howells   NOMMU: Make VMAs ...
1387
  		ret = do_mmap_shared_file(vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1388
  	else
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1389
  		ret = do_mmap_private(vma, region, len, capabilities);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1390
  	if (ret < 0)
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1391
1392
  		goto error_just_free;
  	add_nommu_region(region);
8feae1311   David Howells   NOMMU: Make VMAs ...
1393

ea6376395   Jie Zhang   nommu: fix malloc...
1394
1395
1396
1397
  	/* clear anonymous mappings that don't ask for uninitialized data */
  	if (!vma->vm_file && !(flags & MAP_UNINITIALIZED))
  		memset((void *)region->vm_start, 0,
  		       region->vm_end - region->vm_start);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1398
  	/* okay... we have a mapping; now we have to register it */
8feae1311   David Howells   NOMMU: Make VMAs ...
1399
  	result = vma->vm_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1400

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1401
  	current->mm->total_vm += len >> PAGE_SHIFT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1402
1403
  share:
  	add_vma_to_mm(current->mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1404

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1405
1406
1407
1408
1409
1410
  	/* we flush the region from the icache only when the first executable
  	 * mapping of it is made  */
  	if (vma->vm_flags & VM_EXEC && !region->vm_icache_flushed) {
  		flush_icache_range(region->vm_start, region->vm_end);
  		region->vm_icache_flushed = true;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1411

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1412
  	up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1413

8feae1311   David Howells   NOMMU: Make VMAs ...
1414
1415
  	kleave(" = %lx", result);
  	return result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1416

8feae1311   David Howells   NOMMU: Make VMAs ...
1417
1418
1419
  error_just_free:
  	up_write(&nommu_region_sem);
  error:
89a864027   David Howells   NOMMU: Don't pass...
1420
1421
  	if (region->vm_file)
  		fput(region->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1422
  	kmem_cache_free(vm_region_jar, region);
89a864027   David Howells   NOMMU: Don't pass...
1423
1424
  	if (vma->vm_file)
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
  	kmem_cache_free(vm_area_cachep, vma);
  	kleave(" = %d", ret);
  	return ret;
  
  sharing_violation:
  	up_write(&nommu_region_sem);
  	printk(KERN_WARNING "Attempt to share mismatched mappings
  ");
  	ret = -EINVAL;
  	goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1435

8feae1311   David Howells   NOMMU: Make VMAs ...
1436
1437
1438
1439
1440
  error_getting_vma:
  	kmem_cache_free(vm_region_jar, region);
  	printk(KERN_WARNING "Allocation of vma for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1441
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1442
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1443
  	return -ENOMEM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1444
1445
1446
1447
  error_getting_region:
  	printk(KERN_WARNING "Allocation of vm region for %lu byte allocation"
  	       " from process %d failed
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1448
  	       len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1449
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1450
1451
  	return -ENOMEM;
  }
6be5ceb02   Linus Torvalds   VM: add "vm_mmap(...
1452

66f0dc481   Hugh Dickins   mm: move sys_mmap...
1453
1454
1455
1456
1457
1458
  /*
   * mmap_pgoff syscall: resolve the descriptor for a file-backed request and
   * hand the mapping over to vm_mmap_pgoff().
   * - returns whatever vm_mmap_pgoff() returns, or -EBADF if a file was
   *   required (MAP_ANONYMOUS not set) and fd could not be looked up
   */
  SYSCALL_DEFINE6(mmap_pgoff, unsigned long, addr, unsigned long, len,
  		unsigned long, prot, unsigned long, flags,
  		unsigned long, fd, unsigned long, pgoff)
  {
  	struct file *filp = NULL;
  	unsigned long ret;
  
  	audit_mmap_fd(fd, flags);
  
  	/* only non-anonymous requests take a reference on the file */
  	if (!(flags & MAP_ANONYMOUS)) {
  		filp = fget(fd);
  		if (!filp)
  			return -EBADF;
  	}
  
  	/* these two flags are masked off before the request is passed on */
  	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);
  	ret = vm_mmap_pgoff(filp, addr, len, prot, flags, pgoff);
  
  	/* drop the reference taken by fget() above */
  	if (filp)
  		fput(filp);
  	return ret;
  }
a4679373c   Christoph Hellwig   Add generic sys_o...
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
1484
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
  #ifdef __ARCH_WANT_SYS_OLD_MMAP
  /* argument block that the old_mmap syscall copies in from userspace */
  struct mmap_arg_struct {
  	unsigned long addr;
  	unsigned long len;
  	unsigned long prot;
  	unsigned long flags;
  	unsigned long fd;
  	unsigned long offset;
  };
  
  /*
   * old_mmap syscall: the arguments arrive packed in a user-space structure
   * and the file offset is given in bytes rather than pages
   * - returns -EFAULT if the structure cannot be copied in
   * - returns -EINVAL if the byte offset is not page aligned
   * - otherwise returns the result of sys_mmap_pgoff()
   */
  SYSCALL_DEFINE1(old_mmap, struct mmap_arg_struct __user *, arg)
  {
  	struct mmap_arg_struct args;
  	unsigned long pgoff;
  
  	if (copy_from_user(&args, arg, sizeof(args)) != 0)
  		return -EFAULT;
  
  	/* a byte offset with bits below the page size cannot be converted */
  	if ((args.offset & ~PAGE_MASK) != 0)
  		return -EINVAL;
  
  	pgoff = args.offset >> PAGE_SHIFT;
  	return sys_mmap_pgoff(args.addr, args.len, args.prot, args.flags,
  			      args.fd, pgoff);
  }
  #endif /* __ARCH_WANT_SYS_OLD_MMAP */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1497
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1498
1499
   * split a vma into two pieces at address 'addr', a new vma is allocated either
   * for the first part or the tail.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1500
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1501
1502
  int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
  	      unsigned long addr, int new_below)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1503
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1504
1505
1506
  	struct vm_area_struct *new;
  	struct vm_region *region;
  	unsigned long npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1507

8feae1311   David Howells   NOMMU: Make VMAs ...
1508
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1509

779c10232   David Howells   nommu: remove a s...
1510
1511
1512
  	/* we're only permitted to split anonymous regions (these should have
  	 * only a single usage on the region) */
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
1513
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1514

8feae1311   David Howells   NOMMU: Make VMAs ...
1515
1516
  	if (mm->map_count >= sysctl_max_map_count)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1517

8feae1311   David Howells   NOMMU: Make VMAs ...
1518
1519
1520
  	region = kmem_cache_alloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1521

8feae1311   David Howells   NOMMU: Make VMAs ...
1522
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
1535
  	new = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
  	if (!new) {
  		kmem_cache_free(vm_region_jar, region);
  		return -ENOMEM;
  	}
  
  	/* most fields are the same, copy all, and then fixup */
  	*new = *vma;
  	*region = *vma->vm_region;
  	new->vm_region = region;
  
  	npages = (addr - vma->vm_start) >> PAGE_SHIFT;
  
  	if (new_below) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1536
  		region->vm_top = region->vm_end = new->vm_end = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1537
1538
1539
  	} else {
  		region->vm_start = new->vm_start = addr;
  		region->vm_pgoff = new->vm_pgoff += npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1540
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
  
  	if (new->vm_ops && new->vm_ops->open)
  		new->vm_ops->open(new);
  
  	delete_vma_from_mm(vma);
  	down_write(&nommu_region_sem);
  	delete_nommu_region(vma->vm_region);
  	if (new_below) {
  		vma->vm_region->vm_start = vma->vm_start = addr;
  		vma->vm_region->vm_pgoff = vma->vm_pgoff += npages;
  	} else {
  		vma->vm_region->vm_end = vma->vm_end = addr;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1553
  		vma->vm_region->vm_top = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1554
1555
1556
1557
1558
1559
1560
  	}
  	add_nommu_region(vma->vm_region);
  	add_nommu_region(new->vm_region);
  	up_write(&nommu_region_sem);
  	add_vma_to_mm(mm, vma);
  	add_vma_to_mm(mm, new);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1561
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1562
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1563
1564
   * shrink a VMA by removing the specified chunk from either the beginning or
   * the end
3034097a5   David Howells   [PATCH] NOMMU: Or...
1565
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1566
1567
1568
  static int shrink_vma(struct mm_struct *mm,
  		      struct vm_area_struct *vma,
  		      unsigned long from, unsigned long to)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1569
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1570
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1571

8feae1311   David Howells   NOMMU: Make VMAs ...
1572
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1573

8feae1311   David Howells   NOMMU: Make VMAs ...
1574
1575
1576
1577
1578
1579
1580
1581
  	/* adjust the VMA's pointers, which may reposition it in the MM's tree
  	 * and list */
  	delete_vma_from_mm(vma);
  	if (from > vma->vm_start)
  		vma->vm_end = from;
  	else
  		vma->vm_start = to;
  	add_vma_to_mm(mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1582

8feae1311   David Howells   NOMMU: Make VMAs ...
1583
1584
  	/* cut the backing region down to size */
  	region = vma->vm_region;
1e2ae599d   David Howells   nommu: struct vm_...
1585
  	BUG_ON(region->vm_usage != 1);
8feae1311   David Howells   NOMMU: Make VMAs ...
1586
1587
1588
  
  	down_write(&nommu_region_sem);
  	delete_nommu_region(region);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1589
1590
1591
1592
  	if (from > region->vm_start) {
  		to = region->vm_top;
  		region->vm_top = region->vm_end = from;
  	} else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1593
  		region->vm_start = to;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1594
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1595
1596
1597
1598
1599
1600
  	add_nommu_region(region);
  	up_write(&nommu_region_sem);
  
  	free_page_series(from, to);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1601

8feae1311   David Howells   NOMMU: Make VMAs ...
1602
1603
1604
1605
1606
1607
1608
1609
  /*
   * release a mapping
   * - under NOMMU conditions the chunk to be unmapped must be backed by a single
   *   VMA, though it need not cover the whole VMA
   * - len is rounded up to a whole number of pages
   * - file-backed VMAs can only be released whole; anonymous VMAs may be
   *   trimmed or split
   * - vm_munmap() calls this with mm->mmap_sem held for writing
   * - returns 0 on success, -EINVAL for an empty, wrapping, unmapped or
   *   unacceptable range, or the error from split_vma()
   */
  int do_munmap(struct mm_struct *mm, unsigned long start, size_t len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end;
  	int ret;
  
  	kenter(",%lx,%zx", start, len);
  
  	len = PAGE_ALIGN(len);
  	if (len == 0)
  		return -EINVAL;
  
  	end = start + len;
  
  	/* a range that wraps the address space yields end < start; such a
  	 * value would slip past the subset checks below and be handed to
  	 * shrink_vma() as the new start of the VMA */
  	if (end < start) {
  		kleave(" = -EINVAL [wrap]");
  		return -EINVAL;
  	}
  
  	/* find the first potentially overlapping VMA */
  	vma = find_vma(mm, start);
  	if (!vma) {
  		/* only the first few failures are logged */
  		static int limit;
  		if (limit < 5) {
  			printk(KERN_WARNING
  			       "munmap of memory not mmapped by process %d"
  			       " (%s): 0x%lx-0x%lx\n",
  			       current->pid, current->comm,
  			       start, start + len - 1);
  			limit++;
  		}
  		return -EINVAL;
  	}
  
  	/* we're allowed to split an anonymous VMA but not a file-backed one */
  	if (vma->vm_file) {
  		/* walk forward looking for a VMA that ends exactly at 'end' */
  		do {
  			if (start > vma->vm_start) {
  				kleave(" = -EINVAL [miss]");
  				return -EINVAL;
  			}
  			if (end == vma->vm_end)
  				goto erase_whole_vma;
  			vma = vma->vm_next;
  		} while (vma);
  		kleave(" = -EINVAL [split file]");
  		return -EINVAL;
  	} else {
  		/* the chunk must be a subset of the VMA found */
  		if (start == vma->vm_start && end == vma->vm_end)
  			goto erase_whole_vma;
  		if (start < vma->vm_start || end > vma->vm_end) {
  			kleave(" = -EINVAL [superset]");
  			return -EINVAL;
  		}
  		if (start & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned start]");
  			return -EINVAL;
  		}
  		if (end != vma->vm_end && end & ~PAGE_MASK) {
  			kleave(" = -EINVAL [unaligned split]");
  			return -EINVAL;
  		}
  		/* a hole in the middle: split off the part below 'start'
  		 * first so that the remainder can be trimmed from its front */
  		if (start != vma->vm_start && end != vma->vm_end) {
  			ret = split_vma(mm, vma, start, 1);
  			if (ret < 0) {
  				kleave(" = %d [split]", ret);
  				return ret;
  			}
  		}
  		return shrink_vma(mm, vma, start, end);
  	}
  
  erase_whole_vma:
  	delete_vma_from_mm(vma);
  	delete_vma(mm, vma);
  	kleave(" = 0");
  	return 0;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1681
  EXPORT_SYMBOL(do_munmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1682

bfce281c2   Al Viro   kill mm argument ...
1683
  /*
   * vm_munmap: unmap [addr, addr + len) from the current process, taking the
   * mm's mmap_sem for writing around the call to do_munmap()
   * - returns the result of do_munmap()
   */
  int vm_munmap(unsigned long addr, size_t len)
  {
  	struct mm_struct *cur_mm = current->mm;
  	int err;
  
  	down_write(&cur_mm->mmap_sem);
  	err = do_munmap(cur_mm, addr, len);
  	up_write(&cur_mm->mmap_sem);
  
  	return err;
  }
a46ef99d8   Linus Torvalds   VM: add "vm_munma...
1693
1694
1695
1696
  EXPORT_SYMBOL(vm_munmap);
  
  /*
   * munmap syscall: thin entry point that forwards to vm_munmap() and returns
   * its result
   */
  SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
  {
  	int err = vm_munmap(addr, len);
  
  	return err;
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1699
1700
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1701
   * release all the mappings made in a process's VM space
3034097a5   David Howells   [PATCH] NOMMU: Or...
1702
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1703
  void exit_mmap(struct mm_struct *mm)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1704
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1705
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1706

8feae1311   David Howells   NOMMU: Make VMAs ...
1707
1708
  	if (!mm)
  		return;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1709

8feae1311   David Howells   NOMMU: Make VMAs ...
1710
  	kenter("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1711

8feae1311   David Howells   NOMMU: Make VMAs ...
1712
  	mm->total_vm = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1713

8feae1311   David Howells   NOMMU: Make VMAs ...
1714
1715
1716
1717
  	while ((vma = mm->mmap)) {
  		mm->mmap = vma->vm_next;
  		delete_vma_from_mm(vma);
  		delete_vma(mm, vma);
04c349615   Steven J. Magnani   nommu: yield CPU ...
1718
  		cond_resched();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1719
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1720
1721
  
  	kleave("");
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1722
  }
e4eb1ff61   Linus Torvalds   VM: add "vm_brk()...
1723
  /*
   * vm_brk: stub that ignores both arguments and always reports failure by
   * returning -ENOMEM (converted to unsigned long)
   */
  unsigned long vm_brk(unsigned long addr, unsigned long len)
  {
  	return (unsigned long) -ENOMEM;
  }
  
  /*
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1729
1730
   * expand (or shrink) an existing mapping, potentially moving it at the same
   * time (controlled by the MREMAP_MAYMOVE flag and available VM space)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1731
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1732
   * under NOMMU conditions, we only permit changing a mapping's size, and only
8feae1311   David Howells   NOMMU: Make VMAs ...
1733
1734
   * as long as it stays within the region allocated by do_mmap_private() and the
   * block is not shareable
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1735
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1736
   * MREMAP_FIXED is not supported under NOMMU conditions
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1737
   */
4b377bab2   Al Viro   make do_mremap() ...
1738
  static unsigned long do_mremap(unsigned long addr,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1739
1740
1741
  			unsigned long old_len, unsigned long new_len,
  			unsigned long flags, unsigned long new_addr)
  {
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1742
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1743
1744
  
  	/* insanity checks first */
f67d9b157   Bob Liu   nommu: add page a...
1745
1746
  	old_len = PAGE_ALIGN(old_len);
  	new_len = PAGE_ALIGN(new_len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1747
  	if (old_len == 0 || new_len == 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1748
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1749
1750
  	if (addr & ~PAGE_MASK)
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1751
1752
  	if (flags & MREMAP_FIXED && new_addr != addr)
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1753
  	vma = find_vma_exact(current->mm, addr, old_len);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1754
1755
  	if (!vma)
  		return (unsigned long) -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1756

6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1757
  	if (vma->vm_end != vma->vm_start + old_len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1758
  		return (unsigned long) -EFAULT;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1759
  	if (vma->vm_flags & VM_MAYSHARE)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1760
  		return (unsigned long) -EPERM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1761
  	if (new_len > vma->vm_region->vm_end - vma->vm_region->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1762
1763
1764
  		return (unsigned long) -ENOMEM;
  
  	/* all checks complete - do it */
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1765
  	vma->vm_end = vma->vm_start + new_len;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1766
1767
  	return vma->vm_start;
  }
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1768
1769
1770
  /*
   * mremap syscall: run do_mremap() with the current mm's mmap_sem held for
   * writing and return its result
   */
  SYSCALL_DEFINE5(mremap, unsigned long, addr, unsigned long, old_len,
  		unsigned long, new_len, unsigned long, flags,
  		unsigned long, new_addr)
  {
  	struct mm_struct *cur_mm = current->mm;
  	unsigned long result;
  
  	down_write(&cur_mm->mmap_sem);
  	result = do_mremap(addr, old_len, new_len, flags, new_addr);
  	up_write(&cur_mm->mmap_sem);
  
  	return result;
  }
240aadeed   Michel Lespinasse   mm: accelerate mm...
1779
1780
1781
  struct page *follow_page_mask(struct vm_area_struct *vma,
  			      unsigned long address, unsigned int flags,
  			      unsigned int *page_mask)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1782
  {
240aadeed   Michel Lespinasse   mm: accelerate mm...
1783
  	*page_mask = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1784
1785
  	return NULL;
  }
8f3b1327a   Bob Liu   mm/nommu.c: fix r...
1786
1787
  /*
   * remap_pfn_range: no remapping is performed here; the request is accepted
   * only if addr already equals the address of the given page frame
   * - on success the VMA is flagged VM_IO | VM_PFNMAP | VM_DONTEXPAND |
   *   VM_DONTDUMP and 0 is returned
   * - returns -EINVAL if addr != pfn << PAGE_SHIFT
   * - size and prot are not used
   */
  int remap_pfn_range(struct vm_area_struct *vma, unsigned long addr,
  		unsigned long pfn, unsigned long size, pgprot_t prot)
  {
  	unsigned long frame_addr = pfn << PAGE_SHIFT;
  
  	if (frame_addr != addr)
  		return -EINVAL;
  
  	vma->vm_flags |= VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_DONTDUMP;
  	return 0;
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1794
  EXPORT_SYMBOL(remap_pfn_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1795

3c0b9de6d   Linus Torvalds   vm: add no-mmu vm...
1796
1797
1798
1799
1800
1801
1802
1803
1804
  /*
   * vm_iomap_memory: map the whole of a VMA onto the physical range beginning
   * at 'start', offset by the VMA's vm_pgoff pages
   * - the span mapped is the VMA's own length; 'len' is not consulted
   * - returns the result of io_remap_pfn_range()
   */
  int vm_iomap_memory(struct vm_area_struct *vma, phys_addr_t start, unsigned long len)
  {
  	unsigned long span = vma->vm_end - vma->vm_start;
  	unsigned long first_pfn;
  
  	/* page frame of 'start', advanced by the VMA's page offset */
  	first_pfn = (unsigned long)(start >> PAGE_SHIFT) + vma->vm_pgoff;
  
  	return io_remap_pfn_range(vma, vma->vm_start, first_pfn, span, vma->vm_page_prot);
  }
  EXPORT_SYMBOL(vm_iomap_memory);
f905bc447   Paul Mundt   nommu: add new vm...
1805
1806
1807
1808
1809
1810
1811
1812
1813
1814
1815
1816
1817
1818
  /*
   * remap_vmalloc_range: point a VMA directly at a buffer
   * - the VMA keeps its length but is relocated to start at
   *   addr + (pgoff << PAGE_SHIFT)
   * - returns 0 on success, or -EINVAL if the VMA lacks VM_USERMAP
   */
  int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
  			unsigned long pgoff)
  {
  	/* vm_start/vm_end are unsigned long; keep the length at full width
  	 * so that it is not truncated where int is narrower than long */
  	unsigned long size = vma->vm_end - vma->vm_start;
  
  	if (!(vma->vm_flags & VM_USERMAP))
  		return -EINVAL;
  
  	vma->vm_start = (unsigned long)addr + (pgoff << PAGE_SHIFT);
  	vma->vm_end = vma->vm_start + size;
  
  	return 0;
  }
  EXPORT_SYMBOL(remap_vmalloc_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1819
1820
1821
1822
1823
  /*
   * arch_get_unmapped_area: stub that ignores all of its arguments and always
   * returns -ENOMEM (converted to unsigned long)
   */
  unsigned long arch_get_unmapped_area(struct file *file, unsigned long addr,
  	unsigned long len, unsigned long pgoff, unsigned long flags)
  {
  	return (unsigned long) -ENOMEM;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1824
1825
1826
1827
1828
  /*
   * unmap_mapping_range: empty stub - the body performs no work and every
   * argument is ignored
   */
  void unmap_mapping_range(struct address_space *mapping,
  			 loff_t const holebegin, loff_t const holelen,
  			 int even_cows)
  {
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1829
  EXPORT_SYMBOL(unmap_mapping_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1830
1831
1832
1833
1834
1835
1836
1837
1838
1839
1840
1841
1842
1843
1844
1845
1846
  
  /*
   * Check that a process has enough memory to allocate a new virtual
   * mapping. 0 means there is enough memory for the allocation to
   * succeed and -ENOMEM implies there is not.
   *
   * We currently support three overcommit policies, which are set via the
   * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting
   *
   * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
   * Additional code 2002 Jul 20 by Robert Love.
   *
   * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
   *
   * Note this is a helper function intended to be used by LSMs which
   * wish to use this logic.
   */
34b4e4aa3   Alan Cox   fix NULL pointer ...
1847
  int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1848
  {
8138a67a5   Roman Gushchin   mm/nommu.c: fix a...
1849
  	long free, allowed, reserve;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1850
1851
1852
1853
1854
1855
1856
1857
1858
1859
  
  	vm_acct_memory(pages);
  
  	/*
  	 * Sometimes we want to use more memory than we have
  	 */
  	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
  		return 0;
  
  	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
c15bef309   Dmitry Fink   mmap: fix and tid...
1860
1861
1862
1863
1864
1865
1866
1867
1868
1869
  		free = global_page_state(NR_FREE_PAGES);
  		free += global_page_state(NR_FILE_PAGES);
  
  		/*
  		 * shmem pages shouldn't be counted as free in this
  		 * case, they can't be purged, only swapped out, and
  		 * that won't affect the overall amount of available
  		 * memory in the system.
  		 */
  		free -= global_page_state(NR_SHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1870

ec8acf20a   Shaohua Li   swap: add per-par...
1871
  		free += get_nr_swap_pages();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1872
1873
1874
1875
1876
1877
1878
  
  		/*
  		 * Any slabs which are created with the
  		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
  		 * which are reclaimable, under pressure.  The dentry
  		 * cache and most inode caches should fall into this
  		 */
972d1a7b1   Christoph Lameter   [PATCH] ZVC: Supp...
1879
  		free += global_page_state(NR_SLAB_RECLAIMABLE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1880
1881
  
  		/*
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1882
1883
  		 * Leave reserved pages. The pages are not for anonymous pages.
  		 */
c15bef309   Dmitry Fink   mmap: fix and tid...
1884
  		if (free <= totalreserve_pages)
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1885
1886
  			goto error;
  		else
c15bef309   Dmitry Fink   mmap: fix and tid...
1887
  			free -= totalreserve_pages;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1888
1889
  
  		/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1890
  		 * Reserve some for root
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1891
  		 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1892
  		if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1893
  			free -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1894
1895
1896
  
  		if (free > pages)
  			return 0;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1897
1898
  
  		goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1899
  	}
00619bcc4   Jerome Marchand   mm: factor commit...
1900
  	allowed = vm_commit_limit();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1901
  	/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1902
  	 * Reserve some 3% for root
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1903
1904
  	 */
  	if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1905
  		allowed -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1906

c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1907
1908
1909
1910
1911
  	/*
  	 * Don't let a single process grow so big a user can't recover
  	 */
  	if (mm) {
  		reserve = sysctl_user_reserve_kbytes >> (PAGE_SHIFT - 10);
8138a67a5   Roman Gushchin   mm/nommu.c: fix a...
1912
  		allowed -= min_t(long, mm->total_vm / 32, reserve);
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1913
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1914

00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1915
  	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1916
  		return 0;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1917

d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1918
  error:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1919
1920
1921
1922
  	vm_unacct_memory(pages);
  
  	return -ENOMEM;
  }
d0217ac04   Nick Piggin   mm: fault feedbac...
1923
  /*
   * filemap_fault - stand-in for the page cache fault handler.
   *
   * The body is an unconditional BUG(), so reaching this function is treated
   * as a kernel bug.  The trailing "return 0" only satisfies the int return
   * type.  Neither @vma nor @vmf is examined.
   */
  int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
b0e15190e   David Howells   [PATCH] NOMMU: Ma...
1924
1925
  {
  	BUG();
d0217ac04   Nick Piggin   mm: fault feedbac...
1926
  	return 0;
b0e15190e   David Howells   [PATCH] NOMMU: Ma...
1927
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1928
  EXPORT_SYMBOL(filemap_fault);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1929

f1820361f   Kirill A. Shutemov   mm: implement ->m...
1930
1931
1932
1933
1934
  /*
   * filemap_map_pages - stand-in for the page cache ->map_pages handler.
   *
   * The body is an unconditional BUG(), so reaching this function is treated
   * as a kernel bug.  Neither @vma nor @vmf is examined.
   */
  void filemap_map_pages(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();
  }
  EXPORT_SYMBOL(filemap_map_pages);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1935
1936
  static int __access_remote_vm(struct task_struct *tsk, struct mm_struct *mm,
  		unsigned long addr, void *buf, int len, int write)
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1937
  {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1938
  	struct vm_area_struct *vma;
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1939
1940
1941
1942
  
  	down_read(&mm->mmap_sem);
  
  	/* the access must start within one of the target process's mappings */
0159b141d   David Howells   [PATCH] NOMMU: Us...
1943
1944
  	vma = find_vma(mm, addr);
  	if (vma) {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1945
1946
1947
1948
1949
  		/* don't overrun this mapping */
  		if (addr + len >= vma->vm_end)
  			len = vma->vm_end - addr;
  
  		/* only read or write mappings where it is permitted */
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1950
  		if (write && vma->vm_flags & VM_MAYWRITE)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1951
1952
  			copy_to_user_page(vma, NULL, addr,
  					 (void *) addr, buf, len);
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1953
  		else if (!write && vma->vm_flags & VM_MAYREAD)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1954
1955
  			copy_from_user_page(vma, NULL, addr,
  					    buf, (void *) addr, len);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1956
1957
1958
1959
1960
1961
1962
  		else
  			len = 0;
  	} else {
  		len = 0;
  	}
  
  	up_read(&mm->mmap_sem);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1963
1964
1965
1966
1967
1968
1969
1970
1971
1972
1973
1974
1975
1976
1977
1978
1979
1980
1981
1982
1983
1984
1985
1986
1987
1988
1989
1990
1991
1992
1993
1994
1995
1996
1997
1998
  
  	return len;
  }
  
  /**
   * access_remote_vm - access another process' address space
   * @mm:		the mm_struct of the target address space
   * @addr:	start address to access
   * @buf:	source or destination buffer
   * @len:	number of bytes to transfer
   * @write:	whether the access is a write
   *
   * The caller must hold a reference on @mm.
   *
   * Thin wrapper around __access_remote_vm() that passes NULL as the task.
   *
   * Return: whatever __access_remote_vm() returns, i.e. the number of bytes
   * transferred (possibly fewer than @len), or 0 if nothing was transferred.
   */
  int access_remote_vm(struct mm_struct *mm, unsigned long addr,
  		void *buf, int len, int write)
  {
  	return __access_remote_vm(NULL, mm, addr, buf, len, write);
  }
  
  /*
   * Access the address space of the task @tsk.
   * - @buf, the source/target buffer, must be in kernel space
   * - returns the number of bytes transferred; 0 if the range wraps around
   *   the address space or the task has no mm
   */
  int access_process_vm(struct task_struct *tsk, unsigned long addr, void *buf, int len, int write)
  {
  	struct mm_struct *mm;
  	int copied;
  
  	/* refuse a range whose end wraps past the top of the address space */
  	if (addr + len < addr)
  		return 0;
  
  	/* pin the task's mm for the duration of the transfer */
  	mm = get_task_mm(tsk);
  	if (!mm)
  		return 0;
  
  	copied = __access_remote_vm(tsk, mm, addr, buf, len, write);
  
  	mmput(mm);
  	return copied;
  }
7e6608724   David Howells   nommu: fix shared...
2002
2003
2004
2005
2006
2007
2008
2009
2010
2011
2012
2013
2014
2015
2016
2017
  
  /**
   * nommu_shrink_inode_mappings - Shrink the shared mappings on an inode
   * @inode: The inode to check
   * @size: The current filesize of the inode
   * @newsize: The proposed filesize of the inode
   *
   * Called on behalf of a shrinking truncate.  Fails if any shared VMA still
   * maps pages in the range being cut off; otherwise trims every shared
   * vm_region that extends beyond @newsize so that do_mmap_pgoff() doesn't
   * automatically grant mappings that are too large.
   *
   * Takes nommu_region_sem for writing and the inode's i_mmap lock for
   * reading while it works.
   *
   * Return: 0 on success, -ETXTBSY if a shared mapping overlaps the range
   * being removed.
   */
  int nommu_shrink_inode_mappings(struct inode *inode, size_t size,
  				size_t newsize)
  {
  	struct vm_area_struct *vma;
  	struct vm_region *region;
  	pgoff_t low = newsize >> PAGE_SHIFT;
  	pgoff_t high = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
  	size_t r_top;
  	int ret = 0;
  
  	down_write(&nommu_region_sem);
  	i_mmap_lock_read(inode->i_mapping);
  
  	/* a shared (page cache backed) VMA inside the dead zone blocks the
  	 * truncate; -ETXTBSY is not quite true, but near enough */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap, low, high) {
  		if (vma->vm_flags & VM_SHARED) {
  			ret = -ETXTBSY;
  			goto unlock;
  		}
  	}
  
  	/* trim any shared region that reaches into the dead zone - such a
  	 * region can only be referenced by VMAs that stop short of it
  	 *
  	 * regions starting beyond the EOF are not looked for, as there
  	 * shouldn't be any
  	 */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap, 0, ULONG_MAX) {
  		if (vma->vm_flags & VM_SHARED) {
  			region = vma->vm_region;
  
  			/* file offset just past the end of the region */
  			r_top = (region->vm_pgoff << PAGE_SHIFT) +
  				(region->vm_top - region->vm_start);
  
  			if (r_top > newsize) {
  				region->vm_top -= r_top - newsize;
  				if (region->vm_end > region->vm_top)
  					region->vm_end = region->vm_top;
  			}
  		}
  	}
  
  unlock:
  	i_mmap_unlock_read(inode->i_mapping);
  	up_write(&nommu_region_sem);
  	return ret;
  }
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
2063
2064
2065
2066
2067
2068
2069
2070
2071
2072
2073
2074
2075
2076
2077
2078
2079
2080
2081
2082
2083
  
  /*
   * Set the boot-time default for sysctl_user_reserve_kbytes.
   *
   * The reserve exists so that a user who starts a single memory hogging
   * process can still recover (kill the hog) in OVERCOMMIT_NEVER mode.
   *
   * Default: min(1/32, i.e. about 3%, of free memory, 128MB).  128MB is
   * enough to recover with sshd/login, bash, and top/kill.
   */
  static int __meminit init_user_reserve(void)
  {
  	/* free pages converted to kbytes */
  	unsigned long avail_kb =
  		global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  
  	/* 1UL << 17 kbytes == 128MB */
  	sysctl_user_reserve_kbytes = min(avail_kb / 32, 1UL << 17);
  	return 0;
  }
  module_init(init_user_reserve)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
2084
2085
2086
2087
2088
2089
2090
2091
2092
2093
2094
2095
2096
2097
2098
2099
2100
2101
2102
2103
2104
  
  /*
   * Set the boot-time default for sysctl_admin_reserve_kbytes.
   *
   * The reserve exists so that the sys admin can still log in and kill a
   * memory hogging process.
   *
   * Default: min(1/32, i.e. about 3%, of free memory, 8MB).  Systems with
   * more than 256MB free therefore reserve 8MB, enough to recover with sshd,
   * bash, and top in OVERCOMMIT_GUESS; smaller systems reserve about 3% of
   * their free pages.
   */
  static int __meminit init_admin_reserve(void)
  {
  	/* free pages converted to kbytes */
  	unsigned long avail_kb =
  		global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  
  	/* 1UL << 13 kbytes == 8MB */
  	sysctl_admin_reserve_kbytes = min(avail_kb / 32, 1UL << 13);
  	return 0;
  }
  module_init(init_admin_reserve)