Blame view

mm/nommu.c 52 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
  /*
   *  linux/mm/nommu.c
   *
   *  Replacement code for mm functions to support CPU's that don't
   *  have any form of memory management unit (thus no virtual memory).
   *
   *  See Documentation/nommu-mmap.txt
   *
8feae1311   David Howells   NOMMU: Make VMAs ...
9
   *  Copyright (c) 2004-2008 David Howells <dhowells@redhat.com>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
12
   *  Copyright (c) 2000-2003 David McCullough <davidm@snapgear.com>
   *  Copyright (c) 2000-2001 D Jeff Dionne <jeff@uClinux.org>
   *  Copyright (c) 2002      Greg Ungerer <gerg@snapgear.com>
29c185e5c   Paul Mundt   nommu: Provide st...
13
   *  Copyright (c) 2007-2010 Paul Mundt <lethal@linux-sh.org>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
14
   */
b1de0d139   Mitchel Humpherys   mm: convert some ...
15
  #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
b95f1b31b   Paul Gortmaker   mm: Map most file...
16
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
17
  #include <linux/mm.h>
615d6e875   Davidlohr Bueso   mm: per-thread vm...
18
  #include <linux/vmacache.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
22
23
24
25
  #include <linux/mman.h>
  #include <linux/swap.h>
  #include <linux/file.h>
  #include <linux/highmem.h>
  #include <linux/pagemap.h>
  #include <linux/slab.h>
  #include <linux/vmalloc.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
26
27
  #include <linux/blkdev.h>
  #include <linux/backing-dev.h>
3b32123d7   Gideon Israel Dsouza   mm: use macros fr...
28
  #include <linux/compiler.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
29
30
31
32
  #include <linux/mount.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
120a795da   Al Viro   audit mmap
33
  #include <linux/audit.h>
cf4aebc29   Clark Williams   sched: Move sched...
34
  #include <linux/sched/sysctl.h>
b1de0d139   Mitchel Humpherys   mm: convert some ...
35
  #include <linux/printk.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
36
37
38
39
  
  #include <asm/uaccess.h>
  #include <asm/tlb.h>
  #include <asm/tlbflush.h>
eb8cdec4a   Bernd Schmidt   nommu: add suppor...
40
  #include <asm/mmu_context.h>
8feae1311   David Howells   NOMMU: Make VMAs ...
41
  #include "internal.h"
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
42
  void *high_memory;
944b68749   Arnd Bergmann   mm: export "high_...
43
  EXPORT_SYMBOL(high_memory);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
44
45
  struct page *mem_map;
  unsigned long max_mapnr;
5b8bf3072   gchen gchen   mm/nommu.c: expor...
46
  EXPORT_SYMBOL(max_mapnr);
4266c97a3   Hugh Dickins   nommu: fix two bu...
47
  unsigned long highest_memmap_pfn;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
48
  struct percpu_counter vm_committed_as;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
49
50
  int sysctl_overcommit_memory = OVERCOMMIT_GUESS; /* heuristic overcommit */
  int sysctl_overcommit_ratio = 50; /* default is 50% */
49f0ce5f9   Jerome Marchand   mm: add overcommi...
51
  unsigned long sysctl_overcommit_kbytes __read_mostly;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
52
  int sysctl_max_map_count = DEFAULT_MAX_MAP_COUNT;
fc4d5c292   David Howells   nommu: make the i...
53
  int sysctl_nr_trim_pages = CONFIG_NOMMU_INITIAL_TRIM_EXCESS;
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
54
  unsigned long sysctl_user_reserve_kbytes __read_mostly = 1UL << 17; /* 128MB */
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
55
  unsigned long sysctl_admin_reserve_kbytes __read_mostly = 1UL << 13; /* 8MB */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
56
  int heap_stack_gap = 0;
33e5d7697   David Howells   nommu: fix a numb...
57
  atomic_long_t mmap_pages_allocated;
8feae1311   David Howells   NOMMU: Make VMAs ...
58

997071bcb   K. Y. Srinivasan   mm: export a func...
59
60
61
62
63
64
65
66
67
68
69
70
71
72
  /*
   * Report the system-wide memory commitment.
   *
   * The figure can serve as an input to ballooning decisions when Linux
   * runs as a guest.  On Hyper-V the host runs a policy engine that
   * dynamically balances memory between the virtual machines it hosts,
   * and the commitment reported by each guest is one of the metrics fed
   * into that engine.
   *
   * Returns the non-negative reading of the vm_committed_as counter.
   */
  unsigned long vm_memory_committed(void)
  {
  	unsigned long committed;

  	committed = percpu_counter_read_positive(&vm_committed_as);
  	return committed;
  }
  
  EXPORT_SYMBOL_GPL(vm_memory_committed);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
73
  EXPORT_SYMBOL(mem_map);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
74

8feae1311   David Howells   NOMMU: Make VMAs ...
75
76
77
78
  /*
   * list of mapped, potentially shareable regions
   *
   * - vm_region_jar is the slab cache that struct vm_region records are
   *   freed back to (it is created in mmap_init())
   * - nommu_region_tree is the global rb-tree of regions; insertion orders
   *   nodes by their vm_start
   * - nommu_region_sem is the rw-semaphore taken for writing around
   *   dropping a region reference
   */
  static struct kmem_cache *vm_region_jar;
  struct rb_root nommu_region_tree = RB_ROOT;
  DECLARE_RWSEM(nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
79

f0f37e2f7   Alexey Dobriyan   const: mark struc...
80
  const struct vm_operations_struct generic_file_vm_ops = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
81
82
83
  };
  
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
84
85
86
87
88
89
90
91
   * Return the total memory allocated for this pointer, not
   * just what the caller asked for.
   *
   * Doesn't have to be accurate, i.e. may have races.
   */
  unsigned int kobjsize(const void *objp)
  {
  	struct page *page;
4016a1390   Michael Hennerich   mm/nommu.c: retur...
92
93
94
95
  	/*
  	 * If the object we have should not have ksize performed on it,
  	 * return size of 0
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
96
  	if (!objp || !virt_addr_valid(objp))
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
97
98
99
  		return 0;
  
  	page = virt_to_head_page(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
100
101
102
103
104
  
  	/*
  	 * If the allocator sets PageSlab, we know the pointer came from
  	 * kmalloc().
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
105
106
  	if (PageSlab(page))
  		return ksize(objp);
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
107
  	/*
ab2e83ead   Paul Mundt   NOMMU: Teach kobj...
108
109
110
111
112
113
114
115
116
117
118
119
120
121
  	 * If it's not a compound page, see if we have a matching VMA
  	 * region. This test is intentionally done in reverse order,
  	 * so if there's no VMA, we still fall through and hand back
  	 * PAGE_SIZE for 0-order pages.
  	 */
  	if (!PageCompound(page)) {
  		struct vm_area_struct *vma;
  
  		vma = find_vma(current->mm, (unsigned long)objp);
  		if (vma)
  			return vma->vm_end - vma->vm_start;
  	}
  
  	/*
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
122
  	 * The ksize() function is only guaranteed to work for pointers
5a1603be5   Paul Mundt   nommu: Correct ko...
123
  	 * returned by kmalloc(). So handle arbitrary pointers here.
6cfd53fc0   Paul Mundt   nommu: fix kobjsi...
124
  	 */
5a1603be5   Paul Mundt   nommu: Correct ko...
125
  	return PAGE_SIZE << compound_order(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
126
  }
28a35716d   Michel Lespinasse   mm: use long type...
127
128
129
130
  long __get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		      unsigned long start, unsigned long nr_pages,
  		      unsigned int foll_flags, struct page **pages,
  		      struct vm_area_struct **vmas, int *nonblocking)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
131
  {
910e46da4   Sonic Zhang   [PATCH] Check if ...
132
  	struct vm_area_struct *vma;
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
133
134
135
136
  	unsigned long vm_flags;
  	int i;
  
  	/* calculate required read or write permissions.
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
137
  	 * If FOLL_FORCE is set, we only require the "MAY" flags.
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
138
  	 */
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
139
140
141
142
  	vm_flags  = (foll_flags & FOLL_WRITE) ?
  			(VM_WRITE | VM_MAYWRITE) : (VM_READ | VM_MAYREAD);
  	vm_flags &= (foll_flags & FOLL_FORCE) ?
  			(VM_MAYREAD | VM_MAYWRITE) : (VM_READ | VM_WRITE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
143

9d73777e5   Peter Zijlstra   clarify get_user_...
144
  	for (i = 0; i < nr_pages; i++) {
7561e8ca0   David Howells   NOMMU: Revert 'no...
145
  		vma = find_vma(mm, start);
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
146
147
148
149
  		if (!vma)
  			goto finish_or_fault;
  
  		/* protect what we can, including chardevs */
1c3aff1ce   Hugh Dickins   mm: remove unused...
150
151
  		if ((vma->vm_flags & (VM_IO | VM_PFNMAP)) ||
  		    !(vm_flags & vma->vm_flags))
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
152
  			goto finish_or_fault;
910e46da4   Sonic Zhang   [PATCH] Check if ...
153

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
154
155
156
157
158
159
  		if (pages) {
  			pages[i] = virt_to_page(start);
  			if (pages[i])
  				page_cache_get(pages[i]);
  		}
  		if (vmas)
910e46da4   Sonic Zhang   [PATCH] Check if ...
160
  			vmas[i] = vma;
e1ee65d85   David Howells   NOMMU: Fix __get_...
161
  		start = (start + PAGE_SIZE) & PAGE_MASK;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
162
  	}
7b4d5b8b3   David Howells   [PATCH] NOMMU: Ch...
163
164
165
166
167
  
  	return i;
  
  finish_or_fault:
  	return i ? : -EFAULT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
168
  }
b291f0003   Nick Piggin   mlock: mlocked pa...
169

b291f0003   Nick Piggin   mlock: mlocked pa...
170
171
172
173
174
175
176
  /*
   * get a list of pages in an address range belonging to the specified process
   * and indicate the VMA that covers each page
   * - this is potentially dodgy as we may end incrementing the page count of a
   *   slab page or a secondary page from a compound page
   * - don't permit access to VMAs that don't support it, such as I/O mappings
   */
28a35716d   Michel Lespinasse   mm: use long type...
177
178
179
180
  long get_user_pages(struct task_struct *tsk, struct mm_struct *mm,
  		    unsigned long start, unsigned long nr_pages,
  		    int write, int force, struct page **pages,
  		    struct vm_area_struct **vmas)
b291f0003   Nick Piggin   mlock: mlocked pa...
181
182
183
184
  {
  	int flags = 0;
  
  	if (write)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
185
  		flags |= FOLL_WRITE;
b291f0003   Nick Piggin   mlock: mlocked pa...
186
  	if (force)
58fa879e1   Hugh Dickins   mm: FOLL flags fo...
187
  		flags |= FOLL_FORCE;
b291f0003   Nick Piggin   mlock: mlocked pa...
188

53a7706d5   Michel Lespinasse   mlock: do not hol...
189
190
  	return __get_user_pages(tsk, mm, start, nr_pages, flags, pages, vmas,
  				NULL);
b291f0003   Nick Piggin   mlock: mlocked pa...
191
  }
66aa2b4b1   Greg Ungerer   [PATCH] uclinux: ...
192
  EXPORT_SYMBOL(get_user_pages);
f0818f472   Andrea Arcangeli   mm: gup: add get_...
193
194
195
196
197
198
199
200
201
  /*
   * Same lookup as get_user_pages() without a VMA array; @locked is accepted
   * for interface compatibility and is neither read nor written here.
   */
  long get_user_pages_locked(struct task_struct *tsk, struct mm_struct *mm,
  			   unsigned long start, unsigned long nr_pages,
  			   int write, int force, struct page **pages,
  			   int *locked)
  {
  	long nr;

  	nr = get_user_pages(tsk, mm, start, nr_pages, write, force,
  			    pages, NULL);
  	return nr;
  }
  EXPORT_SYMBOL(get_user_pages_locked);
0fd71a56f   Andrea Arcangeli   mm: gup: add __ge...
202
203
204
205
  long __get_user_pages_unlocked(struct task_struct *tsk, struct mm_struct *mm,
  			       unsigned long start, unsigned long nr_pages,
  			       int write, int force, struct page **pages,
  			       unsigned int gup_flags)
f0818f472   Andrea Arcangeli   mm: gup: add get_...
206
207
208
209
210
211
212
213
  {
  	long ret;
  	down_read(&mm->mmap_sem);
  	ret = get_user_pages(tsk, mm, start, nr_pages, write, force,
  			     pages, NULL);
  	up_read(&mm->mmap_sem);
  	return ret;
  }
0fd71a56f   Andrea Arcangeli   mm: gup: add __ge...
214
215
216
217
218
219
220
221
222
  EXPORT_SYMBOL(__get_user_pages_unlocked);
  
  /* __get_user_pages_unlocked() with no extra gup flags (0). */
  long get_user_pages_unlocked(struct task_struct *tsk, struct mm_struct *mm,
  			     unsigned long start, unsigned long nr_pages,
  			     int write, int force, struct page **pages)
  {
  	long nr;

  	nr = __get_user_pages_unlocked(tsk, mm, start, nr_pages, write,
  				       force, pages, 0);
  	return nr;
  }
f0818f472   Andrea Arcangeli   mm: gup: add get_...
223
  EXPORT_SYMBOL(get_user_pages_unlocked);
dfc2f91ac   Paul Mundt   nommu: provide fo...
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
  /**
   * follow_pfn - look up PFN at a user virtual address
   * @vma: memory mapping
   * @address: user virtual address
   * @pfn: location to store found PFN
   *
   * Only mappings flagged VM_IO or VM_PFNMAP are accepted; for those the
   * PFN is simply @address shifted right by PAGE_SHIFT.
   *
   * Returns zero and the pfn at @pfn on success, -EINVAL otherwise (in
   * which case @pfn is left untouched).
   */
  int follow_pfn(struct vm_area_struct *vma, unsigned long address,
  	unsigned long *pfn)
  {
  	if (vma->vm_flags & (VM_IO | VM_PFNMAP)) {
  		*pfn = address >> PAGE_SHIFT;
  		return 0;
  	}

  	return -EINVAL;
  }
  EXPORT_SYMBOL(follow_pfn);
f1c4069e1   Joonsoo Kim   mm, vmalloc: expo...
244
  LIST_HEAD(vmap_area_list);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
245

b3bdda02a   Christoph Lameter   vmalloc: add cons...
246
  /* Release @addr via kfree(); __vmalloc() in this file allocates with kmalloc(). */
  void vfree(const void *addr)
  {
  	kfree(addr);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
250
  EXPORT_SYMBOL(vfree);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
251

dd0fc66fb   Al Viro   [PATCH] gfp flags...
252
  /*
   * Allocate @size bytes with kmalloc().  @prot is not used.
   */
  void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
  {
  	gfp_t flags = gfp_mask | __GFP_COMP;

  	/*
  	 * kmalloc() returns only a logical address, so __GFP_HIGHMEM
  	 * cannot be passed to it and is stripped here.
  	 */
  	flags &= ~__GFP_HIGHMEM;

  	return kmalloc(size, flags);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
260
  EXPORT_SYMBOL(__vmalloc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
261

f905bc447   Paul Mundt   nommu: add new vm...
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
  void *vmalloc_user(unsigned long size)
  {
  	void *ret;
  
  	ret = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  	if (ret) {
  		struct vm_area_struct *vma;
  
  		down_write(&current->mm->mmap_sem);
  		vma = find_vma(current->mm, (unsigned long)ret);
  		if (vma)
  			vma->vm_flags |= VM_USERMAP;
  		up_write(&current->mm->mmap_sem);
  	}
  
  	return ret;
  }
  EXPORT_SYMBOL(vmalloc_user);
b3bdda02a   Christoph Lameter   vmalloc: add cons...
281
  /* Map @addr to its struct page using virt_to_page(). */
  struct page *vmalloc_to_page(const void *addr)
  {
  	struct page *page = virt_to_page(addr);

  	return page;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
285
  EXPORT_SYMBOL(vmalloc_to_page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
286

b3bdda02a   Christoph Lameter   vmalloc: add cons...
287
  /* Map @addr to a page frame number via its struct page. */
  unsigned long vmalloc_to_pfn(const void *addr)
  {
  	struct page *page = virt_to_page(addr);

  	return page_to_pfn(page);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
291
  EXPORT_SYMBOL(vmalloc_to_pfn);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
292
293
294
  
  /*
   * Copy @count bytes from @addr into @buf.
   *
   * If @buf + @count would wrap past the top of the address space, the
   * length is clamped to the bytes remaining above @buf.  Returns the number
   * of bytes copied.
   */
  long vread(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dst = (unsigned long) buf;
  	unsigned long len = count;

  	/* Don't allow overflow */
  	if (dst + len < len)
  		len = -dst;

  	memcpy(buf, addr, len);
  	return len;
  }
  
  /*
   * Copy @count bytes from @buf to @addr.
   *
   * If @addr + @count would wrap past the top of the address space, the
   * length is clamped to the bytes remaining above @addr.  Returns the number
   * of bytes copied.
   */
  long vwrite(char *buf, char *addr, unsigned long count)
  {
  	unsigned long dst = (unsigned long) addr;
  	unsigned long len = count;

  	/* Don't allow overflow */
  	if (dst + len < len)
  		len = -dst;

  	memcpy(addr, buf, len);
  	return len;
  }
  
  /*
   *	vmalloc  -  allocate virtually contiguous memory
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into contiguous kernel virtual space.
   *
c1c8897f8   Michael Opdenacker   Spelling fix: "co...
320
   *	For tight control over page level allocator and protection flags
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
321
322
323
324
325
326
   *	use __vmalloc() instead.
   */
  void *vmalloc(unsigned long size)
  {
         return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
  }
f61388822   Andrew Morton   [PATCH] nommu: im...
327
  EXPORT_SYMBOL(vmalloc);
e1ca7788d   Dave Young   mm: add vzalloc()...
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
  /*
   *	vzalloc - allocate virtually continguos memory with zero fill
   *
   *	@size:		allocation size
   *
   *	Allocate enough pages to cover @size from the page level
   *	allocator and map them into continguos kernel virtual space.
   *	The memory allocated is set to zero.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  void *vzalloc(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO,
  			PAGE_KERNEL);
  }
  EXPORT_SYMBOL(vzalloc);
  
  /**
   * vmalloc_node - allocate memory on a specific node
   * @size:	allocation size
   * @node:	numa node
   *
   * Allocate enough pages to cover @size from the page level
   * allocator and map them into contiguous kernel virtual space.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
f61388822   Andrew Morton   [PATCH] nommu: im...
358
359
360
361
  void *vmalloc_node(unsigned long size, int node)
  {
  	void *mem;

  	/* @node is ignored: the request is served by plain vmalloc() */
  	mem = vmalloc(size);
  	return mem;
  }
9a14f653d   Paul Mundt   nommu: Fix up vma...
362
  EXPORT_SYMBOL(vmalloc_node);
e1ca7788d   Dave Young   mm: add vzalloc()...
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
  
  /**
   * vzalloc_node - allocate memory on a specific node with zero fill
   * @size:	allocation size
   * @node:	numa node
   *
   * @node is ignored here; the request is handed straight to vzalloc(),
   * so the memory returned is zeroed.
   *
   * For tight control over page level allocator and protection flags
   * use __vmalloc() instead.
   */
  void *vzalloc_node(unsigned long size, int node)
  {
  	void *mem;

  	mem = vzalloc(size);
  	return mem;
  }
  EXPORT_SYMBOL(vzalloc_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
381

1af446edf   Paul Mundt   nommu: Provide vm...
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
  #ifndef PAGE_KERNEL_EXEC
  # define PAGE_KERNEL_EXEC PAGE_KERNEL
  #endif
  
  /**
   *	vmalloc_exec  -  allocate virtually contiguous, executable memory
   *	@size:		allocation size
   *
   *	Kernel-internal function to allocate enough pages to cover @size
   *	the page level allocator and map them into contiguous and
   *	executable kernel virtual space.
   *
   *	For tight control over page level allocator and protection flags
   *	use __vmalloc() instead.
   */
  
  void *vmalloc_exec(unsigned long size)
  {
  	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
402
403
  /**
   * vmalloc_32  -  allocate virtually contiguous memory (32bit addressable)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
404
405
406
407
408
409
410
411
412
   *	@size:		allocation size
   *
   *	Allocate enough 32bit PA addressable pages to cover @size from the
   *	page level allocator and map them into contiguous kernel virtual space.
   */
  void *vmalloc_32(unsigned long size)
  {
  	void *mem;

  	/* plain GFP_KERNEL: __GFP_HIGHMEM is not requested here */
  	mem = __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);
  	return mem;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
413
414
415
416
417
418
419
420
  EXPORT_SYMBOL(vmalloc_32);
  
  /**
   * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
   *	@size:		allocation size
   *
   * The resulting memory area is 32bit addressable and zeroed so it can be
   * mapped to userspace without leaking data.
f905bc447   Paul Mundt   nommu: add new vm...
421
422
423
   *
   * VM_USERMAP is set on the corresponding VMA so that subsequent calls to
   * remap_vmalloc_range() are permissible.
b50731732   Paul Mundt   nommu: vmalloc_32...
424
425
426
   */
  void *vmalloc_32_user(unsigned long size)
  {
  	void *mem;

  	/*
  	 * The ZONE_DMA handling for 64-bit still needs sorting out;
  	 * until then vmalloc_user() is used as-is.
  	 */
  	mem = vmalloc_user(size);
  	return mem;
  }
  EXPORT_SYMBOL(vmalloc_32_user);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
434
435
436
437
438
439
  
  /*
   * vmap() has no implementation in this file: any call hits BUG().  The
   * NULL return only exists to give the function a return statement.
   */
  void *vmap(struct page **pages, unsigned int count, unsigned long flags, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
440
  EXPORT_SYMBOL(vmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
441

b3bdda02a   Christoph Lameter   vmalloc: add cons...
442
  /* Counterpart of vmap(); likewise unimplemented here, so any call hits BUG(). */
  void vunmap(const void *addr)
  {
  	BUG();
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
446
  EXPORT_SYMBOL(vunmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
447

eb6434d9e   Paul Mundt   nommu: Stub in vm...
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
  /*
   * vm_map_ram() has no implementation in this file: any call hits BUG().
   * The NULL return only exists to give the function a return statement.
   */
  void *vm_map_ram(struct page **pages, unsigned int count, int node, pgprot_t prot)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL(vm_map_ram);
  
  /* Counterpart of vm_map_ram(); likewise unimplemented here, so any call hits BUG(). */
  void vm_unmap_ram(const void *mem, unsigned int count)
  {
  	BUG();
  }
  EXPORT_SYMBOL(vm_unmap_ram);
  
  /* Deliberately empty: this implementation has nothing to do. */
  void vm_unmap_aliases(void)
  {
  }
  EXPORT_SYMBOL_GPL(vm_unmap_aliases);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
465
  /*
1eeb66a1b   Christoph Hellwig   move die notifier...
466
467
468
   * Implement a stub for vmalloc_sync_all() if the architecture chose not to
   * have one.
   */
3b32123d7   Gideon Israel Dsouza   mm: use macros fr...
469
  /* Weak, empty default; an architecture may supply its own definition. */
  void __weak vmalloc_sync_all(void)
  {
  }
29c185e5c   Paul Mundt   nommu: Provide st...
472
473
474
475
476
477
478
479
480
481
482
483
  /**
   *	alloc_vm_area - allocate a range of kernel address space
   *	@size:		size of the area
   *
   *	Returns:	NULL on failure, vm_struct on success
   *
   *	This function reserves a range of kernel address space, and
   *	allocates pagetables to map that range.  No actual mappings
   *	are created.  If the kernel address space is not shared
   *	between processes, it syncs the pagetable across all
   *	processes.
   */
cd12909cb   David Vrabel   xen: map foreign ...
484
  /* Unimplemented in this file: any call hits BUG(); the NULL return is never meaningful. */
  struct vm_struct *alloc_vm_area(size_t size, pte_t **ptes)
  {
  	BUG();
  	return NULL;
  }
  EXPORT_SYMBOL_GPL(alloc_vm_area);
  
  /* Counterpart of alloc_vm_area(); likewise unimplemented here, so any call hits BUG(). */
  void free_vm_area(struct vm_struct *area)
  {
  	BUG();
  }
  EXPORT_SYMBOL_GPL(free_vm_area);
b50731732   Paul Mundt   nommu: vmalloc_32...
496
497
498
499
500
501
  /*
   * Inserting a page into a VMA is not supported by this implementation:
   * the call always fails with -EINVAL and touches none of its arguments.
   */
  int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
  		   struct page *page)
  {
  	return -EINVAL;
  }
  EXPORT_SYMBOL(vm_insert_page);
1eeb66a1b   Christoph Hellwig   move die notifier...
502
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
503
504
505
506
507
508
   *  sys_brk() for the most part doesn't need the global kernel
   *  lock, except when an application is doing something nasty
   *  like trying to un-brk an area that has already been mapped
   *  to a regular file.  in this case, the unmapping will need
   *  to invoke file system routines that need the global lock.
   */
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
509
  SYSCALL_DEFINE1(brk, unsigned long, brk)
  {
  	struct mm_struct *mm = current->mm;

  	/*
  	 * A request outside [start_brk, context.end_brk], or one that
  	 * changes nothing, just reports the current break.
  	 */
  	if (brk < mm->start_brk || brk > mm->context.end_brk ||
  	    brk == mm->brk)
  		return mm->brk;

  	/*
  	 * Shrinking is always allowed and needs no further work; when
  	 * growing, flush the icache over the newly covered range first.
  	 */
  	if (brk > mm->brk)
  		flush_icache_range(mm->brk, brk);

  	mm->brk = brk;
  	return brk;
  }
8feae1311   David Howells   NOMMU: Make VMAs ...
533
534
535
536
  /*
   * Boot-time setup: initialise the vm_committed_as per-cpu counter and
   * create the slab cache that vm_region records are allocated from.
   */
  void __init mmap_init(void)
  {
  	int err = percpu_counter_init(&vm_committed_as, 0, GFP_KERNEL);

  	VM_BUG_ON(err);
  	vm_region_jar = KMEM_CACHE(vm_region, SLAB_PANIC);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
543

3034097a5   David Howells   [PATCH] NOMMU: Or...
544
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
545
546
   * validate the region tree
   * - the caller must hold the region lock
3034097a5   David Howells   [PATCH] NOMMU: Or...
547
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
548
549
  #ifdef CONFIG_DEBUG_NOMMU_REGIONS
  /*
   * Walk the global region tree in order and BUG() if any region is
   * malformed (vm_end <= vm_start, or vm_top < vm_end) or starts below the
   * vm_top of the region before it.
   *
   * BUG_ON() already marks its condition unlikely, so the conditions are
   * passed to it directly.
   */
  static noinline void validate_nommu_regions(void)
  {
  	struct vm_region *region, *last;
  	struct rb_node *p, *lastp;

  	lastp = rb_first(&nommu_region_tree);
  	if (!lastp)
  		return;

  	/* the first region has no predecessor: check it on its own */
  	last = rb_entry(lastp, struct vm_region, vm_rb);
  	BUG_ON(last->vm_end <= last->vm_start);
  	BUG_ON(last->vm_top < last->vm_end);

  	while ((p = rb_next(lastp))) {
  		region = rb_entry(p, struct vm_region, vm_rb);
  		last = rb_entry(lastp, struct vm_region, vm_rb);

  		BUG_ON(region->vm_end <= region->vm_start);
  		BUG_ON(region->vm_top < region->vm_end);
  		/* neighbours must not overlap */
  		BUG_ON(region->vm_start < last->vm_top);

  		lastp = p;
  	}
  }
  #else
  /* validation compiled out: nothing to check */
  static void validate_nommu_regions(void)
  {
  }
  #endif
3034097a5   David Howells   [PATCH] NOMMU: Or...
577
578
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
579
   * add a region into the global tree
3034097a5   David Howells   [PATCH] NOMMU: Or...
580
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
581
  static void add_nommu_region(struct vm_region *region)
3034097a5   David Howells   [PATCH] NOMMU: Or...
582
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
583
584
  	struct vm_region *pregion;
  	struct rb_node **p, *parent;
3034097a5   David Howells   [PATCH] NOMMU: Or...
585

8feae1311   David Howells   NOMMU: Make VMAs ...
586
  	validate_nommu_regions();
8feae1311   David Howells   NOMMU: Make VMAs ...
587
588
589
590
591
592
593
594
595
596
597
598
599
  	parent = NULL;
  	p = &nommu_region_tree.rb_node;
  	while (*p) {
  		parent = *p;
  		pregion = rb_entry(parent, struct vm_region, vm_rb);
  		if (region->vm_start < pregion->vm_start)
  			p = &(*p)->rb_left;
  		else if (region->vm_start > pregion->vm_start)
  			p = &(*p)->rb_right;
  		else if (pregion == region)
  			return;
  		else
  			BUG();
3034097a5   David Howells   [PATCH] NOMMU: Or...
600
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
601
602
  	rb_link_node(&region->vm_rb, parent, p);
  	rb_insert_color(&region->vm_rb, &nommu_region_tree);
3034097a5   David Howells   [PATCH] NOMMU: Or...
603

8feae1311   David Howells   NOMMU: Make VMAs ...
604
  	validate_nommu_regions();
3034097a5   David Howells   [PATCH] NOMMU: Or...
605
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
606
607
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
608
   * delete a region from the global tree
930e652a2   David Howells   [PATCH] NOMMU: Ma...
609
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
610
  static void delete_nommu_region(struct vm_region *region)
930e652a2   David Howells   [PATCH] NOMMU: Ma...
611
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
612
  	BUG_ON(!nommu_region_tree.rb_node);
930e652a2   David Howells   [PATCH] NOMMU: Ma...
613

8feae1311   David Howells   NOMMU: Make VMAs ...
614
615
616
  	validate_nommu_regions();
  	rb_erase(&region->vm_rb, &nommu_region_tree);
  	validate_nommu_regions();
57c8f63e8   Greg Ungerer   nommu: stub expan...
617
  }
930e652a2   David Howells   [PATCH] NOMMU: Ma...
618
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
619
   * free a contiguous series of pages
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
620
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
621
  static void free_page_series(unsigned long from, unsigned long to)
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
622
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
623
624
  	for (; from < to; from += PAGE_SIZE) {
  		struct page *page = virt_to_page(from);
33e5d7697   David Howells   nommu: fix a numb...
625
  		atomic_long_dec(&mmap_pages_allocated);
8feae1311   David Howells   NOMMU: Make VMAs ...
626
  		put_page(page);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
627
  	}
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
628
629
630
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
631
   * release a reference to a region
33e5d7697   David Howells   nommu: fix a numb...
632
   * - the caller must hold the region semaphore for writing, which this releases
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
633
   * - the region may not have been added to the tree yet, in which case vm_top
8feae1311   David Howells   NOMMU: Make VMAs ...
634
   *   will equal vm_start
3034097a5   David Howells   [PATCH] NOMMU: Or...
635
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
636
637
  static void __put_nommu_region(struct vm_region *region)
  	__releases(nommu_region_sem)
  {
  	BUG_ON(!nommu_region_tree.rb_node);

  	/* other users remain: just release the semaphore */
  	if (--region->vm_usage != 0) {
  		up_write(&nommu_region_sem);
  		return;
  	}

  	/* last user: unlink the region if it ever made it into the tree */
  	if (region->vm_top > region->vm_start)
  		delete_nommu_region(region);
  	up_write(&nommu_region_sem);

  	if (region->vm_file)
  		fput(region->vm_file);

  	/*
  	 * Only regions flagged VM_MAPPED_COPY have their pages freed here;
  	 * IO memory and memory shared directly out of the pagecache from
  	 * ramfs/tmpfs must not be released.
  	 */
  	if (region->vm_flags & VM_MAPPED_COPY)
  		free_page_series(region->vm_start, region->vm_top);

  	kmem_cache_free(vm_region_jar, region);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
658

8feae1311   David Howells   NOMMU: Make VMAs ...
659
660
661
662
663
664
665
  /*
   * Drop one reference on a region.
   * - takes nommu_region_sem for writing and hands it to
   *   __put_nommu_region(), which releases it
   */
  static void put_nommu_region(struct vm_region *region)
  {
  	down_write(&nommu_region_sem);
  	__put_nommu_region(region);
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
667
  /*
   * Apply @flags as the protection for every page covered by a VMA.
   * - compiles to an empty function unless CONFIG_MPU is set
   */
  static void protect_vma(struct vm_area_struct *vma, unsigned long flags)
  {
  #ifdef CONFIG_MPU
  	struct mm_struct *mm = vma->vm_mm;
  	long addr;

  	/* walk page by page from the page containing vm_start up to vm_end */
  	for (addr = vma->vm_start & PAGE_MASK; addr < vma->vm_end;
  	     addr += PAGE_SIZE)
  		protect_page(mm, addr, flags);

  	update_protections(mm);
  #endif
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
684
685
686
687
   * add a VMA into a process's mm_struct in the appropriate place in the list
   * and tree and add to the address space's page tree also if not an anonymous
   * page
   * - should be called with mm->mmap_sem held writelocked
3034097a5   David Howells   [PATCH] NOMMU: Or...
688
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
689
  static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
690
  {
6038def0d   Namhyung Kim   mm: nommu: sort m...
691
  	struct vm_area_struct *pvma, *prev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
692
  	struct address_space *mapping;
6038def0d   Namhyung Kim   mm: nommu: sort m...
693
  	struct rb_node **p, *parent, *rb_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
694

8feae1311   David Howells   NOMMU: Make VMAs ...
695
696
697
698
  	BUG_ON(!vma->vm_region);
  
  	mm->map_count++;
  	vma->vm_mm = mm;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
699

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
700
  	protect_vma(vma, vma->vm_flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
701
702
703
  	/* add the VMA to the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
704
  		i_mmap_lock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
705
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
706
  		vma_interval_tree_insert(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
707
  		flush_dcache_mmap_unlock(mapping);
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
708
  		i_mmap_unlock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
709
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
710
  	/* add the VMA to the tree */
6038def0d   Namhyung Kim   mm: nommu: sort m...
711
  	parent = rb_prev = NULL;
8feae1311   David Howells   NOMMU: Make VMAs ...
712
  	p = &mm->mm_rb.rb_node;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
713
714
715
  	while (*p) {
  		parent = *p;
  		pvma = rb_entry(parent, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
716
717
718
  		/* sort by: start addr, end addr, VMA struct addr in that order
  		 * (the latter is necessary as we may get identical VMAs) */
  		if (vma->vm_start < pvma->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
719
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
720
721
  		else if (vma->vm_start > pvma->vm_start) {
  			rb_prev = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
722
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
723
  		} else if (vma->vm_end < pvma->vm_end)
8feae1311   David Howells   NOMMU: Make VMAs ...
724
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
725
726
  		else if (vma->vm_end > pvma->vm_end) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
727
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
728
  		} else if (vma < pvma)
8feae1311   David Howells   NOMMU: Make VMAs ...
729
  			p = &(*p)->rb_left;
6038def0d   Namhyung Kim   mm: nommu: sort m...
730
731
  		else if (vma > pvma) {
  			rb_prev = parent;
8feae1311   David Howells   NOMMU: Make VMAs ...
732
  			p = &(*p)->rb_right;
6038def0d   Namhyung Kim   mm: nommu: sort m...
733
  		} else
8feae1311   David Howells   NOMMU: Make VMAs ...
734
  			BUG();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
735
736
737
  	}
  
  	rb_link_node(&vma->vm_rb, parent, p);
8feae1311   David Howells   NOMMU: Make VMAs ...
738
739
740
  	rb_insert_color(&vma->vm_rb, &mm->mm_rb);
  
  	/* add VMA to the VMA list also */
6038def0d   Namhyung Kim   mm: nommu: sort m...
741
742
743
  	prev = NULL;
  	if (rb_prev)
  		prev = rb_entry(rb_prev, struct vm_area_struct, vm_rb);
8feae1311   David Howells   NOMMU: Make VMAs ...
744

6038def0d   Namhyung Kim   mm: nommu: sort m...
745
  	__vma_link_list(mm, vma, prev, parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
746
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
747
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
748
   * delete a VMA from its owning mm_struct and address space
3034097a5   David Howells   [PATCH] NOMMU: Or...
749
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
750
  static void delete_vma_from_mm(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
751
  {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
752
  	int i;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
753
  	struct address_space *mapping;
8feae1311   David Howells   NOMMU: Make VMAs ...
754
  	struct mm_struct *mm = vma->vm_mm;
615d6e875   Davidlohr Bueso   mm: per-thread vm...
755
  	struct task_struct *curr = current;
8feae1311   David Howells   NOMMU: Make VMAs ...
756

eb8cdec4a   Bernd Schmidt   nommu: add suppor...
757
  	protect_vma(vma, 0);
8feae1311   David Howells   NOMMU: Make VMAs ...
758
  	mm->map_count--;
615d6e875   Davidlohr Bueso   mm: per-thread vm...
759
760
761
  	for (i = 0; i < VMACACHE_SIZE; i++) {
  		/* if the vma is cached, invalidate the entire cache */
  		if (curr->vmacache[i] == vma) {
e020d5bd8   Steven Miao   mm: nommu: per-th...
762
  			vmacache_invalidate(mm);
615d6e875   Davidlohr Bueso   mm: per-thread vm...
763
764
765
  			break;
  		}
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
766
767
768
769
  
  	/* remove the VMA from the mapping */
  	if (vma->vm_file) {
  		mapping = vma->vm_file->f_mapping;
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
770
  		i_mmap_lock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
771
  		flush_dcache_mmap_lock(mapping);
6b2dbba8b   Michel Lespinasse   mm: replace vma p...
772
  		vma_interval_tree_remove(vma, &mapping->i_mmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
773
  		flush_dcache_mmap_unlock(mapping);
83cde9e8b   Davidlohr Bueso   mm: use new helpe...
774
  		i_mmap_unlock_write(mapping);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
775
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
776
777
  	/* remove from the MM's tree and list */
  	rb_erase(&vma->vm_rb, &mm->mm_rb);
b951bf2c4   Namhyung Kim   mm: nommu: don't ...
778
779
780
781
782
783
784
785
  
  	if (vma->vm_prev)
  		vma->vm_prev->vm_next = vma->vm_next;
  	else
  		mm->mmap = vma->vm_next;
  
  	if (vma->vm_next)
  		vma->vm_next->vm_prev = vma->vm_prev;
8feae1311   David Howells   NOMMU: Make VMAs ...
786
787
788
789
790
791
792
  }
  
  /*
   * destroy a VMA record
   */
  static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
793
794
  	if (vma->vm_ops && vma->vm_ops->close)
  		vma->vm_ops->close(vma);
e9714acf8   Konstantin Khlebnikov   mm: kill vma flag...
795
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
796
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
797
798
799
800
801
802
803
804
805
806
807
  	put_nommu_region(vma->vm_region);
  	kmem_cache_free(vm_area_cachep, vma);
  }
  
  /*
   * look up the first VMA in which addr resides, NULL if none
   * - should be called with mm->mmap_sem at least held readlocked
   */
  struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *vma;
8feae1311   David Howells   NOMMU: Make VMAs ...
808
809
  
  	/* check the cache first */
615d6e875   Davidlohr Bueso   mm: per-thread vm...
810
811
  	vma = vmacache_find(mm, addr);
  	if (likely(vma))
8feae1311   David Howells   NOMMU: Make VMAs ...
812
  		return vma;
e922c4c53   Namhyung Kim   mm: nommu: find v...
813
  	/* trawl the list (there may be multiple mappings in which addr
8feae1311   David Howells   NOMMU: Make VMAs ...
814
  	 * resides) */
e922c4c53   Namhyung Kim   mm: nommu: find v...
815
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
8feae1311   David Howells   NOMMU: Make VMAs ...
816
817
818
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end > addr) {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
819
  			vmacache_update(addr, vma);
8feae1311   David Howells   NOMMU: Make VMAs ...
820
821
822
823
824
825
826
827
828
829
830
831
832
833
  			return vma;
  		}
  	}
  
  	return NULL;
  }
  EXPORT_SYMBOL(find_vma);
  
  /*
   * Find the VMA containing addr.
   * - we don't extend stack VMAs under NOMMU conditions, so this is just
   *   find_vma()
   */
  struct vm_area_struct *find_extend_vma(struct mm_struct *mm, unsigned long addr)
  {
  	struct vm_area_struct *vma = find_vma(mm, addr);

  	return vma;
  }
  
  /*
   * Expand a stack to a given address.
   * - not supported under NOMMU conditions: both arguments are ignored and
   *   -ENOMEM is always returned
   */
  int expand_stack(struct vm_area_struct *vma, unsigned long address)
  {
  	(void)vma;
  	(void)address;

  	return -ENOMEM;
  }
  
  /*
   * look up the first VMA exactly that exactly matches addr
   * - should be called with mm->mmap_sem at least held readlocked
   */
  static struct vm_area_struct *find_vma_exact(struct mm_struct *mm,
  					     unsigned long addr,
  					     unsigned long len)
  {
  	struct vm_area_struct *vma;
8feae1311   David Howells   NOMMU: Make VMAs ...
855
856
857
  	unsigned long end = addr + len;
  
  	/* check the cache first */
615d6e875   Davidlohr Bueso   mm: per-thread vm...
858
859
  	vma = vmacache_find_exact(mm, addr, end);
  	if (vma)
8feae1311   David Howells   NOMMU: Make VMAs ...
860
  		return vma;
e922c4c53   Namhyung Kim   mm: nommu: find v...
861
  	/* trawl the list (there may be multiple mappings in which addr
8feae1311   David Howells   NOMMU: Make VMAs ...
862
  	 * resides) */
e922c4c53   Namhyung Kim   mm: nommu: find v...
863
  	for (vma = mm->mmap; vma; vma = vma->vm_next) {
8feae1311   David Howells   NOMMU: Make VMAs ...
864
865
866
867
868
  		if (vma->vm_start < addr)
  			continue;
  		if (vma->vm_start > addr)
  			return NULL;
  		if (vma->vm_end == end) {
615d6e875   Davidlohr Bueso   mm: per-thread vm...
869
  			vmacache_update(addr, vma);
8feae1311   David Howells   NOMMU: Make VMAs ...
870
871
872
873
874
  			return vma;
  		}
  	}
  
  	return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
875
876
877
878
879
880
881
882
883
884
885
886
887
888
  }
  
  /*
   * determine whether a mapping should be permitted and, if so, what sort of
   * mapping we're capable of supporting
   */
  static int validate_mmap_request(struct file *file,
  				 unsigned long addr,
  				 unsigned long len,
  				 unsigned long prot,
  				 unsigned long flags,
  				 unsigned long pgoff,
  				 unsigned long *_capabilities)
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
889
  	unsigned long capabilities, rlen;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
890
891
892
  	int ret;
  
  	/* do the simple checks first */
22cc877b3   Leon Romanovsky   mm: nommu: refact...
893
  	if (flags & MAP_FIXED)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
894
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
895
896
897
898
  
  	if ((flags & MAP_TYPE) != MAP_PRIVATE &&
  	    (flags & MAP_TYPE) != MAP_SHARED)
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
899
  	if (!len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
900
  		return -EINVAL;
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
901
  	/* Careful about overflows.. */
8feae1311   David Howells   NOMMU: Make VMAs ...
902
903
  	rlen = PAGE_ALIGN(len);
  	if (!rlen || rlen > TASK_SIZE)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
904
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
905
  	/* offset overflow? */
8feae1311   David Howells   NOMMU: Make VMAs ...
906
  	if ((pgoff + (rlen >> PAGE_SHIFT)) < pgoff)
f81cff0d4   Mike Frysinger   [PATCH] uclinux: ...
907
  		return -EOVERFLOW;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
908
909
  
  	if (file) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
910
  		/* files must support mmap */
72c2d5319   Al Viro   file->f_op is nev...
911
  		if (!file->f_op->mmap)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
912
913
914
915
916
917
  			return -ENODEV;
  
  		/* work out if what we've got could possibly be shared
  		 * - we support chardevs that provide their own "memory"
  		 * - we support files/blockdevs that are memory backed
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
918
919
920
  		if (file->f_op->mmap_capabilities) {
  			capabilities = file->f_op->mmap_capabilities(file);
  		} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
921
922
  			/* no explicit capabilities set, so assume some
  			 * defaults */
496ad9aa8   Al Viro   new helper: file_...
923
  			switch (file_inode(file)->i_mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
924
925
  			case S_IFREG:
  			case S_IFBLK:
b4caecd48   Christoph Hellwig   fs: introduce f_o...
926
  				capabilities = NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
927
928
929
930
  				break;
  
  			case S_IFCHR:
  				capabilities =
b4caecd48   Christoph Hellwig   fs: introduce f_o...
931
932
933
  					NOMMU_MAP_DIRECT |
  					NOMMU_MAP_READ |
  					NOMMU_MAP_WRITE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
934
935
936
937
938
939
940
941
942
943
  				break;
  
  			default:
  				return -EINVAL;
  			}
  		}
  
  		/* eliminate any capabilities that we can't support on this
  		 * device */
  		if (!file->f_op->get_unmapped_area)
b4caecd48   Christoph Hellwig   fs: introduce f_o...
944
  			capabilities &= ~NOMMU_MAP_DIRECT;
6e242a1ce   Al Viro   nommu: use __vfs_...
945
  		if (!(file->f_mode & FMODE_CAN_READ))
b4caecd48   Christoph Hellwig   fs: introduce f_o...
946
  			capabilities &= ~NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
947

28d7a6ae9   Graff Yang   nommu: check fd r...
948
949
950
  		/* The file shall have been opened with read permission. */
  		if (!(file->f_mode & FMODE_READ))
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
951
952
953
954
955
  		if (flags & MAP_SHARED) {
  			/* do checks for writing, appending and locking */
  			if ((prot & PROT_WRITE) &&
  			    !(file->f_mode & FMODE_WRITE))
  				return -EACCES;
496ad9aa8   Al Viro   new helper: file_...
956
  			if (IS_APPEND(file_inode(file)) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
957
958
  			    (file->f_mode & FMODE_WRITE))
  				return -EACCES;
d7a06983a   Jeff Layton   locks: fix locks_...
959
  			if (locks_verify_locked(file))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
960
  				return -EAGAIN;
b4caecd48   Christoph Hellwig   fs: introduce f_o...
961
  			if (!(capabilities & NOMMU_MAP_DIRECT))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
962
  				return -ENODEV;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
963
  			/* we mustn't privatise shared mappings */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
964
  			capabilities &= ~NOMMU_MAP_COPY;
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
965
  		} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
966
967
  			/* we're going to read the file into private memory we
  			 * allocate */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
968
  			if (!(capabilities & NOMMU_MAP_COPY))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
969
970
971
972
973
  				return -ENODEV;
  
  			/* we don't permit a private writable mapping to be
  			 * shared with the backing device */
  			if (prot & PROT_WRITE)
b4caecd48   Christoph Hellwig   fs: introduce f_o...
974
  				capabilities &= ~NOMMU_MAP_DIRECT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
975
  		}
b4caecd48   Christoph Hellwig   fs: introduce f_o...
976
977
978
979
  		if (capabilities & NOMMU_MAP_DIRECT) {
  			if (((prot & PROT_READ)  && !(capabilities & NOMMU_MAP_READ))  ||
  			    ((prot & PROT_WRITE) && !(capabilities & NOMMU_MAP_WRITE)) ||
  			    ((prot & PROT_EXEC)  && !(capabilities & NOMMU_MAP_EXEC))
3c7b20454   Bernd Schmidt   nommu: allow priv...
980
  			    ) {
b4caecd48   Christoph Hellwig   fs: introduce f_o...
981
  				capabilities &= ~NOMMU_MAP_DIRECT;
3c7b20454   Bernd Schmidt   nommu: allow priv...
982
  				if (flags & MAP_SHARED) {
22cc877b3   Leon Romanovsky   mm: nommu: refact...
983
984
  					pr_warn("MAP_SHARED not completely supported on !MMU
  ");
3c7b20454   Bernd Schmidt   nommu: allow priv...
985
986
987
988
  					return -EINVAL;
  				}
  			}
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
989
990
  		/* handle executable mappings and implied executable
  		 * mappings */
e9536ae72   Josef Sipek   [PATCH] struct pa...
991
  		if (file->f_path.mnt->mnt_flags & MNT_NOEXEC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
992
993
  			if (prot & PROT_EXEC)
  				return -EPERM;
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
994
  		} else if ((prot & PROT_READ) && !(prot & PROT_EXEC)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
995
996
  			/* handle implication of PROT_EXEC by PROT_READ */
  			if (current->personality & READ_IMPLIES_EXEC) {
b4caecd48   Christoph Hellwig   fs: introduce f_o...
997
  				if (capabilities & NOMMU_MAP_EXEC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
998
999
  					prot |= PROT_EXEC;
  			}
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1000
  		} else if ((prot & PROT_READ) &&
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1001
  			 (prot & PROT_EXEC) &&
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1002
  			 !(capabilities & NOMMU_MAP_EXEC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1003
1004
  			 ) {
  			/* backing file is not executable, try to copy */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1005
  			capabilities &= ~NOMMU_MAP_DIRECT;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1006
  		}
ac7149045   Choi Gi-yong   mm: fix 'ERROR: d...
1007
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1008
1009
1010
  		/* anonymous mappings are always memory backed and can be
  		 * privately mapped
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1011
  		capabilities = NOMMU_MAP_COPY;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1012
1013
1014
1015
1016
1017
1018
1019
  
  		/* handle PROT_EXEC implication by PROT_READ */
  		if ((prot & PROT_READ) &&
  		    (current->personality & READ_IMPLIES_EXEC))
  			prot |= PROT_EXEC;
  	}
  
  	/* allow the security API to have its say */
e5467859f   Al Viro   split ->file_mmap...
1020
1021
1022
  	ret = security_mmap_addr(addr);
  	if (ret < 0)
  		return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
  
  	/* looks okay */
  	*_capabilities = capabilities;
  	return 0;
  }
  
  /*
   * we've determined that we can make the mapping, now translate what we
   * now know into VMA flags
   */
  static unsigned long determine_vm_flags(struct file *file,
  					unsigned long prot,
  					unsigned long flags,
  					unsigned long capabilities)
  {
  	unsigned long vm_flags;
  
  	vm_flags = calc_vm_prot_bits(prot) | calc_vm_flag_bits(flags);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1041
  	/* vm_flags |= mm->def_flags; */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1042
  	if (!(capabilities & NOMMU_MAP_DIRECT)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1043
  		/* attempt to share read-only copies of mapped file chunks */
3c7b20454   Bernd Schmidt   nommu: allow priv...
1044
  		vm_flags |= VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1045
1046
  		if (file && !(prot & PROT_WRITE))
  			vm_flags |= VM_MAYSHARE;
3c7b20454   Bernd Schmidt   nommu: allow priv...
1047
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1048
1049
1050
  		/* overlay a shareable mapping on the backing device or inode
  		 * if possible - used for chardevs, ramfs/tmpfs/shmfs and
  		 * romfs/cramfs */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1051
  		vm_flags |= VM_MAYSHARE | (capabilities & NOMMU_VMFLAGS);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1052
  		if (flags & MAP_SHARED)
3c7b20454   Bernd Schmidt   nommu: allow priv...
1053
  			vm_flags |= VM_SHARED;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1054
1055
1056
1057
1058
1059
  	}
  
  	/* refuse to let anyone share private mappings with this process if
  	 * it's being traced - otherwise breakpoints set in it may interfere
  	 * with another untraced process
  	 */
a288eecce   Tejun Heo   ptrace: kill triv...
1060
  	if ((flags & MAP_PRIVATE) && current->ptrace)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1061
1062
1063
1064
1065
1066
  		vm_flags &= ~VM_MAYSHARE;
  
  	return vm_flags;
  }
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1067
1068
   * set up a shared mapping on a file (the driver or filesystem provides and
   * pins the storage)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1069
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1070
  static int do_mmap_shared_file(struct vm_area_struct *vma)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1071
1072
1073
1074
  {
  	int ret;
  
  	ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1075
1076
  	if (ret == 0) {
  		vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1077
  		return 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1078
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1079
1080
  	if (ret != -ENOSYS)
  		return ret;
3fa30460e   David Howells   nommu: fix an inc...
1081
1082
1083
  	/* getting -ENOSYS indicates that direct mmap isn't possible (as
  	 * opposed to tried but failed) so we can only give a suitable error as
  	 * it's not possible to make a private copy if MAP_SHARED was given */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1084
1085
1086
1087
1088
1089
  	return -ENODEV;
  }
  
  /*
   * set up a private mapping or an anonymous shared mapping
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1090
1091
  static int do_mmap_private(struct vm_area_struct *vma,
  			   struct vm_region *region,
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1092
1093
  			   unsigned long len,
  			   unsigned long capabilities)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1094
  {
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1095
  	unsigned long total, point;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1096
  	void *base;
8feae1311   David Howells   NOMMU: Make VMAs ...
1097
  	int ret, order;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1098
1099
1100
1101
1102
  
  	/* invoke the file's mapping function so that it can keep track of
  	 * shared mappings on devices or memory
  	 * - VM_MAYSHARE will be set if it may attempt to share
  	 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1103
  	if (capabilities & NOMMU_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1104
  		ret = vma->vm_file->f_op->mmap(vma->vm_file, vma);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1105
  		if (ret == 0) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1106
  			/* shouldn't return success if we're not sharing */
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1107
1108
  			BUG_ON(!(vma->vm_flags & VM_MAYSHARE));
  			vma->vm_region->vm_top = vma->vm_region->vm_end;
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1109
  			return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1110
  		}
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1111
1112
  		if (ret != -ENOSYS)
  			return ret;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1113
1114
1115
1116
1117
  
  		/* getting an ENOSYS error indicates that direct mmap isn't
  		 * possible (as opposed to tried but failed) so we'll try to
  		 * make a private copy of the data and map that instead */
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1118

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1119
1120
1121
1122
  	/* allocate some memory to hold the mapping
  	 * - note that this may not return a page-aligned address if the object
  	 *   we're allocating is smaller than a page
  	 */
f67d9b157   Bob Liu   nommu: add page a...
1123
  	order = get_order(len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1124
  	total = 1 << order;
f67d9b157   Bob Liu   nommu: add page a...
1125
  	point = len >> PAGE_SHIFT;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1126

dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1127
  	/* we don't want to allocate a power-of-2 sized page set */
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1128
  	if (sysctl_nr_trim_pages && total - point >= sysctl_nr_trim_pages)
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1129
  		total = point;
8feae1311   David Howells   NOMMU: Make VMAs ...
1130

da616534e   Joonsoo Kim   mm/nommu: fix mem...
1131
  	base = alloc_pages_exact(total << PAGE_SHIFT, GFP_KERNEL);
dbc8358c7   Joonsoo Kim   mm/nommu: use all...
1132
1133
1134
1135
  	if (!base)
  		goto enomem;
  
  	atomic_long_add(total, &mmap_pages_allocated);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1136

8feae1311   David Howells   NOMMU: Make VMAs ...
1137
1138
  	region->vm_flags = vma->vm_flags |= VM_MAPPED_COPY;
  	region->vm_start = (unsigned long) base;
f67d9b157   Bob Liu   nommu: add page a...
1139
  	region->vm_end   = region->vm_start + len;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1140
  	region->vm_top   = region->vm_start + (total << PAGE_SHIFT);
8feae1311   David Howells   NOMMU: Make VMAs ...
1141
1142
1143
  
  	vma->vm_start = region->vm_start;
  	vma->vm_end   = region->vm_start + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
  
  	if (vma->vm_file) {
  		/* read the contents of a file into the copy */
  		mm_segment_t old_fs;
  		loff_t fpos;
  
  		fpos = vma->vm_pgoff;
  		fpos <<= PAGE_SHIFT;
  
  		old_fs = get_fs();
  		set_fs(KERNEL_DS);
6e242a1ce   Al Viro   nommu: use __vfs_...
1155
  		ret = __vfs_read(vma->vm_file, base, len, &fpos);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1156
1157
1158
1159
1160
1161
  		set_fs(old_fs);
  
  		if (ret < 0)
  			goto error_free;
  
  		/* clear the last little bit */
f67d9b157   Bob Liu   nommu: add page a...
1162
1163
  		if (ret < len)
  			memset(base + ret, 0, len - ret);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1164

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1165
1166
1167
1168
1169
  	}
  
  	return 0;
  
  error_free:
7223bb4a8   Namhyung Kim   mm: nommu: fix a ...
1170
  	free_page_series(region->vm_start, region->vm_top);
8feae1311   David Howells   NOMMU: Make VMAs ...
1171
1172
  	region->vm_start = vma->vm_start = 0;
  	region->vm_end   = vma->vm_end = 0;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1173
  	region->vm_top   = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1174
1175
1176
  	return ret;
  
  enomem:
b1de0d139   Mitchel Humpherys   mm: convert some ...
1177
1178
  	pr_err("Allocation of length %lu from process %d (%s) failed
  ",
05ae6fa31   Greg Ungerer   uclinux: add proc...
1179
  	       len, current->pid, current->comm);
7bf02ea22   David Rientjes   arch, mm: filter ...
1180
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1181
1182
1183
1184
1185
1186
  	return -ENOMEM;
  }
  
  /*
   * handle mapping creation for uClinux
   */
e3fc629d7   Al Viro   switch aio and sh...
1187
  unsigned long do_mmap_pgoff(struct file *file,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1188
1189
1190
1191
  			    unsigned long addr,
  			    unsigned long len,
  			    unsigned long prot,
  			    unsigned long flags,
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1192
  			    unsigned long pgoff,
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1193
  			    unsigned long *populate)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1194
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1195
1196
  	struct vm_area_struct *vma;
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1197
  	struct rb_node *rb;
8feae1311   David Howells   NOMMU: Make VMAs ...
1198
  	unsigned long capabilities, vm_flags, result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1199
  	int ret;
41badc15c   Michel Lespinasse   mm: make do_mmap_...
1200
  	*populate = 0;
bebeb3d68   Michel Lespinasse   mm: introduce mm_...
1201

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1202
1203
1204
1205
  	/* decide whether we should attempt the mapping, and if so what sort of
  	 * mapping */
  	ret = validate_mmap_request(file, addr, len, prot, flags, pgoff,
  				    &capabilities);
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1206
  	if (ret < 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1207
  		return ret;
06aab5a30   David Howells   NOMMU: Ignore mma...
1208
1209
  	/* we ignore the address hint */
  	addr = 0;
f67d9b157   Bob Liu   nommu: add page a...
1210
  	len = PAGE_ALIGN(len);
06aab5a30   David Howells   NOMMU: Ignore mma...
1211

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1212
1213
1214
  	/* we've determined that we can make the mapping, now translate what we
  	 * now know into VMA flags */
  	vm_flags = determine_vm_flags(file, prot, flags, capabilities);
8feae1311   David Howells   NOMMU: Make VMAs ...
1215
1216
1217
1218
1219
1220
1221
1222
  	/* we're going to need to record the mapping */
  	region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		goto error_getting_region;
  
  	vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
  	if (!vma)
  		goto error_getting_vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1223

1e2ae599d   David Howells   nommu: struct vm_...
1224
  	region->vm_usage = 1;
8feae1311   David Howells   NOMMU: Make VMAs ...
1225
1226
  	region->vm_flags = vm_flags;
  	region->vm_pgoff = pgoff;
5beb49305   Rik van Riel   mm: change anon_v...
1227
  	INIT_LIST_HEAD(&vma->anon_vma_chain);
8feae1311   David Howells   NOMMU: Make VMAs ...
1228
1229
  	vma->vm_flags = vm_flags;
  	vma->vm_pgoff = pgoff;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1230

8feae1311   David Howells   NOMMU: Make VMAs ...
1231
  	if (file) {
cb0942b81   Al Viro   make get_file() r...
1232
1233
  		region->vm_file = get_file(file);
  		vma->vm_file = get_file(file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1234
1235
1236
1237
1238
  	}
  
  	down_write(&nommu_region_sem);
  
  	/* if we want to share, we need to check for regions created by other
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1239
  	 * mmap() calls that overlap with our proposed mapping
8feae1311   David Howells   NOMMU: Make VMAs ...
1240
  	 * - we can only share with a superset match on most regular files
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1241
1242
1243
1244
1245
1246
  	 * - shared mappings on character devices and memory backed files are
  	 *   permitted to overlap inexactly as far as we are concerned for in
  	 *   these cases, sharing is handled in the driver or filesystem rather
  	 *   than here
  	 */
  	if (vm_flags & VM_MAYSHARE) {
8feae1311   David Howells   NOMMU: Make VMAs ...
1247
1248
  		struct vm_region *pregion;
  		unsigned long pglen, rpglen, pgend, rpgend, start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1249

8feae1311   David Howells   NOMMU: Make VMAs ...
1250
1251
  		pglen = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
  		pgend = pgoff + pglen;
165b23927   David Howells   [PATCH] NOMMU: ma...
1252

8feae1311   David Howells   NOMMU: Make VMAs ...
1253
1254
  		for (rb = rb_first(&nommu_region_tree); rb; rb = rb_next(rb)) {
  			pregion = rb_entry(rb, struct vm_region, vm_rb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1255

8feae1311   David Howells   NOMMU: Make VMAs ...
1256
  			if (!(pregion->vm_flags & VM_MAYSHARE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1257
1258
1259
  				continue;
  
  			/* search for overlapping mappings on the same file */
496ad9aa8   Al Viro   new helper: file_...
1260
1261
  			if (file_inode(pregion->vm_file) !=
  			    file_inode(file))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1262
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1263
  			if (pregion->vm_pgoff >= pgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1264
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1265
1266
1267
1268
  			rpglen = pregion->vm_end - pregion->vm_start;
  			rpglen = (rpglen + PAGE_SIZE - 1) >> PAGE_SHIFT;
  			rpgend = pregion->vm_pgoff + rpglen;
  			if (pgoff >= rpgend)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1269
  				continue;
8feae1311   David Howells   NOMMU: Make VMAs ...
1270
1271
1272
1273
1274
  			/* handle inexactly overlapping matches between
  			 * mappings */
  			if ((pregion->vm_pgoff != pgoff || rpglen != pglen) &&
  			    !(pgoff >= pregion->vm_pgoff && pgend <= rpgend)) {
  				/* new mapping is not a subset of the region */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1275
  				if (!(capabilities & NOMMU_MAP_DIRECT))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1276
1277
1278
  					goto sharing_violation;
  				continue;
  			}
8feae1311   David Howells   NOMMU: Make VMAs ...
1279
  			/* we've found a region we can share */
1e2ae599d   David Howells   nommu: struct vm_...
1280
  			pregion->vm_usage++;
8feae1311   David Howells   NOMMU: Make VMAs ...
1281
1282
1283
1284
1285
  			vma->vm_region = pregion;
  			start = pregion->vm_start;
  			start += (pgoff - pregion->vm_pgoff) << PAGE_SHIFT;
  			vma->vm_start = start;
  			vma->vm_end = start + len;
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1286
  			if (pregion->vm_flags & VM_MAPPED_COPY)
8feae1311   David Howells   NOMMU: Make VMAs ...
1287
  				vma->vm_flags |= VM_MAPPED_COPY;
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1288
  			else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1289
1290
1291
1292
1293
  				ret = do_mmap_shared_file(vma);
  				if (ret < 0) {
  					vma->vm_region = NULL;
  					vma->vm_start = 0;
  					vma->vm_end = 0;
1e2ae599d   David Howells   nommu: struct vm_...
1294
  					pregion->vm_usage--;
8feae1311   David Howells   NOMMU: Make VMAs ...
1295
1296
1297
1298
1299
1300
1301
1302
1303
  					pregion = NULL;
  					goto error_just_free;
  				}
  			}
  			fput(region->vm_file);
  			kmem_cache_free(vm_region_jar, region);
  			region = pregion;
  			result = start;
  			goto share;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1304
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1305
1306
1307
1308
  		/* obtain the address at which to make a shared mapping
  		 * - this is the hook for quasi-memory character devices to
  		 *   tell us the location of a shared mapping
  		 */
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1309
  		if (capabilities & NOMMU_MAP_DIRECT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1310
1311
  			addr = file->f_op->get_unmapped_area(file, addr, len,
  							     pgoff, flags);
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1312
  			if (IS_ERR_VALUE(addr)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1313
  				ret = addr;
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1314
  				if (ret != -ENOSYS)
8feae1311   David Howells   NOMMU: Make VMAs ...
1315
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1316
1317
1318
1319
  
  				/* the driver refused to tell us where to site
  				 * the mapping so we'll have to attempt to copy
  				 * it */
bb005a59e   Namhyung Kim   mm: nommu: fix a ...
1320
  				ret = -ENODEV;
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1321
  				if (!(capabilities & NOMMU_MAP_COPY))
8feae1311   David Howells   NOMMU: Make VMAs ...
1322
  					goto error_just_free;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1323

b4caecd48   Christoph Hellwig   fs: introduce f_o...
1324
  				capabilities &= ~NOMMU_MAP_DIRECT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1325
1326
1327
  			} else {
  				vma->vm_start = region->vm_start = addr;
  				vma->vm_end = region->vm_end = addr + len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1328
1329
1330
  			}
  		}
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1331
  	vma->vm_region = region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1332

645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1333
  	/* set up the mapping
b4caecd48   Christoph Hellwig   fs: introduce f_o...
1334
  	 * - the region is filled in if NOMMU_MAP_DIRECT is still set
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1335
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1336
  	if (file && vma->vm_flags & VM_SHARED)
8feae1311   David Howells   NOMMU: Make VMAs ...
1337
  		ret = do_mmap_shared_file(vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1338
  	else
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1339
  		ret = do_mmap_private(vma, region, len, capabilities);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1340
  	if (ret < 0)
645d83c5d   David Howells   NOMMU: Fix MAP_PR...
1341
1342
  		goto error_just_free;
  	add_nommu_region(region);
8feae1311   David Howells   NOMMU: Make VMAs ...
1343

ea6376395   Jie Zhang   nommu: fix malloc...
1344
1345
1346
1347
  	/* clear anonymous mappings that don't ask for uninitialized data */
  	if (!vma->vm_file && !(flags & MAP_UNINITIALIZED))
  		memset((void *)region->vm_start, 0,
  		       region->vm_end - region->vm_start);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1348
  	/* okay... we have a mapping; now we have to register it */
8feae1311   David Howells   NOMMU: Make VMAs ...
1349
  	result = vma->vm_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1350

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1351
  	current->mm->total_vm += len >> PAGE_SHIFT;
8feae1311   David Howells   NOMMU: Make VMAs ...
1352
1353
  share:
  	add_vma_to_mm(current->mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1354

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1355
1356
1357
1358
1359
1360
  	/* we flush the region from the icache only when the first executable
  	 * mapping of it is made  */
  	if (vma->vm_flags & VM_EXEC && !region->vm_icache_flushed) {
  		flush_icache_range(region->vm_start, region->vm_end);
  		region->vm_icache_flushed = true;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1361

cfe79c00a   Mike Frysinger   NOMMU: Avoiding d...
1362
  	up_write(&nommu_region_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1363

8feae1311   David Howells   NOMMU: Make VMAs ...
1364
  	return result;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1365

8feae1311   David Howells   NOMMU: Make VMAs ...
1366
1367
1368
  error_just_free:
  	up_write(&nommu_region_sem);
  error:
89a864027   David Howells   NOMMU: Don't pass...
1369
1370
  	if (region->vm_file)
  		fput(region->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1371
  	kmem_cache_free(vm_region_jar, region);
89a864027   David Howells   NOMMU: Don't pass...
1372
1373
  	if (vma->vm_file)
  		fput(vma->vm_file);
8feae1311   David Howells   NOMMU: Make VMAs ...
1374
  	kmem_cache_free(vm_area_cachep, vma);
8feae1311   David Howells   NOMMU: Make VMAs ...
1375
1376
1377
1378
  	return ret;
  
  sharing_violation:
  	up_write(&nommu_region_sem);
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1379
1380
  	pr_warn("Attempt to share mismatched mappings
  ");
8feae1311   David Howells   NOMMU: Make VMAs ...
1381
1382
  	ret = -EINVAL;
  	goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1383

8feae1311   David Howells   NOMMU: Make VMAs ...
1384
1385
  error_getting_vma:
  	kmem_cache_free(vm_region_jar, region);
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1386
1387
1388
  	pr_warn("Allocation of vma for %lu byte allocation from process %d failed
  ",
  			len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1389
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1390
  	return -ENOMEM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1391
  error_getting_region:
22cc877b3   Leon Romanovsky   mm: nommu: refact...
1392
1393
1394
  	pr_warn("Allocation of vm region for %lu byte allocation from process %d failed
  ",
  			len, current->pid);
7bf02ea22   David Rientjes   arch, mm: filter ...
1395
  	show_free_areas(0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1396
1397
  	return -ENOMEM;
  }
6be5ceb02   Linus Torvalds   VM: add "vm_mmap(...
1398

66f0dc481   Hugh Dickins   mm: move sys_mmap...
1399
1400
1401
1402
1403
1404
  /*
   * mmap_pgoff() system call: resolve the file descriptor (unless the mapping
   * is anonymous) and hand the request over to vm_mmap_pgoff().
   *
   * Returns whatever vm_mmap_pgoff() returns, or -EBADF if a file-backed
   * mapping was requested and fget() could not resolve 'fd'.
   */
  SYSCALL_DEFINE6(mmap_pgoff, unsigned long, addr, unsigned long, len,
  		unsigned long, prot, unsigned long, flags,
  		unsigned long, fd, unsigned long, pgoff)
  {
  	struct file *backing = NULL;
  	unsigned long mapped;

  	audit_mmap_fd(fd, flags);

  	/* only non-anonymous mappings need a file reference */
  	if ((flags & MAP_ANONYMOUS) == 0) {
  		backing = fget(fd);
  		if (backing == NULL)
  			return -EBADF;
  	}

  	/* these two flags are stripped before the request is passed on */
  	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);

  	mapped = vm_mmap_pgoff(backing, addr, len, prot, flags, pgoff);

  	/* drop the reference taken by fget() above */
  	if (backing != NULL)
  		fput(backing);

  	return mapped;
  }
a4679373c   Christoph Hellwig   Add generic sys_o...
1420
1421
1422
1423
1424
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
  #ifdef __ARCH_WANT_SYS_OLD_MMAP
  /*
   * Argument block read from userspace by the old_mmap() system call; the
   * fields are forwarded, in this order, to sys_mmap_pgoff().
   */
  struct mmap_arg_struct {
  	unsigned long addr;
  	unsigned long len;
  	unsigned long prot;
  	unsigned long flags;
  	unsigned long fd;
  	unsigned long offset;	/* in bytes; old_mmap() requires page alignment */
  };
  
  /*
   * old_mmap() system call: fetch the packed argument block from userspace
   * and forward it to sys_mmap_pgoff(), converting the byte offset to pages.
   *
   * Returns -EFAULT if the block cannot be copied in, -EINVAL if the offset
   * is not page aligned, otherwise the result of sys_mmap_pgoff().
   */
  SYSCALL_DEFINE1(old_mmap, struct mmap_arg_struct __user *, arg)
  {
  	struct mmap_arg_struct args;
  	unsigned long pgoff;

  	if (copy_from_user(&args, arg, sizeof(args)) != 0)
  		return -EFAULT;

  	/* the byte offset has to sit on a page boundary */
  	if ((args.offset & ~PAGE_MASK) != 0)
  		return -EINVAL;

  	pgoff = args.offset >> PAGE_SHIFT;

  	return sys_mmap_pgoff(args.addr, args.len, args.prot, args.flags,
  			      args.fd, pgoff);
  }
  #endif /* __ARCH_WANT_SYS_OLD_MMAP */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1443
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1444
1445
   * split a vma into two pieces at address 'addr', a new vma is allocated either
   * for the first part or the tail.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1446
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1447
1448
  int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
  	      unsigned long addr, int new_below)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1449
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1450
1451
1452
  	struct vm_area_struct *new;
  	struct vm_region *region;
  	unsigned long npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1453

779c10232   David Howells   nommu: remove a s...
1454
1455
1456
  	/* we're only permitted to split anonymous regions (these should have
  	 * only a single usage on the region) */
  	if (vma->vm_file)
8feae1311   David Howells   NOMMU: Make VMAs ...
1457
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1458

8feae1311   David Howells   NOMMU: Make VMAs ...
1459
1460
  	if (mm->map_count >= sysctl_max_map_count)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1461

8feae1311   David Howells   NOMMU: Make VMAs ...
1462
1463
1464
  	region = kmem_cache_alloc(vm_region_jar, GFP_KERNEL);
  	if (!region)
  		return -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1465

8feae1311   David Howells   NOMMU: Make VMAs ...
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
  	new = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
  	if (!new) {
  		kmem_cache_free(vm_region_jar, region);
  		return -ENOMEM;
  	}
  
  	/* most fields are the same, copy all, and then fixup */
  	*new = *vma;
  	*region = *vma->vm_region;
  	new->vm_region = region;
  
  	npages = (addr - vma->vm_start) >> PAGE_SHIFT;
  
  	if (new_below) {
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1480
  		region->vm_top = region->vm_end = new->vm_end = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1481
1482
1483
  	} else {
  		region->vm_start = new->vm_start = addr;
  		region->vm_pgoff = new->vm_pgoff += npages;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1484
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
  
  	if (new->vm_ops && new->vm_ops->open)
  		new->vm_ops->open(new);
  
  	delete_vma_from_mm(vma);
  	down_write(&nommu_region_sem);
  	delete_nommu_region(vma->vm_region);
  	if (new_below) {
  		vma->vm_region->vm_start = vma->vm_start = addr;
  		vma->vm_region->vm_pgoff = vma->vm_pgoff += npages;
  	} else {
  		vma->vm_region->vm_end = vma->vm_end = addr;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1497
  		vma->vm_region->vm_top = addr;
8feae1311   David Howells   NOMMU: Make VMAs ...
1498
1499
1500
1501
1502
1503
1504
  	}
  	add_nommu_region(vma->vm_region);
  	add_nommu_region(new->vm_region);
  	up_write(&nommu_region_sem);
  	add_vma_to_mm(mm, vma);
  	add_vma_to_mm(mm, new);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1505
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1506
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1507
1508
   * shrink a VMA by removing the specified chunk from either the beginning or
   * the end
3034097a5   David Howells   [PATCH] NOMMU: Or...
1509
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1510
1511
1512
  static int shrink_vma(struct mm_struct *mm,
  		      struct vm_area_struct *vma,
  		      unsigned long from, unsigned long to)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1513
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1514
  	struct vm_region *region;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1515

8feae1311   David Howells   NOMMU: Make VMAs ...
1516
1517
1518
1519
1520
1521
1522
1523
  	/* adjust the VMA's pointers, which may reposition it in the MM's tree
  	 * and list */
  	delete_vma_from_mm(vma);
  	if (from > vma->vm_start)
  		vma->vm_end = from;
  	else
  		vma->vm_start = to;
  	add_vma_to_mm(mm, vma);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1524

8feae1311   David Howells   NOMMU: Make VMAs ...
1525
1526
  	/* cut the backing region down to size */
  	region = vma->vm_region;
1e2ae599d   David Howells   nommu: struct vm_...
1527
  	BUG_ON(region->vm_usage != 1);
8feae1311   David Howells   NOMMU: Make VMAs ...
1528
1529
1530
  
  	down_write(&nommu_region_sem);
  	delete_nommu_region(region);
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1531
1532
1533
1534
  	if (from > region->vm_start) {
  		to = region->vm_top;
  		region->vm_top = region->vm_end = from;
  	} else {
8feae1311   David Howells   NOMMU: Make VMAs ...
1535
  		region->vm_start = to;
dd8632a12   Paul Mundt   NOMMU: Make mmap ...
1536
  	}
8feae1311   David Howells   NOMMU: Make VMAs ...
1537
1538
1539
1540
1541
1542
  	add_nommu_region(region);
  	up_write(&nommu_region_sem);
  
  	free_page_series(from, to);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1543

8feae1311   David Howells   NOMMU: Make VMAs ...
1544
1545
1546
1547
1548
1549
1550
1551
  /*
   * release a mapping
   * - under NOMMU conditions the chunk to be unmapped must be backed by a single
   *   VMA, though it need not cover the whole VMA
   * - 'len' is rounded up to a whole number of pages before use
   * - returns 0 on success; -EINVAL if the length is zero, the range wraps
   *   around the end of the address space, no suitable VMA is found or the
   *   range is not acceptable for the VMA; or the error from split_vma()
   */
  int do_munmap(struct mm_struct *mm, unsigned long start, size_t len)
  {
  	struct vm_area_struct *vma;
  	unsigned long end;
  	int ret;

  	len = PAGE_ALIGN(len);
  	if (len == 0)
  		return -EINVAL;

  	end = start + len;

  	/* a range that wraps round the top of the address space cannot be
  	 * backed by any VMA; without this check a wrapped 'end' would pass
  	 * the subset tests below and be written into the VMA's bounds */
  	if (end < start)
  		return -EINVAL;

  	/* find the first potentially overlapping VMA */
  	vma = find_vma(mm, start);
  	if (!vma) {
  		/* only complain the first few times this happens */
  		static int limit;
  		if (limit < 5) {
  			pr_warn("munmap of memory not mmapped by process %d (%s): 0x%lx-0x%lx\n",
  					current->pid, current->comm,
  					start, end - 1);
  			limit++;
  		}
  		return -EINVAL;
  	}

  	/* we're allowed to split an anonymous VMA but not a file-backed one */
  	if (vma->vm_file) {
  		/* walk forward looking for a VMA that ends exactly at 'end' */
  		do {
  			if (start > vma->vm_start)
  				return -EINVAL;
  			if (end == vma->vm_end)
  				goto erase_whole_vma;
  			vma = vma->vm_next;
  		} while (vma);
  		return -EINVAL;
  	} else {
  		/* the chunk must be a subset of the VMA found */
  		if (start == vma->vm_start && end == vma->vm_end)
  			goto erase_whole_vma;
  		if (start < vma->vm_start || end > vma->vm_end)
  			return -EINVAL;
  		if (start & ~PAGE_MASK)
  			return -EINVAL;
  		if (end != vma->vm_end && end & ~PAGE_MASK)
  			return -EINVAL;
  		/* a hole in the middle: split first so that the chunk sits
  		 * at one end of the VMA that is then shrunk */
  		if (start != vma->vm_start && end != vma->vm_end) {
  			ret = split_vma(mm, vma, start, 1);
  			if (ret < 0)
  				return ret;
  		}
  		return shrink_vma(mm, vma, start, end);
  	}

  erase_whole_vma:
  	delete_vma_from_mm(vma);
  	delete_vma(mm, vma);
  	return 0;
  }
b50731732   Paul Mundt   nommu: vmalloc_32...
1607
  EXPORT_SYMBOL(do_munmap);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1608

bfce281c2   Al Viro   kill mm argument ...
1609
  /*
   * Unmap [addr, addr + len) from the current process, taking the mm's
   * mmap_sem for writing around the call to do_munmap().
   *
   * Returns the result of do_munmap().
   */
  int vm_munmap(unsigned long addr, size_t len)
  {
  	struct mm_struct *mm = current->mm;
  	int err;

  	down_write(&mm->mmap_sem);
  	err = do_munmap(mm, addr, len);
  	up_write(&mm->mmap_sem);

  	return err;
  }
a46ef99d8   Linus Torvalds   VM: add "vm_munma...
1619
1620
1621
1622
  EXPORT_SYMBOL(vm_munmap);
  
  /* munmap() system call: a direct wrapper that returns vm_munmap()'s result */
  SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
  {
bfce281c2   Al Viro   kill mm argument ...
1623
  	return vm_munmap(addr, len);
a46ef99d8   Linus Torvalds   VM: add "vm_munma...
1624
  }
3034097a5   David Howells   [PATCH] NOMMU: Or...
1625
1626
  
  /*
8feae1311   David Howells   NOMMU: Make VMAs ...
1627
   * release all the mappings made in a process's VM space
3034097a5   David Howells   [PATCH] NOMMU: Or...
1628
   */
8feae1311   David Howells   NOMMU: Make VMAs ...
1629
  void exit_mmap(struct mm_struct *mm)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1630
  {
8feae1311   David Howells   NOMMU: Make VMAs ...
1631
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1632

8feae1311   David Howells   NOMMU: Make VMAs ...
1633
1634
  	if (!mm)
  		return;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1635

8feae1311   David Howells   NOMMU: Make VMAs ...
1636
  	mm->total_vm = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1637

8feae1311   David Howells   NOMMU: Make VMAs ...
1638
1639
1640
1641
  	while ((vma = mm->mmap)) {
  		mm->mmap = vma->vm_next;
  		delete_vma_from_mm(vma);
  		delete_vma(mm, vma);
04c349615   Steven J. Magnani   nommu: yield CPU ...
1642
  		cond_resched();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1643
1644
  	}
  }
e4eb1ff61   Linus Torvalds   VM: add "vm_brk()...
1645
  /* stub: ignores both arguments and always returns -ENOMEM */
  unsigned long vm_brk(unsigned long addr, unsigned long len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1646
1647
1648
1649
1650
  {
  	return -ENOMEM;
  }
  
  /*
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1651
1652
   * expand (or shrink) an existing mapping, potentially moving it at the same
   * time (controlled by the MREMAP_MAYMOVE flag and available VM space)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1653
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1654
   * under NOMMU conditions, we only permit changing a mapping's size, and only
8feae1311   David Howells   NOMMU: Make VMAs ...
1655
1656
   * as long as it stays within the region allocated by do_mmap_private() and the
   * block is not shareable
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1657
   *
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1658
   * MREMAP_FIXED is not supported under NOMMU conditions
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1659
   */
4b377bab2   Al Viro   make do_mremap() ...
1660
  static unsigned long do_mremap(unsigned long addr,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1661
1662
1663
  			unsigned long old_len, unsigned long new_len,
  			unsigned long flags, unsigned long new_addr)
  {
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1664
  	struct vm_area_struct *vma;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1665
1666
  
  	/* insanity checks first */
f67d9b157   Bob Liu   nommu: add page a...
1667
1668
  	old_len = PAGE_ALIGN(old_len);
  	new_len = PAGE_ALIGN(new_len);
8feae1311   David Howells   NOMMU: Make VMAs ...
1669
  	if (old_len == 0 || new_len == 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1670
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1671
1672
  	if (addr & ~PAGE_MASK)
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1673
1674
  	if (flags & MREMAP_FIXED && new_addr != addr)
  		return (unsigned long) -EINVAL;
8feae1311   David Howells   NOMMU: Make VMAs ...
1675
  	vma = find_vma_exact(current->mm, addr, old_len);
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1676
1677
  	if (!vma)
  		return (unsigned long) -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1678

6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1679
  	if (vma->vm_end != vma->vm_start + old_len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1680
  		return (unsigned long) -EFAULT;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1681
  	if (vma->vm_flags & VM_MAYSHARE)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1682
  		return (unsigned long) -EPERM;
8feae1311   David Howells   NOMMU: Make VMAs ...
1683
  	if (new_len > vma->vm_region->vm_end - vma->vm_region->vm_start)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1684
1685
1686
  		return (unsigned long) -ENOMEM;
  
  	/* all checks complete - do it */
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1687
  	vma->vm_end = vma->vm_start + new_len;
6fa5f80bc   David Howells   [PATCH] NOMMU: Ma...
1688
1689
  	return vma->vm_start;
  }
6a6160a7b   Heiko Carstens   [CVE-2009-0029] S...
1690
1691
1692
  /*
   * mremap() system call: run do_mremap() with the current mm's mmap_sem
   * held for writing and return its result.
   */
  SYSCALL_DEFINE5(mremap, unsigned long, addr, unsigned long, old_len,
  		unsigned long, new_len, unsigned long, flags,
  		unsigned long, new_addr)
  {
  	struct mm_struct *mm = current->mm;
  	unsigned long result;

  	down_write(&mm->mmap_sem);
  	result = do_mremap(addr, old_len, new_len, flags, new_addr);
  	up_write(&mm->mmap_sem);

  	return result;
  }
240aadeed   Michel Lespinasse   mm: accelerate mm...
1701
1702
1703
  /*
   * stub: clears *page_mask and returns NULL without looking at 'vma',
   * 'address' or 'flags'
   */
  struct page *follow_page_mask(struct vm_area_struct *vma,
  			      unsigned long address, unsigned int flags,
  			      unsigned int *page_mask)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1704
  {
240aadeed   Michel Lespinasse   mm: accelerate mm...
1705
  	*page_mask = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1706
1707
  	return NULL;
  }
8f3b1327a   Bob Liu   mm/nommu.c: fix r...
1708
1709
  /*
   * Nothing is actually remapped here: the request is accepted only when
   * 'addr' already equals the address of 'pfn', in which case the VMA is
   * flagged as an I/O / PFN mapping.  'size' and 'prot' are not used.
   *
   * Returns 0 on success or -EINVAL if the addresses differ.
   */
  int remap_pfn_range(struct vm_area_struct *vma, unsigned long addr,
  		unsigned long pfn, unsigned long size, pgprot_t prot)
  {
  	const unsigned long target = pfn << PAGE_SHIFT;

  	if (addr == target) {
  		vma->vm_flags |= VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_DONTDUMP;
  		return 0;
  	}

  	return -EINVAL;
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1716
  EXPORT_SYMBOL(remap_pfn_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1717

3c0b9de6d   Linus Torvalds   vm: add no-mmu vm...
1718
1719
1720
1721
1722
1723
1724
1725
1726
  /*
   * Map the whole of 'vma' onto the memory starting at 'start', offset by
   * the VMA's page offset, via io_remap_pfn_range().  'len' is not used.
   *
   * Returns the result of io_remap_pfn_range().
   */
  int vm_iomap_memory(struct vm_area_struct *vma, phys_addr_t start, unsigned long len)
  {
  	const unsigned long span = vma->vm_end - vma->vm_start;
  	const unsigned long first_pfn =
  		(unsigned long)(start >> PAGE_SHIFT) + vma->vm_pgoff;

  	return io_remap_pfn_range(vma, vma->vm_start, first_pfn, span,
  				  vma->vm_page_prot);
  }
  EXPORT_SYMBOL(vm_iomap_memory);
f905bc447   Paul Mundt   nommu: add new vm...
1727
1728
1729
1730
1731
1732
1733
1734
1735
1736
1737
1738
1739
1740
  /*
   * Point 'vma' at the memory located 'pgoff' pages into the area at 'addr',
   * keeping the VMA's length unchanged.
   *
   * Returns 0 on success or -EINVAL if the VMA does not have VM_USERMAP set.
   */
  int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
  			unsigned long pgoff)
  {
  	/* vm_start/vm_end are unsigned long; keep the length that wide so
  	 * that it is not truncated where long is wider than int */
  	unsigned long size = vma->vm_end - vma->vm_start;

  	if (!(vma->vm_flags & VM_USERMAP))
  		return -EINVAL;

  	vma->vm_start = (unsigned long)(addr + (pgoff << PAGE_SHIFT));
  	vma->vm_end = vma->vm_start + size;

  	return 0;
  }
  EXPORT_SYMBOL(remap_vmalloc_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1741
1742
1743
1744
1745
  /* stub: ignores all of its arguments and always returns -ENOMEM */
  unsigned long arch_get_unmapped_area(struct file *file, unsigned long addr,
  	unsigned long len, unsigned long pgoff, unsigned long flags)
  {
  	return -ENOMEM;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1746
1747
1748
1749
1750
  /* stub: intentionally empty, none of the arguments are used */
  void unmap_mapping_range(struct address_space *mapping,
  			 loff_t const holebegin, loff_t const holelen,
  			 int even_cows)
  {
  }
22c4af409   Luke Yang   [PATCH] nommu: ex...
1751
  EXPORT_SYMBOL(unmap_mapping_range);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1752
1753
1754
1755
1756
1757
1758
1759
1760
1761
1762
1763
1764
1765
1766
1767
1768
  
  /*
   * Check that a process has enough memory to allocate a new virtual
   * mapping. 0 means there is enough memory for the allocation to
   * succeed and -ENOMEM implies there is not.
   *
   * We currently support three overcommit policies, which are set via the
   * vm.overcommit_memory sysctl.  See Documentation/vm/overcommit-accounting
   *
   * Strict overcommit modes added 2002 Feb 26 by Alan Cox.
   * Additional code 2002 Jul 20 by Robert Love.
   *
   * cap_sys_admin is 1 if the process has admin privileges, 0 otherwise.
   *
   * Note this is a helper function intended to be used by LSMs which
   * wish to use this logic.
   */
34b4e4aa3   Alan Cox   fix NULL pointer ...
1769
  int __vm_enough_memory(struct mm_struct *mm, long pages, int cap_sys_admin)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1770
  {
8138a67a5   Roman Gushchin   mm/nommu.c: fix a...
1771
  	long free, allowed, reserve;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1772
1773
1774
1775
1776
1777
1778
1779
1780
1781
  
  	vm_acct_memory(pages);
  
  	/*
  	 * Sometimes we want to use more memory than we have
  	 */
  	if (sysctl_overcommit_memory == OVERCOMMIT_ALWAYS)
  		return 0;
  
  	if (sysctl_overcommit_memory == OVERCOMMIT_GUESS) {
c15bef309   Dmitry Fink   mmap: fix and tid...
1782
1783
1784
1785
1786
1787
1788
1789
1790
1791
  		free = global_page_state(NR_FREE_PAGES);
  		free += global_page_state(NR_FILE_PAGES);
  
  		/*
  		 * shmem pages shouldn't be counted as free in this
  		 * case, they can't be purged, only swapped out, and
  		 * that won't affect the overall amount of available
  		 * memory in the system.
  		 */
  		free -= global_page_state(NR_SHMEM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1792

ec8acf20a   Shaohua Li   swap: add per-par...
1793
  		free += get_nr_swap_pages();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1794
1795
1796
1797
1798
1799
1800
  
  		/*
  		 * Any slabs which are created with the
  		 * SLAB_RECLAIM_ACCOUNT flag claim to have contents
  		 * which are reclaimable, under pressure.  The dentry
  		 * cache and most inode caches should fall into this
  		 */
972d1a7b1   Christoph Lameter   [PATCH] ZVC: Supp...
1801
  		free += global_page_state(NR_SLAB_RECLAIMABLE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1802
1803
  
  		/*
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1804
1805
  		 * Leave reserved pages. The pages are not for anonymous pages.
  		 */
c15bef309   Dmitry Fink   mmap: fix and tid...
1806
  		if (free <= totalreserve_pages)
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1807
1808
  			goto error;
  		else
c15bef309   Dmitry Fink   mmap: fix and tid...
1809
  			free -= totalreserve_pages;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1810
1811
  
  		/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1812
  		 * Reserve some for root
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1813
  		 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1814
  		if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1815
  			free -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1816
1817
1818
  
  		if (free > pages)
  			return 0;
d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1819
1820
  
  		goto error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1821
  	}
00619bcc4   Jerome Marchand   mm: factor commit...
1822
  	allowed = vm_commit_limit();
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1823
  	/*
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1824
  	 * Reserve some 3% for root
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1825
1826
  	 */
  	if (!cap_sys_admin)
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
1827
  		allowed -= sysctl_admin_reserve_kbytes >> (PAGE_SHIFT - 10);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1828

c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1829
1830
1831
1832
1833
  	/*
  	 * Don't let a single process grow so big a user can't recover
  	 */
  	if (mm) {
  		reserve = sysctl_user_reserve_kbytes >> (PAGE_SHIFT - 10);
8138a67a5   Roman Gushchin   mm/nommu.c: fix a...
1834
  		allowed -= min_t(long, mm->total_vm / 32, reserve);
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1835
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1836

00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1837
  	if (percpu_counter_read_positive(&vm_committed_as) < allowed)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1838
  		return 0;
00a62ce91   KOSAKI Motohiro   mm: fix Committed...
1839

d5ddc79bc   Hideo AOKI   [PATCH] overcommi...
1840
  error:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1841
1842
1843
1844
  	vm_unacct_memory(pages);
  
  	return -ENOMEM;
  }
d0217ac04   Nick Piggin   mm: fault feedbac...
1845
  /*
   * Stub for kernels built without an MMU: this entry point must never be
   * called, so reaching it traps with BUG().  The return statement exists only
   * to satisfy the function's int return type.
   */
  int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();

  	return 0;
  }
  EXPORT_SYMBOL(filemap_fault);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1851

f1820361f   Kirill A. Shutemov   mm: implement ->m...
1852
1853
1854
1855
1856
  /*
   * Stub for kernels built without an MMU: this entry point must never be
   * called, so reaching it traps with BUG().
   */
  void filemap_map_pages(struct vm_area_struct *vma, struct vm_fault *vmf)
  {
  	BUG();
  }
  EXPORT_SYMBOL(filemap_map_pages);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1857
1858
  static int __access_remote_vm(struct task_struct *tsk, struct mm_struct *mm,
  		unsigned long addr, void *buf, int len, int write)
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1859
  {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1860
  	struct vm_area_struct *vma;
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1861
1862
1863
1864
  
  	down_read(&mm->mmap_sem);
  
  	/* the access must start within one of the target process's mappings */
0159b141d   David Howells   [PATCH] NOMMU: Us...
1865
1866
  	vma = find_vma(mm, addr);
  	if (vma) {
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1867
1868
1869
1870
1871
  		/* don't overrun this mapping */
  		if (addr + len >= vma->vm_end)
  			len = vma->vm_end - addr;
  
  		/* only read or write mappings where it is permitted */
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1872
  		if (write && vma->vm_flags & VM_MAYWRITE)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1873
1874
  			copy_to_user_page(vma, NULL, addr,
  					 (void *) addr, buf, len);
d00c7b993   David Howells   [PATCH] NOMMU: Pe...
1875
  		else if (!write && vma->vm_flags & VM_MAYREAD)
7959722b9   Jie Zhang   NOMMU: Use copy_*...
1876
1877
  			copy_from_user_page(vma, NULL, addr,
  					    buf, (void *) addr, len);
0ec76a110   David Howells   [PATCH] NOMMU: Ch...
1878
1879
1880
1881
1882
1883
1884
  		else
  			len = 0;
  	} else {
  		len = 0;
  	}
  
  	up_read(&mm->mmap_sem);
f55f199b7   Mike Frysinger   NOMMU: implement ...
1885
1886
1887
1888
1889
1890
1891
1892
1893
1894
1895
1896
1897
1898
1899
1900
1901
1902
1903
1904
1905
1906
1907
1908
1909
1910
1911
1912
1913
1914
1915
1916
1917
1918
1919
1920
  
  	return len;
  }
  
  /**
   * access_remote_vm - access another process' address space
   * @mm:		the mm_struct of the target address space
   * @addr:	start address to access
   * @buf:	source or destination buffer
   * @len:	number of bytes to transfer
   * @write:	whether the access is a write
   *
   * The caller must hold a reference on @mm.
   *
   * Return: whatever __access_remote_vm() reports for the transfer, i.e. the
   * number of bytes transferred (possibly 0).
   */
  int access_remote_vm(struct mm_struct *mm, unsigned long addr,
  		void *buf, int len, int write)
  {
  	int copied;

  	/* no task is associated with this access, hence the NULL */
  	copied = __access_remote_vm(NULL, mm, addr, buf, len, write);

  	return copied;
  }
  
  /*
   * Access the address space of the process @tsk.
   * - the source/target buffer @buf must be in kernel space
   * - a reference on the task's mm is taken for the duration of the transfer
   *   and dropped again before returning
   *
   * Returns the number of bytes transferred; 0 if @addr + @len wraps around
   * or if get_task_mm() yields no mm for @tsk.
   */
  int access_process_vm(struct task_struct *tsk, unsigned long addr, void *buf, int len, int write)
  {
  	struct mm_struct *mm;
  	int copied = 0;

  	/* refuse a range whose end wraps past the top of the address space */
  	if (addr + len < addr)
  		return copied;

  	mm = get_task_mm(tsk);
  	if (mm) {
  		copied = __access_remote_vm(tsk, mm, addr, buf, len, write);
  		mmput(mm);
  	}

  	return copied;
  }
7e6608724   David Howells   nommu: fix shared...
1924
1925
1926
1927
1928
1929
1930
1931
1932
1933
1934
1935
1936
1937
1938
1939
  
  /**
   * nommu_shrink_inode_mappings - Shrink the shared mappings on an inode
   * @inode: The inode to check
   * @size: The current filesize of the inode
   * @newsize: The proposed filesize of the inode
   *
   * Check the shared mappings on an inode on behalf of a shrinking truncate to
   * make sure that no outstanding VMA would be broken by it, and then shrink
   * the vm_regions that extend beyond the new size so that do_mmap_pgoff()
   * doesn't automatically grant mappings that are too large.
   *
   * Runs with nommu_region_sem held for writing and the inode's i_mmap lock
   * held for reading; both are released before returning.
   *
   * Return: 0 on success, or -ETXTBSY if a shared VMA overlaps the part of the
   * file that would be cut off.
   */
  int nommu_shrink_inode_mappings(struct inode *inode, size_t size,
  				size_t newsize)
  {
  	struct vm_area_struct *vma;
  	struct vm_region *rgn;
  	pgoff_t dead_first, dead_last;
  	size_t rgn_len, rgn_file_end;
  	int ret = 0;

  	/* page range being removed from the file (the "dead zone") */
  	dead_first = newsize >> PAGE_SHIFT;
  	dead_last = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;

  	down_write(&nommu_region_sem);
  	i_mmap_lock_read(inode->i_mapping);

  	/* search for VMAs that fall within the dead zone */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap,
  				  dead_first, dead_last) {
  		/* found one - only interested if it's shared out of the page
  		 * cache */
  		if (vma->vm_flags & VM_SHARED) {
  			ret = -ETXTBSY; /* not quite true, but near enough */
  			goto out_unlock;
  		}
  	}

  	/* reduce any regions that overlap the dead zone - if in existence,
  	 * these will be pointed to by VMAs that don't overlap the dead zone
  	 *
  	 * we don't check for any regions that start beyond the EOF as there
  	 * shouldn't be any
  	 */
  	vma_interval_tree_foreach(vma, &inode->i_mapping->i_mmap, 0, ULONG_MAX) {
  		if (vma->vm_flags & VM_SHARED) {
  			rgn = vma->vm_region;
  			rgn_len = rgn->vm_top - rgn->vm_start;
  			/* file offset just past the end of the region */
  			rgn_file_end = (rgn->vm_pgoff << PAGE_SHIFT) + rgn_len;

  			if (rgn_file_end <= newsize)
  				continue;

  			/* pull the top down to the new EOF, and the end too
  			 * if it now lies above the top */
  			rgn->vm_top -= rgn_file_end - newsize;
  			if (rgn->vm_end > rgn->vm_top)
  				rgn->vm_end = rgn->vm_top;
  		}
  	}

  out_unlock:
  	i_mmap_unlock_read(inode->i_mapping);
  	up_write(&nommu_region_sem);
  	return ret;
  }
c9b1d0981   Andrew Shewmaker   mm: limit growth ...
1985
1986
1987
1988
1989
1990
1991
1992
1993
1994
1995
1996
1997
1998
1999
2000
2001
2002
2003
2004
  
  /*
   * Set the initial value of sysctl_user_reserve_kbytes.
   *
   * The reserve is intended to stop a user from starting a single memory
   * hogging process in OVERCOMMIT_NEVER mode and then being unable to recover
   * (kill the hog).
   *
   * The default is min(free memory / 32, i.e. about 3%, 128MB); 128MB is
   * enough to recover with sshd/login, bash, and top/kill.
   *
   * Always returns 0.
   */
  static int __meminit init_user_reserve(void)
  {
  	unsigned long free_kbytes;
  	unsigned long share_kbytes;
  	unsigned long cap_kbytes = 1UL << 17;	/* 128MB in kbytes */

  	/* convert the free page count into kbytes */
  	free_kbytes = global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  	share_kbytes = free_kbytes / 32;

  	sysctl_user_reserve_kbytes = min(share_kbytes, cap_kbytes);
  	return 0;
  }
  subsys_initcall(init_user_reserve);
4eeab4f55   Andrew Shewmaker   mm: replace hardc...
2006
2007
2008
2009
2010
2011
2012
2013
2014
2015
2016
2017
2018
2019
2020
2021
2022
2023
2024
2025
  
  /*
   * Set the initial value of sysctl_admin_reserve_kbytes.
   *
   * The reserve exists so that the sys admin can still log in and kill a
   * memory hogging process.
   *
   * The default is min(free memory / 32, 8MB): systems with more than 256MB
   * free reserve 8MB, enough to recover with sshd, bash, and top in
   * OVERCOMMIT_GUESS, while smaller systems reserve only about 3% of their
   * free pages.
   *
   * Always returns 0.
   */
  static int __meminit init_admin_reserve(void)
  {
  	unsigned long free_kbytes;
  	unsigned long share_kbytes;
  	unsigned long cap_kbytes = 1UL << 13;	/* 8MB in kbytes */

  	/* convert the free page count into kbytes */
  	free_kbytes = global_page_state(NR_FREE_PAGES) << (PAGE_SHIFT - 10);
  	share_kbytes = free_kbytes / 32;

  	sysctl_admin_reserve_kbytes = min(share_kbytes, cap_kbytes);
  	return 0;
  }
  subsys_initcall(init_admin_reserve);