Blame view

fs/namei.c 73 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
  /*
   *  linux/fs/namei.c
   *
   *  Copyright (C) 1991, 1992  Linus Torvalds
   */
  
  /*
   * Some corrections by tytso.
   */
  
  /* [Feb 1997 T. Schoebel-Theuer] Complete rewrite of the pathname
   * lookup logic.
   */
  /* [Feb-Apr 2000, AV] Rewrite to the new namespace architecture.
   */
  
  #include <linux/init.h>
  #include <linux/module.h>
  #include <linux/slab.h>
  #include <linux/fs.h>
  #include <linux/namei.h>
  #include <linux/quotaops.h>
  #include <linux/pagemap.h>
0eeca2830   Robert Love   [PATCH] inotify
24
  #include <linux/fsnotify.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
25
26
27
28
29
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
  #include <linux/mount.h>
  #include <linux/audit.h>
16f7e0fe2   Randy Dunlap   [PATCH] capable/c...
30
  #include <linux/capability.h>
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
31
  #include <linux/file.h>
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
32
  #include <linux/fcntl.h>
08ce5f16e   Serge E. Hallyn   cgroups: implemen...
33
  #include <linux/device_cgroup.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
  #include <asm/namei.h>
  #include <asm/uaccess.h>
  
  #define ACC_MODE(x) ("\000\004\002\006"[(x)&O_ACCMODE])
  
  /* [Feb-1997 T. Schoebel-Theuer]
   * Fundamental changes in the pathname lookup mechanisms (namei)
   * were necessary because of omirr.  The reason is that omirr needs
   * to know the _real_ pathname, not the user-supplied one, in case
   * of symlinks (and also when transname replacements occur).
   *
   * The new code replaces the old recursive symlink resolution with
   * an iterative one (in case of non-nested symlink chains).  It does
   * this with calls to <fs>_follow_link().
   * As a side effect, dir_namei(), _namei() and follow_link() are now 
   * replaced with a single function lookup_dentry() that can handle all 
   * the special cases of the former code.
   *
   * With the new dcache, the pathname is stored at each inode, at least as
   * long as the refcount of the inode is positive.  As a side effect, the
   * size of the dcache depends on the inode cache and thus is dynamic.
   *
   * [29-Apr-1998 C. Scott Ananian] Updated above description of symlink
   * resolution to correspond with current state of the code.
   *
   * Note that the symlink resolution is not *completely* iterative.
   * There is still a significant amount of tail- and mid- recursion in
   * the algorithm.  Also, note that <fs>_readlink() is not used in
   * lookup_dentry(): lookup_dentry() on the result of <fs>_readlink()
   * may return different results than <fs>_follow_link().  Many virtual
   * filesystems (including /proc) exhibit this behavior.
   */
  
  /* [24-Feb-97 T. Schoebel-Theuer] Side effects caused by new implementation:
   * New symlink semantics: when open() is called with flags O_CREAT | O_EXCL
   * and the name already exists in form of a symlink, try to create the new
   * name indicated by the symlink. The old code always complained that the
   * name already exists, due to not following the symlink even if its target
   * is nonexistent.  The new semantics affects also mknod() and link() when
   * the name is a symlink pointing to a non-existant name.
   *
   * I don't know which semantics is the right one, since I have no access
   * to standards. But I found by trial that HP-UX 9.0 has the full "new"
   * semantics implemented, while SunOS 4.1.1 and Solaris (SunOS 5.4) have the
   * "old" one. Personally, I think the new semantics is much more logical.
   * Note that "ln old new" where "new" is a symlink pointing to a non-existing
   * file does succeed in both HP-UX and SunOs, but not in Solaris
   * and in the old Linux semantics.
   */
  
  /* [16-Dec-97 Kevin Buhr] For security reasons, we change some symlink
   * semantics.  See the comments in "open_namei" and "do_link" below.
   *
   * [10-Sep-98 Alan Modra] Another symlink change.
   */
  
  /* [Feb-Apr 2000 AV] Complete rewrite. Rules for symlinks:
   *	inside the path - always follow.
   *	in the last component in creation/removal/renaming - never follow.
   *	if LOOKUP_FOLLOW passed - follow.
   *	if the pathname has trailing slashes - follow.
   *	otherwise - don't follow.
   * (applied in that order).
   *
   * [Jun 2000 AV] Inconsistent behaviour of open() in case if flags==O_CREAT
   * restored for 2.4. This is the last surviving part of old 4.2BSD bug.
   * During the 2.4 we need to fix the userland stuff depending on it -
   * hopefully we will be able to get rid of that wart in 2.5. So far only
   * XEmacs seems to be relying on it...
   */
  /*
   * [Sep 2001 AV] Single-semaphore locking scheme (kudos to David Holland)
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
106
   * implemented.  Let's see if raised priority of ->s_vfs_rename_mutex gives
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
107
108
   * any extra contention...
   */
a02f76c34   Al Viro   [PATCH] get stack...
109
  static int __link_path_walk(const char *name, struct nameidata *nd);
c4a7808fc   Josef 'Jeff' Sipek   fs: mark link_pat...
110

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
111
112
113
114
115
116
117
  /* In order to reduce some races, while at the same time doing additional
   * checking and hopefully speeding things up, we copy filenames to the
   * kernel data space before using them..
   *
   * POSIX.1 2.4: an empty pathname is invalid (ENOENT).
   * PATH_MAX includes the nul terminator --RR.
   */
858119e15   Arjan van de Ven   [PATCH] Unlinline...
118
  static int do_getname(const char __user *filename, char *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
  {
  	int retval;
  	unsigned long len = PATH_MAX;
  
  	if (!segment_eq(get_fs(), KERNEL_DS)) {
  		if ((unsigned long) filename >= TASK_SIZE)
  			return -EFAULT;
  		if (TASK_SIZE - (unsigned long) filename < PATH_MAX)
  			len = TASK_SIZE - (unsigned long) filename;
  	}
  
  	retval = strncpy_from_user(page, filename, len);
  	if (retval > 0) {
  		if (retval < len)
  			return 0;
  		return -ENAMETOOLONG;
  	} else if (!retval)
  		retval = -ENOENT;
  	return retval;
  }
  
  char * getname(const char __user * filename)
  {
  	char *tmp, *result;
  
  	result = ERR_PTR(-ENOMEM);
  	tmp = __getname();
  	if (tmp)  {
  		int retval = do_getname(filename, tmp);
  
  		result = tmp;
  		if (retval < 0) {
  			__putname(tmp);
  			result = ERR_PTR(retval);
  		}
  	}
  	audit_getname(result);
  	return result;
  }
  
  #ifdef CONFIG_AUDITSYSCALL
  void putname(const char *name)
  {
5ac3a9c26   Al Viro   [PATCH] don't bot...
162
  	if (unlikely(!audit_dummy_context()))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
  		audit_putname(name);
  	else
  		__putname(name);
  }
  EXPORT_SYMBOL(putname);
  #endif
  
  
  /**
   * generic_permission  -  check for access rights on a Posix-like filesystem
   * @inode:	inode to check access rights for
   * @mask:	right to check for (%MAY_READ, %MAY_WRITE, %MAY_EXEC)
   * @check_acl:	optional callback to check for Posix ACLs
   *
   * Used to check for read/write/execute permissions on a file.
   * We use "fsuid" for this, letting us set arbitrary permissions
   * for filesystem access without changing the "normal" uids which
   * are used for other things..
   */
  int generic_permission(struct inode *inode, int mask,
  		int (*check_acl)(struct inode *inode, int mask))
  {
  	umode_t			mode = inode->i_mode;
  
  	if (current->fsuid == inode->i_uid)
  		mode >>= 6;
  	else {
  		if (IS_POSIXACL(inode) && (mode & S_IRWXG) && check_acl) {
  			int error = check_acl(inode, mask);
  			if (error == -EACCES)
  				goto check_capabilities;
  			else if (error != -EAGAIN)
  				return error;
  		}
  
  		if (in_group_p(inode->i_gid))
  			mode >>= 3;
  	}
  
  	/*
  	 * If the DACs are ok we don't need any capability check.
  	 */
  	if (((mode & mask & (MAY_READ|MAY_WRITE|MAY_EXEC)) == mask))
  		return 0;
  
   check_capabilities:
  	/*
  	 * Read/write DACs are always overridable.
  	 * Executable DACs are overridable if at least one exec bit is set.
  	 */
  	if (!(mask & MAY_EXEC) ||
  	    (inode->i_mode & S_IXUGO) || S_ISDIR(inode->i_mode))
  		if (capable(CAP_DAC_OVERRIDE))
  			return 0;
  
  	/*
  	 * Searching includes executable on directories, else just read.
  	 */
  	if (mask == MAY_READ || (S_ISDIR(inode->i_mode) && !(mask & MAY_WRITE)))
  		if (capable(CAP_DAC_READ_SEARCH))
  			return 0;
  
  	return -EACCES;
  }
  
  int permission(struct inode *inode, int mask, struct nameidata *nd)
  {
  	int retval, submask;
c7eb26678   Dave Hansen   r/o bind mounts: ...
231
232
233
  	struct vfsmount *mnt = NULL;
  
  	if (nd)
4ac913785   Jan Blunck   Embed a struct pa...
234
  		mnt = nd->path.mnt;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
235
236
  
  	if (mask & MAY_WRITE) {
22590e41c   Miklos Szeredi   fix execute check...
237
  		umode_t mode = inode->i_mode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
238
239
240
241
242
243
244
245
246
247
248
249
250
251
  
  		/*
  		 * Nobody gets write access to a read-only fs.
  		 */
  		if (IS_RDONLY(inode) &&
  		    (S_ISREG(mode) || S_ISDIR(mode) || S_ISLNK(mode)))
  			return -EROFS;
  
  		/*
  		 * Nobody gets write access to an immutable file.
  		 */
  		if (IS_IMMUTABLE(inode))
  			return -EACCES;
  	}
22590e41c   Miklos Szeredi   fix execute check...
252
253
254
255
256
  	if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) {
  		/*
  		 * MAY_EXEC on regular files is denied if the fs is mounted
  		 * with the "noexec" flag.
  		 */
c7eb26678   Dave Hansen   r/o bind mounts: ...
257
  		if (mnt && (mnt->mnt_flags & MNT_NOEXEC))
22590e41c   Miklos Szeredi   fix execute check...
258
259
  			return -EACCES;
  	}
a343bb775   Trond Myklebust   VFS: Fix access("...
260

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
261
262
  	/* Ordinary permission routines do not understand MAY_APPEND. */
  	submask = mask & ~MAY_APPEND;
22590e41c   Miklos Szeredi   fix execute check...
263
  	if (inode->i_op && inode->i_op->permission) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
264
  		retval = inode->i_op->permission(inode, submask, nd);
22590e41c   Miklos Szeredi   fix execute check...
265
266
267
268
269
270
271
272
273
274
275
276
277
  		if (!retval) {
  			/*
  			 * Exec permission on a regular file is denied if none
  			 * of the execute bits are set.
  			 *
  			 * This check should be done by the ->permission()
  			 * method.
  			 */
  			if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode) &&
  			    !(inode->i_mode & S_IXUGO))
  				return -EACCES;
  		}
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
278
  		retval = generic_permission(inode, submask, NULL);
22590e41c   Miklos Szeredi   fix execute check...
279
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
280
281
  	if (retval)
  		return retval;
08ce5f16e   Serge E. Hallyn   cgroups: implemen...
282
283
284
  	retval = devcgroup_inode_permission(inode, mask);
  	if (retval)
  		return retval;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
285
286
  	return security_inode_permission(inode, mask, nd);
  }
e4543eddf   Christoph Hellwig   [PATCH] add a vfs...
287
288
289
290
291
292
293
294
295
296
297
298
  /**
   * vfs_permission  -  check for access rights to a given path
   * @nd:		lookup result that describes the path
   * @mask:	right to check for (%MAY_READ, %MAY_WRITE, %MAY_EXEC)
   *
   * Used to check for read/write/execute permissions on a path.
   * We use "fsuid" for this, letting us set arbitrary permissions
   * for filesystem access without changing the "normal" uids which
   * are used for other things.
   */
  int vfs_permission(struct nameidata *nd, int mask)
  {
4ac913785   Jan Blunck   Embed a struct pa...
299
  	return permission(nd->path.dentry->d_inode, mask, nd);
e4543eddf   Christoph Hellwig   [PATCH] add a vfs...
300
  }
8c744fb83   Christoph Hellwig   [PATCH] add a fil...
301
302
303
304
305
306
307
308
309
310
311
312
313
314
  /**
   * file_permission  -  check for additional access rights to a given file
   * @file:	file to check access rights for
   * @mask:	right to check for (%MAY_READ, %MAY_WRITE, %MAY_EXEC)
   *
   * Used to check for read/write/execute permissions on an already opened
   * file.
   *
   * Note:
   *	Do not use this function in new code.  All access checks should
   *	be done using vfs_permission().
   */
  int file_permission(struct file *file, int mask)
  {
0f7fc9e4d   Josef "Jeff" Sipek   [PATCH] VFS: chan...
315
  	return permission(file->f_path.dentry->d_inode, mask, NULL);
8c744fb83   Christoph Hellwig   [PATCH] add a fil...
316
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
  /*
   * get_write_access() gets write permission for a file.
   * put_write_access() releases this write permission.
   * This is used for regular files.
   * We cannot support write (and maybe mmap read-write shared) accesses and
   * MAP_DENYWRITE mmappings simultaneously. The i_writecount field of an inode
   * can have the following values:
   * 0: no writers, no VM_DENYWRITE mappings
   * < 0: (-i_writecount) vm_area_structs with VM_DENYWRITE set exist
   * > 0: (i_writecount) users are writing to the file.
   *
   * Normally we operate on that counter with atomic_{inc,dec} and it's safe
   * except for the cases where we don't hold i_writecount yet. Then we need to
   * use {get,deny}_write_access() - these functions check the sign and refuse
   * to do the change if sign is wrong. Exclusion between them is provided by
   * the inode->i_lock spinlock.
   */
  
  int get_write_access(struct inode * inode)
  {
  	spin_lock(&inode->i_lock);
  	if (atomic_read(&inode->i_writecount) < 0) {
  		spin_unlock(&inode->i_lock);
  		return -ETXTBSY;
  	}
  	atomic_inc(&inode->i_writecount);
  	spin_unlock(&inode->i_lock);
  
  	return 0;
  }
  
  int deny_write_access(struct file * file)
  {
0f7fc9e4d   Josef "Jeff" Sipek   [PATCH] VFS: chan...
350
  	struct inode *inode = file->f_path.dentry->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
351
352
353
354
355
356
357
358
359
360
361
  
  	spin_lock(&inode->i_lock);
  	if (atomic_read(&inode->i_writecount) > 0) {
  		spin_unlock(&inode->i_lock);
  		return -ETXTBSY;
  	}
  	atomic_dec(&inode->i_writecount);
  	spin_unlock(&inode->i_lock);
  
  	return 0;
  }
1d957f9bf   Jan Blunck   Introduce path_put()
362
  /**
5dd784d04   Jan Blunck   Introduce path_get()
363
364
365
366
367
368
369
370
371
372
373
374
375
   * path_get - get a reference to a path
   * @path: path to get the reference to
   *
   * Given a path increment the reference count to the dentry and the vfsmount.
   */
  void path_get(struct path *path)
  {
  	mntget(path->mnt);
  	dget(path->dentry);
  }
  EXPORT_SYMBOL(path_get);
  
  /**
1d957f9bf   Jan Blunck   Introduce path_put()
376
377
378
379
380
381
   * path_put - put a reference to a path
   * @path: path to put the reference to
   *
   * Given a path decrement the reference count to the dentry and the vfsmount.
   */
  void path_put(struct path *path)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
382
  {
1d957f9bf   Jan Blunck   Introduce path_put()
383
384
  	dput(path->dentry);
  	mntput(path->mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
385
  }
1d957f9bf   Jan Blunck   Introduce path_put()
386
  EXPORT_SYMBOL(path_put);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
387

834f2a4a1   Trond Myklebust   VFS: Allow the fi...
388
389
390
391
392
393
  /**
   * release_open_intent - free up open intent resources
   * @nd: pointer to nameidata
   */
  void release_open_intent(struct nameidata *nd)
  {
0f7fc9e4d   Josef "Jeff" Sipek   [PATCH] VFS: chan...
394
  	if (nd->intent.open.file->f_path.dentry == NULL)
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
395
396
397
398
  		put_filp(nd->intent.open.file);
  	else
  		fput(nd->intent.open.file);
  }
bcdc5e019   Ian Kent   [PATCH] autofs4 n...
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
  static inline struct dentry *
  do_revalidate(struct dentry *dentry, struct nameidata *nd)
  {
  	int status = dentry->d_op->d_revalidate(dentry, nd);
  	if (unlikely(status <= 0)) {
  		/*
  		 * The dentry failed validation.
  		 * If d_revalidate returned 0 attempt to invalidate
  		 * the dentry otherwise d_revalidate is asking us
  		 * to return a fail status.
  		 */
  		if (!status) {
  			if (!d_invalidate(dentry)) {
  				dput(dentry);
  				dentry = NULL;
  			}
  		} else {
  			dput(dentry);
  			dentry = ERR_PTR(status);
  		}
  	}
  	return dentry;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
422
423
424
425
426
427
428
429
430
431
432
433
434
  /*
   * Internal lookup() using the new generic dcache.
   * SMP-safe
   */
  static struct dentry * cached_lookup(struct dentry * parent, struct qstr * name, struct nameidata *nd)
  {
  	struct dentry * dentry = __d_lookup(parent, name);
  
  	/* lockess __d_lookup may fail due to concurrent d_move() 
  	 * in some unrelated directory, so try with d_lookup
  	 */
  	if (!dentry)
  		dentry = d_lookup(parent, name);
bcdc5e019   Ian Kent   [PATCH] autofs4 n...
435
436
  	if (dentry && dentry->d_op && dentry->d_op->d_revalidate)
  		dentry = do_revalidate(dentry, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
437
438
439
440
441
442
443
444
445
446
447
448
449
  	return dentry;
  }
  
  /*
   * Short-cut version of permission(), for calling by
   * path_walk(), when dcache lock is held.  Combines parts
   * of permission() and generic_permission(), and tests ONLY for
   * MAY_EXEC permission.
   *
   * If appropriate, check DAC only.  If not appropriate, or
   * short-cut DAC fails, then call permission() to do more
   * complete permission check.
   */
858119e15   Arjan van de Ven   [PATCH] Unlinline...
450
  static int exec_permission_lite(struct inode *inode,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
  				       struct nameidata *nd)
  {
  	umode_t	mode = inode->i_mode;
  
  	if (inode->i_op && inode->i_op->permission)
  		return -EAGAIN;
  
  	if (current->fsuid == inode->i_uid)
  		mode >>= 6;
  	else if (in_group_p(inode->i_gid))
  		mode >>= 3;
  
  	if (mode & MAY_EXEC)
  		goto ok;
  
  	if ((inode->i_mode & S_IXUGO) && capable(CAP_DAC_OVERRIDE))
  		goto ok;
  
  	if (S_ISDIR(inode->i_mode) && capable(CAP_DAC_OVERRIDE))
  		goto ok;
  
  	if (S_ISDIR(inode->i_mode) && capable(CAP_DAC_READ_SEARCH))
  		goto ok;
  
  	return -EACCES;
  ok:
  	return security_inode_permission(inode, MAY_EXEC, nd);
  }
  
  /*
   * This is called when everything else fails, and we actually have
   * to go to the low-level filesystem to find out what we should do..
   *
   * We get the directory semaphore, and after getting that we also
   * make sure that nobody added the entry to the dcache in the meantime..
   * SMP-safe
   */
  static struct dentry * real_lookup(struct dentry * parent, struct qstr * name, struct nameidata *nd)
  {
  	struct dentry * result;
  	struct inode *dir = parent->d_inode;
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
492
  	mutex_lock(&dir->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
  	/*
  	 * First re-do the cached lookup just in case it was created
  	 * while we waited for the directory semaphore..
  	 *
  	 * FIXME! This could use version numbering or similar to
  	 * avoid unnecessary cache lookups.
  	 *
  	 * The "dcache_lock" is purely to protect the RCU list walker
  	 * from concurrent renames at this point (we mustn't get false
  	 * negatives from the RCU list walk here, unlike the optimistic
  	 * fast walk).
  	 *
  	 * so doing d_lookup() (with seqlock), instead of lockfree __d_lookup
  	 */
  	result = d_lookup(parent, name);
  	if (!result) {
  		struct dentry * dentry = d_alloc(parent, name);
  		result = ERR_PTR(-ENOMEM);
  		if (dentry) {
  			result = dir->i_op->lookup(dir, dentry, nd);
  			if (result)
  				dput(dentry);
  			else
  				result = dentry;
  		}
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
518
  		mutex_unlock(&dir->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
519
520
521
522
523
524
525
  		return result;
  	}
  
  	/*
  	 * Uhhuh! Nasty case: the cache was re-populated while
  	 * we waited on the semaphore. Need to revalidate.
  	 */
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
526
  	mutex_unlock(&dir->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
527
  	if (result->d_op && result->d_op->d_revalidate) {
bcdc5e019   Ian Kent   [PATCH] autofs4 n...
528
529
  		result = do_revalidate(result, nd);
  		if (!result)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
530
  			result = ERR_PTR(-ENOENT);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
531
532
533
534
535
536
537
  	}
  	return result;
  }
  
  static int __emul_lookup_dentry(const char *, struct nameidata *);
  
  /* SMP-safe */
f16623569   Arjan van de Ven   [PATCH] Mark some...
538
  static __always_inline int
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
539
540
  walk_init_root(const char *name, struct nameidata *nd)
  {
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
541
542
543
  	struct fs_struct *fs = current->fs;
  
  	read_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
544
545
546
  	if (fs->altroot.dentry && !(nd->flags & LOOKUP_NOALT)) {
  		nd->path = fs->altroot;
  		path_get(&fs->altroot);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
547
  		read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
548
549
  		if (__emul_lookup_dentry(name,nd))
  			return 0;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
550
  		read_lock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
551
  	}
6ac08c39a   Jan Blunck   Use struct path i...
552
553
  	nd->path = fs->root;
  	path_get(&fs->root);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
554
  	read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
555
556
  	return 1;
  }
a02f76c34   Al Viro   [PATCH] get stack...
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
  /*
   * Wrapper to retry pathname resolution whenever the underlying
   * file system returns an ESTALE.
   *
   * Retry the whole path once, forcing real lookup requests
   * instead of relying on the dcache.
   */
  static __always_inline int link_path_walk(const char *name, struct nameidata *nd)
  {
  	struct path save = nd->path;
  	int result;
  
  	/* make sure the stuff we saved doesn't go away */
  	dget(save.dentry);
  	mntget(save.mnt);
  
  	result = __link_path_walk(name, nd);
  	if (result == -ESTALE) {
  		/* nd->path had been dropped */
  		nd->path = save;
  		dget(nd->path.dentry);
  		mntget(nd->path.mnt);
  		nd->flags |= LOOKUP_REVAL;
  		result = __link_path_walk(name, nd);
  	}
  
  	path_put(&save);
  
  	return result;
  }
f16623569   Arjan van de Ven   [PATCH] Mark some...
587
  static __always_inline int __vfs_follow_link(struct nameidata *nd, const char *link)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
588
589
590
591
592
593
594
  {
  	int res = 0;
  	char *name;
  	if (IS_ERR(link))
  		goto fail;
  
  	if (*link == '/') {
1d957f9bf   Jan Blunck   Introduce path_put()
595
  		path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
  		if (!walk_init_root(link, nd))
  			/* weird __emul_prefix() stuff did it */
  			goto out;
  	}
  	res = link_path_walk(link, nd);
  out:
  	if (nd->depth || res || nd->last_type!=LAST_NORM)
  		return res;
  	/*
  	 * If it is an iterative symlinks resolution in open_namei() we
  	 * have to copy the last component. And all that crap because of
  	 * bloody create() on broken symlinks. Furrfu...
  	 */
  	name = __getname();
  	if (unlikely(!name)) {
1d957f9bf   Jan Blunck   Introduce path_put()
611
  		path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
612
613
614
615
616
617
  		return -ENOMEM;
  	}
  	strcpy(name, nd->last.name);
  	nd->last.name = name;
  	return 0;
  fail:
1d957f9bf   Jan Blunck   Introduce path_put()
618
  	path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
619
620
  	return PTR_ERR(link);
  }
1d957f9bf   Jan Blunck   Introduce path_put()
621
  static void path_put_conditional(struct path *path, struct nameidata *nd)
051d38125   Ian Kent   [PATCH] autofs4: ...
622
623
  {
  	dput(path->dentry);
4ac913785   Jan Blunck   Embed a struct pa...
624
  	if (path->mnt != nd->path.mnt)
051d38125   Ian Kent   [PATCH] autofs4: ...
625
626
627
628
629
  		mntput(path->mnt);
  }
  
  static inline void path_to_nameidata(struct path *path, struct nameidata *nd)
  {
4ac913785   Jan Blunck   Embed a struct pa...
630
631
632
633
634
  	dput(nd->path.dentry);
  	if (nd->path.mnt != path->mnt)
  		mntput(nd->path.mnt);
  	nd->path.mnt = path->mnt;
  	nd->path.dentry = path->dentry;
051d38125   Ian Kent   [PATCH] autofs4: ...
635
  }
f16623569   Arjan van de Ven   [PATCH] Mark some...
636
  static __always_inline int __do_follow_link(struct path *path, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
637
638
  {
  	int error;
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
639
  	void *cookie;
cd4e91d3b   Al Viro   [PATCH] namei fix...
640
  	struct dentry *dentry = path->dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
641

d671a1cbf   Al Viro   [PATCH] namei fix...
642
  	touch_atime(path->mnt, dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
643
  	nd_set_link(nd, NULL);
cd4e91d3b   Al Viro   [PATCH] namei fix...
644

4ac913785   Jan Blunck   Embed a struct pa...
645
  	if (path->mnt != nd->path.mnt) {
051d38125   Ian Kent   [PATCH] autofs4: ...
646
647
648
649
  		path_to_nameidata(path, nd);
  		dget(dentry);
  	}
  	mntget(path->mnt);
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
650
651
652
  	cookie = dentry->d_inode->i_op->follow_link(dentry, nd);
  	error = PTR_ERR(cookie);
  	if (!IS_ERR(cookie)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
653
  		char *s = nd_get_link(nd);
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
654
  		error = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
655
656
657
  		if (s)
  			error = __vfs_follow_link(nd, s);
  		if (dentry->d_inode->i_op->put_link)
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
658
  			dentry->d_inode->i_op->put_link(dentry, nd, cookie);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
659
  	}
09da5916b   Jan Blunck   Use path_put() in...
660
  	path_put(path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
661
662
663
664
665
666
667
668
669
670
671
  
  	return error;
  }
  
  /*
   * This limits recursive symlink follows to 8, while
   * limiting consecutive symlinks to 40.
   *
   * Without that kind of total limit, nasty chains of consecutive
   * symlinks can cause almost arbitrarily long lookups. 
   */
90ebe5654   Al Viro   [PATCH] namei fixes
672
  static inline int do_follow_link(struct path *path, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
673
674
675
676
677
678
679
680
  {
  	int err = -ELOOP;
  	if (current->link_count >= MAX_NESTED_LINKS)
  		goto loop;
  	if (current->total_link_count >= 40)
  		goto loop;
  	BUG_ON(nd->depth >= MAX_NESTED_LINKS);
  	cond_resched();
90ebe5654   Al Viro   [PATCH] namei fixes
681
  	err = security_inode_follow_link(path->dentry, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
682
683
684
685
686
  	if (err)
  		goto loop;
  	current->link_count++;
  	current->total_link_count++;
  	nd->depth++;
cd4e91d3b   Al Viro   [PATCH] namei fix...
687
  	err = __do_follow_link(path, nd);
839d9f93c   Al Viro   [PATCH] namei fix...
688
689
  	current->link_count--;
  	nd->depth--;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
690
691
  	return err;
  loop:
1d957f9bf   Jan Blunck   Introduce path_put()
692
693
  	path_put_conditional(path, nd);
  	path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
  	return err;
  }
  
  int follow_up(struct vfsmount **mnt, struct dentry **dentry)
  {
  	struct vfsmount *parent;
  	struct dentry *mountpoint;
  	spin_lock(&vfsmount_lock);
  	parent=(*mnt)->mnt_parent;
  	if (parent == *mnt) {
  		spin_unlock(&vfsmount_lock);
  		return 0;
  	}
  	mntget(parent);
  	mountpoint=dget((*mnt)->mnt_mountpoint);
  	spin_unlock(&vfsmount_lock);
  	dput(*dentry);
  	*dentry = mountpoint;
  	mntput(*mnt);
  	*mnt = parent;
  	return 1;
  }
  
  /* no need for dcache_lock, as serialization is taken care in
   * namespace.c
   */
463ffb2e9   Al Viro   [PATCH] namei fix...
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
  static int __follow_mount(struct path *path)
  {
  	int res = 0;
  	while (d_mountpoint(path->dentry)) {
  		struct vfsmount *mounted = lookup_mnt(path->mnt, path->dentry);
  		if (!mounted)
  			break;
  		dput(path->dentry);
  		if (res)
  			mntput(path->mnt);
  		path->mnt = mounted;
  		path->dentry = dget(mounted->mnt_root);
  		res = 1;
  	}
  	return res;
  }
58c465eba   Al Viro   [PATCH] namei fix...
736
  static void follow_mount(struct vfsmount **mnt, struct dentry **dentry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
737
  {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
738
739
740
741
  	while (d_mountpoint(*dentry)) {
  		struct vfsmount *mounted = lookup_mnt(*mnt, *dentry);
  		if (!mounted)
  			break;
58c465eba   Al Viro   [PATCH] namei fix...
742
  		dput(*dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
743
744
  		mntput(*mnt);
  		*mnt = mounted;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
745
  		*dentry = dget(mounted->mnt_root);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
746
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
747
748
749
750
751
  }
  
  /* no need for dcache_lock, as serialization is taken care in
   * namespace.c
   */
e13b210f6   Al Viro   [PATCH] namei fix...
752
  int follow_down(struct vfsmount **mnt, struct dentry **dentry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
753
754
755
756
757
  {
  	struct vfsmount *mounted;
  
  	mounted = lookup_mnt(*mnt, *dentry);
  	if (mounted) {
e13b210f6   Al Viro   [PATCH] namei fix...
758
  		dput(*dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
759
760
  		mntput(*mnt);
  		*mnt = mounted;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
761
762
763
764
765
  		*dentry = dget(mounted->mnt_root);
  		return 1;
  	}
  	return 0;
  }
f16623569   Arjan van de Ven   [PATCH] Mark some...
766
  static __always_inline void follow_dotdot(struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
767
  {
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
768
  	struct fs_struct *fs = current->fs;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
769
770
  	while(1) {
  		struct vfsmount *parent;
4ac913785   Jan Blunck   Embed a struct pa...
771
  		struct dentry *old = nd->path.dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
772

e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
773
                  read_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
774
775
  		if (nd->path.dentry == fs->root.dentry &&
  		    nd->path.mnt == fs->root.mnt) {
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
776
                          read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
777
778
  			break;
  		}
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
779
                  read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
780
  		spin_lock(&dcache_lock);
4ac913785   Jan Blunck   Embed a struct pa...
781
782
  		if (nd->path.dentry != nd->path.mnt->mnt_root) {
  			nd->path.dentry = dget(nd->path.dentry->d_parent);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
783
784
785
786
787
788
  			spin_unlock(&dcache_lock);
  			dput(old);
  			break;
  		}
  		spin_unlock(&dcache_lock);
  		spin_lock(&vfsmount_lock);
4ac913785   Jan Blunck   Embed a struct pa...
789
790
  		parent = nd->path.mnt->mnt_parent;
  		if (parent == nd->path.mnt) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
791
792
793
794
  			spin_unlock(&vfsmount_lock);
  			break;
  		}
  		mntget(parent);
4ac913785   Jan Blunck   Embed a struct pa...
795
  		nd->path.dentry = dget(nd->path.mnt->mnt_mountpoint);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
796
797
  		spin_unlock(&vfsmount_lock);
  		dput(old);
4ac913785   Jan Blunck   Embed a struct pa...
798
799
  		mntput(nd->path.mnt);
  		nd->path.mnt = parent;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
800
  	}
4ac913785   Jan Blunck   Embed a struct pa...
801
  	follow_mount(&nd->path.mnt, &nd->path.dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
802
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
803
804
805
806
807
808
809
810
  /*
   *  It's more convoluted than I'd like it to be, but... it's still fairly
   *  small and for now I'd prefer to have fast path as straight as possible.
   *  It _is_ time-critical.
   */
  static int do_lookup(struct nameidata *nd, struct qstr *name,
  		     struct path *path)
  {
4ac913785   Jan Blunck   Embed a struct pa...
811
812
  	struct vfsmount *mnt = nd->path.mnt;
  	struct dentry *dentry = __d_lookup(nd->path.dentry, name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
813
814
815
816
817
818
819
820
  
  	if (!dentry)
  		goto need_lookup;
  	if (dentry->d_op && dentry->d_op->d_revalidate)
  		goto need_revalidate;
  done:
  	path->mnt = mnt;
  	path->dentry = dentry;
634ee7017   Al Viro   [PATCH] namei fix...
821
  	__follow_mount(path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
822
823
824
  	return 0;
  
  need_lookup:
4ac913785   Jan Blunck   Embed a struct pa...
825
  	dentry = real_lookup(nd->path.dentry, name, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
826
827
828
829
830
  	if (IS_ERR(dentry))
  		goto fail;
  	goto done;
  
  need_revalidate:
bcdc5e019   Ian Kent   [PATCH] autofs4 n...
831
832
833
834
835
836
  	dentry = do_revalidate(dentry, nd);
  	if (!dentry)
  		goto need_lookup;
  	if (IS_ERR(dentry))
  		goto fail;
  	goto done;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
837
838
839
840
841
842
843
  
  fail:
  	return PTR_ERR(dentry);
  }
  
  /*
   * Name resolution.
ea3834d9f   Prasanna Meda   namei: add audit_...
844
845
   * This is the basic name resolution function, turning a pathname into
   * the final dentry. We expect 'base' to be positive and a directory.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
846
   *
ea3834d9f   Prasanna Meda   namei: add audit_...
847
848
   * Returns 0 and nd will have valid dentry and mnt on success.
   * Returns error and drops reference to input namei data on failure.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
849
   */
fc9b52cd8   Harvey Harrison   fs: remove fastca...
850
  static int __link_path_walk(const char *name, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
851
852
853
854
855
856
857
858
859
860
  {
  	struct path next;
  	struct inode *inode;
  	int err;
  	unsigned int lookup_flags = nd->flags;
  	
  	while (*name=='/')
  		name++;
  	if (!*name)
  		goto return_reval;
4ac913785   Jan Blunck   Embed a struct pa...
861
  	inode = nd->path.dentry->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
862
  	if (nd->depth)
f55eab822   Trond Myklebust   [PATCH] VFS: Ensu...
863
  		lookup_flags = LOOKUP_FOLLOW | (nd->flags & LOOKUP_CONTINUE);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
864
865
866
867
868
869
  
  	/* At this point we know we have a real path component. */
  	for(;;) {
  		unsigned long hash;
  		struct qstr this;
  		unsigned int c;
cdce5d6b9   Trond Myklebust   VFS: Make link_pa...
870
  		nd->flags |= LOOKUP_CONTINUE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
871
  		err = exec_permission_lite(inode, nd);
e4543eddf   Christoph Hellwig   [PATCH] add a vfs...
872
873
  		if (err == -EAGAIN)
  			err = vfs_permission(nd, MAY_EXEC);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
   		if (err)
  			break;
  
  		this.name = name;
  		c = *(const unsigned char *)name;
  
  		hash = init_name_hash();
  		do {
  			name++;
  			hash = partial_name_hash(c, hash);
  			c = *(const unsigned char *)name;
  		} while (c && (c != '/'));
  		this.len = name - (const char *) this.name;
  		this.hash = end_name_hash(hash);
  
  		/* remove trailing slashes? */
  		if (!c)
  			goto last_component;
  		while (*++name == '/');
  		if (!*name)
  			goto last_with_slashes;
  
  		/*
  		 * "." and ".." are special - ".." especially so because it has
  		 * to be able to know about the current root directory and
  		 * parent relationships.
  		 */
  		if (this.name[0] == '.') switch (this.len) {
  			default:
  				break;
  			case 2:	
  				if (this.name[1] != '.')
  					break;
58c465eba   Al Viro   [PATCH] namei fix...
907
  				follow_dotdot(nd);
4ac913785   Jan Blunck   Embed a struct pa...
908
  				inode = nd->path.dentry->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
909
910
911
912
913
914
915
916
  				/* fallthrough */
  			case 1:
  				continue;
  		}
  		/*
  		 * See if the low-level filesystem might want
  		 * to use its own hash..
  		 */
4ac913785   Jan Blunck   Embed a struct pa...
917
918
919
  		if (nd->path.dentry->d_op && nd->path.dentry->d_op->d_hash) {
  			err = nd->path.dentry->d_op->d_hash(nd->path.dentry,
  							    &this);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
920
921
922
  			if (err < 0)
  				break;
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
923
924
925
926
  		/* This does the actual lookups.. */
  		err = do_lookup(nd, &this, &next);
  		if (err)
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
927
928
929
930
931
932
933
934
935
936
  
  		err = -ENOENT;
  		inode = next.dentry->d_inode;
  		if (!inode)
  			goto out_dput;
  		err = -ENOTDIR; 
  		if (!inode->i_op)
  			goto out_dput;
  
  		if (inode->i_op->follow_link) {
90ebe5654   Al Viro   [PATCH] namei fixes
937
  			err = do_follow_link(&next, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
938
939
940
  			if (err)
  				goto return_err;
  			err = -ENOENT;
4ac913785   Jan Blunck   Embed a struct pa...
941
  			inode = nd->path.dentry->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
942
943
944
945
946
  			if (!inode)
  				break;
  			err = -ENOTDIR; 
  			if (!inode->i_op)
  				break;
09dd17d3e   Miklos Szeredi   [PATCH] namei cle...
947
948
  		} else
  			path_to_nameidata(&next, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
949
950
951
952
953
954
955
956
957
  		err = -ENOTDIR; 
  		if (!inode->i_op->lookup)
  			break;
  		continue;
  		/* here ends the main loop */
  
  last_with_slashes:
  		lookup_flags |= LOOKUP_FOLLOW | LOOKUP_DIRECTORY;
  last_component:
f55eab822   Trond Myklebust   [PATCH] VFS: Ensu...
958
959
  		/* Clear LOOKUP_CONTINUE iff it was previously unset */
  		nd->flags &= lookup_flags | ~LOOKUP_CONTINUE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
960
961
962
963
964
965
966
967
  		if (lookup_flags & LOOKUP_PARENT)
  			goto lookup_parent;
  		if (this.name[0] == '.') switch (this.len) {
  			default:
  				break;
  			case 2:	
  				if (this.name[1] != '.')
  					break;
58c465eba   Al Viro   [PATCH] namei fix...
968
  				follow_dotdot(nd);
4ac913785   Jan Blunck   Embed a struct pa...
969
  				inode = nd->path.dentry->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
970
971
972
973
  				/* fallthrough */
  			case 1:
  				goto return_reval;
  		}
4ac913785   Jan Blunck   Embed a struct pa...
974
975
976
  		if (nd->path.dentry->d_op && nd->path.dentry->d_op->d_hash) {
  			err = nd->path.dentry->d_op->d_hash(nd->path.dentry,
  							    &this);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
977
978
979
980
981
982
  			if (err < 0)
  				break;
  		}
  		err = do_lookup(nd, &this, &next);
  		if (err)
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
983
984
985
  		inode = next.dentry->d_inode;
  		if ((lookup_flags & LOOKUP_FOLLOW)
  		    && inode && inode->i_op && inode->i_op->follow_link) {
90ebe5654   Al Viro   [PATCH] namei fixes
986
  			err = do_follow_link(&next, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
987
988
  			if (err)
  				goto return_err;
4ac913785   Jan Blunck   Embed a struct pa...
989
  			inode = nd->path.dentry->d_inode;
09dd17d3e   Miklos Szeredi   [PATCH] namei cle...
990
991
  		} else
  			path_to_nameidata(&next, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
  		err = -ENOENT;
  		if (!inode)
  			break;
  		if (lookup_flags & LOOKUP_DIRECTORY) {
  			err = -ENOTDIR; 
  			if (!inode->i_op || !inode->i_op->lookup)
  				break;
  		}
  		goto return_base;
  lookup_parent:
  		nd->last = this;
  		nd->last_type = LAST_NORM;
  		if (this.name[0] != '.')
  			goto return_base;
  		if (this.len == 1)
  			nd->last_type = LAST_DOT;
  		else if (this.len == 2 && this.name[1] == '.')
  			nd->last_type = LAST_DOTDOT;
  		else
  			goto return_base;
  return_reval:
  		/*
  		 * We bypassed the ordinary revalidation routines.
  		 * We may need to check the cached dentry for staleness.
  		 */
4ac913785   Jan Blunck   Embed a struct pa...
1017
1018
  		if (nd->path.dentry && nd->path.dentry->d_sb &&
  		    (nd->path.dentry->d_sb->s_type->fs_flags & FS_REVAL_DOT)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1019
1020
  			err = -ESTALE;
  			/* Note: we do not d_invalidate() */
4ac913785   Jan Blunck   Embed a struct pa...
1021
1022
  			if (!nd->path.dentry->d_op->d_revalidate(
  					nd->path.dentry, nd))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1023
1024
1025
1026
1027
  				break;
  		}
  return_base:
  		return 0;
  out_dput:
1d957f9bf   Jan Blunck   Introduce path_put()
1028
  		path_put_conditional(&next, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1029
1030
  		break;
  	}
1d957f9bf   Jan Blunck   Introduce path_put()
1031
  	path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1032
1033
1034
  return_err:
  	return err;
  }
fc9b52cd8   Harvey Harrison   fs: remove fastca...
1035
  static int path_walk(const char *name, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1036
1037
1038
1039
  {
  	current->total_link_count = 0;
  	return link_path_walk(name, nd);
  }
ea3834d9f   Prasanna Meda   namei: add audit_...
1040
1041
1042
1043
  /* 
   * SMP-safe: Returns 1 and nd will have valid dentry and mnt, if
   * everything is done. Returns 0 and drops input nd, if lookup failed;
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1044
1045
1046
1047
  static int __emul_lookup_dentry(const char *name, struct nameidata *nd)
  {
  	if (path_walk(name, nd))
  		return 0;		/* something went wrong... */
4ac913785   Jan Blunck   Embed a struct pa...
1048
1049
  	if (!nd->path.dentry->d_inode ||
  	    S_ISDIR(nd->path.dentry->d_inode->i_mode)) {
09da5916b   Jan Blunck   Use path_put() in...
1050
  		struct path old_path = nd->path;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1051
1052
  		struct qstr last = nd->last;
  		int last_type = nd->last_type;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1053
  		struct fs_struct *fs = current->fs;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1054
  		/*
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1055
1056
  		 * NAME was not found in alternate root or it's a directory.
  		 * Try to find it in the normal root:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1057
1058
  		 */
  		nd->last_type = LAST_ROOT;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1059
  		read_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
1060
1061
  		nd->path = fs->root;
  		path_get(&fs->root);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1062
  		read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1063
  		if (path_walk(name, nd) == 0) {
4ac913785   Jan Blunck   Embed a struct pa...
1064
  			if (nd->path.dentry->d_inode) {
09da5916b   Jan Blunck   Use path_put() in...
1065
  				path_put(&old_path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1066
1067
  				return 1;
  			}
1d957f9bf   Jan Blunck   Introduce path_put()
1068
  			path_put(&nd->path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1069
  		}
09da5916b   Jan Blunck   Use path_put() in...
1070
  		nd->path = old_path;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
  		nd->last = last;
  		nd->last_type = last_type;
  	}
  	return 1;
  }
  
  void set_fs_altroot(void)
  {
  	char *emul = __emul_prefix();
  	struct nameidata nd;
6ac08c39a   Jan Blunck   Use struct path i...
1081
  	struct path path = {}, old_path;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1082
  	int err;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1083
  	struct fs_struct *fs = current->fs;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1084
1085
1086
1087
  
  	if (!emul)
  		goto set_it;
  	err = path_lookup(emul, LOOKUP_FOLLOW|LOOKUP_DIRECTORY|LOOKUP_NOALT, &nd);
6ac08c39a   Jan Blunck   Use struct path i...
1088
1089
  	if (!err)
  		path = nd.path;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1090
  set_it:
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1091
  	write_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
1092
1093
  	old_path = fs->altroot;
  	fs->altroot = path;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1094
  	write_unlock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
1095
1096
  	if (old_path.dentry)
  		path_put(&old_path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1097
  }
ea3834d9f   Prasanna Meda   namei: add audit_...
1098
  /* Returns 0 and nd will be valid on success; Retuns error, otherwise. */
fc9b52cd8   Harvey Harrison   fs: remove fastca...
1099
  static int do_path_lookup(int dfd, const char *name,
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1100
  				unsigned int flags, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1101
  {
ea3834d9f   Prasanna Meda   namei: add audit_...
1102
  	int retval = 0;
170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1103
1104
  	int fput_needed;
  	struct file *file;
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1105
  	struct fs_struct *fs = current->fs;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1106
1107
1108
1109
  
  	nd->last_type = LAST_ROOT; /* if there are only slashes... */
  	nd->flags = flags;
  	nd->depth = 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1110
  	if (*name=='/') {
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1111
  		read_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
1112
1113
1114
  		if (fs->altroot.dentry && !(nd->flags & LOOKUP_NOALT)) {
  			nd->path = fs->altroot;
  			path_get(&fs->altroot);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1115
  			read_unlock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1116
  			if (__emul_lookup_dentry(name,nd))
ea3834d9f   Prasanna Meda   namei: add audit_...
1117
  				goto out; /* found in altroot */
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1118
  			read_lock(&fs->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1119
  		}
6ac08c39a   Jan Blunck   Use struct path i...
1120
1121
  		nd->path = fs->root;
  		path_get(&fs->root);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1122
  		read_unlock(&fs->lock);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1123
  	} else if (dfd == AT_FDCWD) {
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1124
  		read_lock(&fs->lock);
6ac08c39a   Jan Blunck   Use struct path i...
1125
1126
  		nd->path = fs->pwd;
  		path_get(&fs->pwd);
e518ddb7b   Andreas Mohr   [PATCH] fs/namei....
1127
  		read_unlock(&fs->lock);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1128
  	} else {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1129
1130
1131
  		struct dentry *dentry;
  
  		file = fget_light(dfd, &fput_needed);
170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1132
1133
  		retval = -EBADF;
  		if (!file)
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1134
  			goto out_fail;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1135

0f7fc9e4d   Josef "Jeff" Sipek   [PATCH] VFS: chan...
1136
  		dentry = file->f_path.dentry;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1137

170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1138
1139
  		retval = -ENOTDIR;
  		if (!S_ISDIR(dentry->d_inode->i_mode))
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1140
  			goto fput_fail;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1141
1142
  
  		retval = file_permission(file, MAY_EXEC);
170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1143
  		if (retval)
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1144
  			goto fput_fail;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1145

5dd784d04   Jan Blunck   Introduce path_get()
1146
1147
  		nd->path = file->f_path;
  		path_get(&file->f_path);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1148
1149
  
  		fput_light(file, fput_needed);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1150
  	}
2dfdd266b   Josef 'Jeff' Sipek   fs: use path_walk...
1151
1152
  
  	retval = path_walk(name, nd);
ea3834d9f   Prasanna Meda   namei: add audit_...
1153
  out:
4ac913785   Jan Blunck   Embed a struct pa...
1154
1155
1156
  	if (unlikely(!retval && !audit_dummy_context() && nd->path.dentry &&
  				nd->path.dentry->d_inode))
  		audit_inode(name, nd->path.dentry);
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1157
  out_fail:
170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1158
  	return retval;
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1159
  fput_fail:
170aa3d02   Ulrich Drepper   [PATCH] namei.c: ...
1160
  	fput_light(file, fput_needed);
6d09bb627   Trond Myklebust   [PATCH] fs/namei....
1161
  	goto out_fail;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1162
  }
fc9b52cd8   Harvey Harrison   fs: remove fastca...
1163
  int path_lookup(const char *name, unsigned int flags,
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1164
1165
1166
1167
  			struct nameidata *nd)
  {
  	return do_path_lookup(AT_FDCWD, name, flags, nd);
  }
16f182002   Josef 'Jeff' Sipek   fs: introduce vfs...
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
  /**
   * vfs_path_lookup - lookup a file path relative to a dentry-vfsmount pair
   * @dentry:  pointer to dentry of the base directory
   * @mnt: pointer to vfs mount of the base directory
   * @name: pointer to file name
   * @flags: lookup flags
   * @nd: pointer to nameidata
   */
  int vfs_path_lookup(struct dentry *dentry, struct vfsmount *mnt,
  		    const char *name, unsigned int flags,
  		    struct nameidata *nd)
  {
  	int retval;
  
  	/* same as do_path_lookup */
  	nd->last_type = LAST_ROOT;
  	nd->flags = flags;
  	nd->depth = 0;
4ac913785   Jan Blunck   Embed a struct pa...
1186
1187
  	nd->path.mnt = mntget(mnt);
  	nd->path.dentry = dget(dentry);
16f182002   Josef 'Jeff' Sipek   fs: introduce vfs...
1188
1189
  
  	retval = path_walk(name, nd);
4ac913785   Jan Blunck   Embed a struct pa...
1190
1191
1192
  	if (unlikely(!retval && !audit_dummy_context() && nd->path.dentry &&
  				nd->path.dentry->d_inode))
  		audit_inode(name, nd->path.dentry);
16f182002   Josef 'Jeff' Sipek   fs: introduce vfs...
1193
1194
1195
1196
  
  	return retval;
  
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1197
1198
1199
  static int __path_lookup_intent_open(int dfd, const char *name,
  		unsigned int lookup_flags, struct nameidata *nd,
  		int open_flags, int create_mode)
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1200
1201
1202
1203
1204
1205
1206
1207
1208
  {
  	struct file *filp = get_empty_filp();
  	int err;
  
  	if (filp == NULL)
  		return -ENFILE;
  	nd->intent.open.file = filp;
  	nd->intent.open.flags = open_flags;
  	nd->intent.open.create_mode = create_mode;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1209
  	err = do_path_lookup(dfd, name, lookup_flags|LOOKUP_OPEN, nd);
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1210
1211
1212
  	if (IS_ERR(nd->intent.open.file)) {
  		if (err == 0) {
  			err = PTR_ERR(nd->intent.open.file);
1d957f9bf   Jan Blunck   Introduce path_put()
1213
  			path_put(&nd->path);
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1214
1215
1216
1217
1218
1219
1220
1221
  		}
  	} else if (err != 0)
  		release_open_intent(nd);
  	return err;
  }
  
  /**
   * path_lookup_open - lookup a file path with open intent
7045f37b1   Martin Waitz   [PATCH] DocBook: ...
1222
   * @dfd: the directory to use as base, or AT_FDCWD
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1223
1224
1225
1226
1227
   * @name: pointer to file name
   * @lookup_flags: lookup intent flags
   * @nd: pointer to nameidata
   * @open_flags: open intent flags
   */
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1228
  int path_lookup_open(int dfd, const char *name, unsigned int lookup_flags,
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1229
1230
  		struct nameidata *nd, int open_flags)
  {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1231
  	return __path_lookup_intent_open(dfd, name, lookup_flags, nd,
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1232
1233
1234
1235
1236
  			open_flags, 0);
  }
  
  /**
   * path_lookup_create - lookup a file path with open + create intent
7045f37b1   Martin Waitz   [PATCH] DocBook: ...
1237
   * @dfd: the directory to use as base, or AT_FDCWD
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1238
1239
1240
1241
1242
1243
   * @name: pointer to file name
   * @lookup_flags: lookup intent flags
   * @nd: pointer to nameidata
   * @open_flags: open intent flags
   * @create_mode: create intent flags
   */
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1244
1245
1246
  static int path_lookup_create(int dfd, const char *name,
  			      unsigned int lookup_flags, struct nameidata *nd,
  			      int open_flags, int create_mode)
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1247
  {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1248
1249
  	return __path_lookup_intent_open(dfd, name, lookup_flags|LOOKUP_CREATE,
  			nd, open_flags, create_mode);
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1250
1251
1252
1253
1254
1255
1256
1257
1258
  }
  
  int __user_path_lookup_open(const char __user *name, unsigned int lookup_flags,
  		struct nameidata *nd, int open_flags)
  {
  	char *tmp = getname(name);
  	int err = PTR_ERR(tmp);
  
  	if (!IS_ERR(tmp)) {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1259
  		err = __path_lookup_intent_open(AT_FDCWD, tmp, lookup_flags, nd, open_flags, 0);
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1260
1261
1262
1263
  		putname(tmp);
  	}
  	return err;
  }
eead19115   Christoph Hellwig   partially fix up ...
1264
1265
  static struct dentry *__lookup_hash(struct qstr *name,
  		struct dentry *base, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1266
  {
057f6c019   James Morris   security: prevent...
1267
  	struct dentry *dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1268
1269
1270
1271
  	struct inode *inode;
  	int err;
  
  	inode = base->d_inode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
  
  	/*
  	 * See if the low-level filesystem might want
  	 * to use its own hash..
  	 */
  	if (base->d_op && base->d_op->d_hash) {
  		err = base->d_op->d_hash(base, name);
  		dentry = ERR_PTR(err);
  		if (err < 0)
  			goto out;
  	}
  
  	dentry = cached_lookup(base, name, nd);
  	if (!dentry) {
  		struct dentry *new = d_alloc(base, name);
  		dentry = ERR_PTR(-ENOMEM);
  		if (!new)
  			goto out;
  		dentry = inode->i_op->lookup(inode, new, nd);
  		if (!dentry)
  			dentry = new;
  		else
  			dput(new);
  	}
  out:
  	return dentry;
  }
057f6c019   James Morris   security: prevent...
1299
1300
1301
1302
1303
  /*
   * Restricted form of lookup. Doesn't follow links, single-component only,
   * needs parent already locked. Doesn't follow mounts.
   * SMP-safe.
   */
eead19115   Christoph Hellwig   partially fix up ...
1304
  static struct dentry *lookup_hash(struct nameidata *nd)
057f6c019   James Morris   security: prevent...
1305
  {
057f6c019   James Morris   security: prevent...
1306
  	int err;
4ac913785   Jan Blunck   Embed a struct pa...
1307
  	err = permission(nd->path.dentry->d_inode, MAY_EXEC, nd);
057f6c019   James Morris   security: prevent...
1308
  	if (err)
eead19115   Christoph Hellwig   partially fix up ...
1309
  		return ERR_PTR(err);
4ac913785   Jan Blunck   Embed a struct pa...
1310
  	return __lookup_hash(&nd->last, nd->path.dentry, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1311
  }
eead19115   Christoph Hellwig   partially fix up ...
1312
1313
  static int __lookup_one_len(const char *name, struct qstr *this,
  		struct dentry *base, int len)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1314
1315
  {
  	unsigned long hash;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1316
  	unsigned int c;
057f6c019   James Morris   security: prevent...
1317
1318
  	this->name = name;
  	this->len = len;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1319
  	if (!len)
057f6c019   James Morris   security: prevent...
1320
  		return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1321
1322
1323
1324
1325
  
  	hash = init_name_hash();
  	while (len--) {
  		c = *(const unsigned char *)name++;
  		if (c == '/' || c == '\0')
057f6c019   James Morris   security: prevent...
1326
  			return -EACCES;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1327
1328
  		hash = partial_name_hash(c, hash);
  	}
057f6c019   James Morris   security: prevent...
1329
1330
1331
  	this->hash = end_name_hash(hash);
  	return 0;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1332

eead19115   Christoph Hellwig   partially fix up ...
1333
  /**
a6b91919e   Randy Dunlap   fs: fix kernel-do...
1334
   * lookup_one_len - filesystem helper to lookup single pathname component
eead19115   Christoph Hellwig   partially fix up ...
1335
1336
1337
1338
   * @name:	pathname component to lookup
   * @base:	base directory to lookup from
   * @len:	maximum length @len should be interpreted to
   *
a6b91919e   Randy Dunlap   fs: fix kernel-do...
1339
1340
   * Note that this routine is purely a helper for filesystem usage and should
   * not be called by generic code.  Also note that by using this function the
eead19115   Christoph Hellwig   partially fix up ...
1341
1342
1343
   * nameidata argument is passed to the filesystem methods and a filesystem
   * using this helper needs to be prepared for that.
   */
057f6c019   James Morris   security: prevent...
1344
1345
1346
1347
1348
1349
1350
1351
  struct dentry *lookup_one_len(const char *name, struct dentry *base, int len)
  {
  	int err;
  	struct qstr this;
  
  	err = __lookup_one_len(name, &this, base, len);
  	if (err)
  		return ERR_PTR(err);
eead19115   Christoph Hellwig   partially fix up ...
1352
1353
1354
1355
  
  	err = permission(base->d_inode, MAY_EXEC, NULL);
  	if (err)
  		return ERR_PTR(err);
49705b774   Christoph Hellwig   [PATCH] sanitize ...
1356
  	return __lookup_hash(&this, base, NULL);
057f6c019   James Morris   security: prevent...
1357
  }
eead19115   Christoph Hellwig   partially fix up ...
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
  /**
   * lookup_one_noperm - bad hack for sysfs
   * @name:	pathname component to lookup
   * @base:	base directory to lookup from
   *
   * This is a variant of lookup_one_len that doesn't perform any permission
   * checks.   It's a horrible hack to work around the braindead sysfs
   * architecture and should not be used anywhere else.
   *
   * DON'T USE THIS FUNCTION EVER, thanks.
   */
  struct dentry *lookup_one_noperm(const char *name, struct dentry *base)
057f6c019   James Morris   security: prevent...
1370
1371
1372
  {
  	int err;
  	struct qstr this;
eead19115   Christoph Hellwig   partially fix up ...
1373
  	err = __lookup_one_len(name, &this, base, strlen(name));
057f6c019   James Morris   security: prevent...
1374
1375
  	if (err)
  		return ERR_PTR(err);
eead19115   Christoph Hellwig   partially fix up ...
1376
  	return __lookup_hash(&this, base, NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1377
  }
fc9b52cd8   Harvey Harrison   fs: remove fastca...
1378
  int __user_walk_fd(int dfd, const char __user *name, unsigned flags,
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1379
  			    struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1380
1381
1382
1383
1384
  {
  	char *tmp = getname(name);
  	int err = PTR_ERR(tmp);
  
  	if (!IS_ERR(tmp)) {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1385
  		err = do_path_lookup(dfd, tmp, flags, nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1386
1387
1388
1389
  		putname(tmp);
  	}
  	return err;
  }
fc9b52cd8   Harvey Harrison   fs: remove fastca...
1390
  int __user_walk(const char __user *name, unsigned flags, struct nameidata *nd)
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1391
1392
1393
  {
  	return __user_walk_fd(AT_FDCWD, name, flags, nd);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1394
1395
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
1417
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
  /*
   * It's inline, so penalty for filesystems that don't use sticky bit is
   * minimal.
   */
  static inline int check_sticky(struct inode *dir, struct inode *inode)
  {
  	if (!(dir->i_mode & S_ISVTX))
  		return 0;
  	if (inode->i_uid == current->fsuid)
  		return 0;
  	if (dir->i_uid == current->fsuid)
  		return 0;
  	return !capable(CAP_FOWNER);
  }
  
  /*
   *	Check whether we can remove a link victim from directory dir, check
   *  whether the type of victim is right.
   *  1. We can't do it if dir is read-only (done in permission())
   *  2. We should have write and exec permissions on dir
   *  3. We can't remove anything from append-only dir
   *  4. We can't do anything with immutable dir (done in permission())
   *  5. If the sticky bit on dir is set we should either
   *	a. be owner of dir, or
   *	b. be owner of victim, or
   *	c. have CAP_FOWNER capability
   *  6. If the victim is append-only or immutable we can't do antyhing with
   *     links pointing to it.
   *  7. If we were asked to remove a directory and victim isn't one - ENOTDIR.
   *  8. If we were asked to remove a non-directory and victim isn't one - EISDIR.
   *  9. We can't remove a root or mountpoint.
   * 10. We don't allow removal of NFS sillyrenamed files; it's handled by
   *     nfs_async_unlink().
   */
858119e15   Arjan van de Ven   [PATCH] Unlinline...
1428
  static int may_delete(struct inode *dir,struct dentry *victim,int isdir)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1429
1430
1431
1432
1433
1434
1435
  {
  	int error;
  
  	if (!victim->d_inode)
  		return -ENOENT;
  
  	BUG_ON(victim->d_parent->d_inode != dir);
5a190ae69   Al Viro   [PATCH] pass dent...
1436
  	audit_inode_child(victim->d_name.name, victim, dir);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
  
  	error = permission(dir,MAY_WRITE | MAY_EXEC, NULL);
  	if (error)
  		return error;
  	if (IS_APPEND(dir))
  		return -EPERM;
  	if (check_sticky(dir, victim->d_inode)||IS_APPEND(victim->d_inode)||
  	    IS_IMMUTABLE(victim->d_inode))
  		return -EPERM;
  	if (isdir) {
  		if (!S_ISDIR(victim->d_inode->i_mode))
  			return -ENOTDIR;
  		if (IS_ROOT(victim))
  			return -EBUSY;
  	} else if (S_ISDIR(victim->d_inode->i_mode))
  		return -EISDIR;
  	if (IS_DEADDIR(dir))
  		return -ENOENT;
  	if (victim->d_flags & DCACHE_NFSFS_RENAMED)
  		return -EBUSY;
  	return 0;
  }
  
  /*	Check whether we can create an object with dentry child in directory
   *  dir.
   *  1. We can't do it if child already exists (open has special treatment for
   *     this case, but since we are inlined it's OK)
   *  2. We can't do it if dir is read-only (done in permission())
   *  3. We should have write and exec permissions on dir
   *  4. We can't do it if dir is immutable (done in permission())
   */
  static inline int may_create(struct inode *dir, struct dentry *child,
  			     struct nameidata *nd)
  {
  	if (child->d_inode)
  		return -EEXIST;
  	if (IS_DEADDIR(dir))
  		return -ENOENT;
  	return permission(dir,MAY_WRITE | MAY_EXEC, nd);
  }
  
  /* 
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1479
1480
1481
1482
1483
1484
1485
1486
1487
   * O_DIRECTORY translates into forcing a directory lookup.
   */
  static inline int lookup_flags(unsigned int f)
  {
  	unsigned long retval = LOOKUP_FOLLOW;
  
  	if (f & O_NOFOLLOW)
  		retval &= ~LOOKUP_FOLLOW;
  	
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1488
1489
1490
1491
1492
1493
1494
1495
1496
1497
1498
1499
1500
1501
  	if (f & O_DIRECTORY)
  		retval |= LOOKUP_DIRECTORY;
  
  	return retval;
  }
  
  /*
   * p1 and p2 should be directories on the same fs.
   */
  struct dentry *lock_rename(struct dentry *p1, struct dentry *p2)
  {
  	struct dentry *p;
  
  	if (p1 == p2) {
f2eace23e   Ingo Molnar   [PATCH] lockdep: ...
1502
  		mutex_lock_nested(&p1->d_inode->i_mutex, I_MUTEX_PARENT);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1503
1504
  		return NULL;
  	}
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
1505
  	mutex_lock(&p1->d_inode->i_sb->s_vfs_rename_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1506
1507
1508
  
  	for (p = p1; p->d_parent != p; p = p->d_parent) {
  		if (p->d_parent == p2) {
f2eace23e   Ingo Molnar   [PATCH] lockdep: ...
1509
1510
  			mutex_lock_nested(&p2->d_inode->i_mutex, I_MUTEX_PARENT);
  			mutex_lock_nested(&p1->d_inode->i_mutex, I_MUTEX_CHILD);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1511
1512
1513
1514
1515
1516
  			return p;
  		}
  	}
  
  	for (p = p2; p->d_parent != p; p = p->d_parent) {
  		if (p->d_parent == p1) {
f2eace23e   Ingo Molnar   [PATCH] lockdep: ...
1517
1518
  			mutex_lock_nested(&p1->d_inode->i_mutex, I_MUTEX_PARENT);
  			mutex_lock_nested(&p2->d_inode->i_mutex, I_MUTEX_CHILD);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1519
1520
1521
  			return p;
  		}
  	}
f2eace23e   Ingo Molnar   [PATCH] lockdep: ...
1522
1523
  	mutex_lock_nested(&p1->d_inode->i_mutex, I_MUTEX_PARENT);
  	mutex_lock_nested(&p2->d_inode->i_mutex, I_MUTEX_CHILD);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1524
1525
1526
1527
1528
  	return NULL;
  }
  
  void unlock_rename(struct dentry *p1, struct dentry *p2)
  {
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1529
  	mutex_unlock(&p1->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1530
  	if (p1 != p2) {
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1531
  		mutex_unlock(&p2->d_inode->i_mutex);
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
1532
  		mutex_unlock(&p1->d_inode->i_sb->s_vfs_rename_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
  	}
  }
  
  int vfs_create(struct inode *dir, struct dentry *dentry, int mode,
  		struct nameidata *nd)
  {
  	int error = may_create(dir, dentry, nd);
  
  	if (error)
  		return error;
  
  	if (!dir->i_op || !dir->i_op->create)
  		return -EACCES;	/* shouldn't it be ENOSYS? */
  	mode &= S_IALLUGO;
  	mode |= S_IFREG;
  	error = security_inode_create(dir, dentry, mode);
  	if (error)
  		return error;
  	DQUOT_INIT(dir);
  	error = dir->i_op->create(dir, dentry, mode, nd);
a74574aaf   Stephen Smalley   [PATCH] Remove se...
1553
  	if (!error)
f38aa9422   Amy Griffis   [PATCH] Pass dent...
1554
  		fsnotify_create(dir, dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1555
1556
1557
1558
1559
  	return error;
  }
  
  int may_open(struct nameidata *nd, int acc_mode, int flag)
  {
4ac913785   Jan Blunck   Embed a struct pa...
1560
  	struct dentry *dentry = nd->path.dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1561
1562
1563
1564
1565
1566
1567
1568
1569
  	struct inode *inode = dentry->d_inode;
  	int error;
  
  	if (!inode)
  		return -ENOENT;
  
  	if (S_ISLNK(inode->i_mode))
  		return -ELOOP;
  	
974a9f0b4   Linus Torvalds   Use access mode i...
1570
  	if (S_ISDIR(inode->i_mode) && (acc_mode & MAY_WRITE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1571
  		return -EISDIR;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1572
1573
1574
1575
1576
1577
1578
1579
  	/*
  	 * FIFO's, sockets and device files are special: they don't
  	 * actually live on the filesystem itself, and as such you
  	 * can write to them even if the filesystem is read-only.
  	 */
  	if (S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
  	    	flag &= ~O_TRUNC;
  	} else if (S_ISBLK(inode->i_mode) || S_ISCHR(inode->i_mode)) {
4ac913785   Jan Blunck   Embed a struct pa...
1580
  		if (nd->path.mnt->mnt_flags & MNT_NODEV)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1581
1582
1583
  			return -EACCES;
  
  		flag &= ~O_TRUNC;
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1584
  	}
b41572e92   Dave Hansen   r/o bind mounts: ...
1585
1586
1587
1588
  
  	error = vfs_permission(nd, acc_mode);
  	if (error)
  		return error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1589
1590
1591
1592
1593
1594
1595
1596
1597
1598
1599
1600
  	/*
  	 * An append-only file must be opened in append mode for writing.
  	 */
  	if (IS_APPEND(inode)) {
  		if  ((flag & FMODE_WRITE) && !(flag & O_APPEND))
  			return -EPERM;
  		if (flag & O_TRUNC)
  			return -EPERM;
  	}
  
  	/* O_NOATIME can only be set by the owner or superuser */
  	if (flag & O_NOATIME)
3bd858ab1   Satyam Sharma   Introduce is_owne...
1601
  		if (!is_owner_or_cap(inode))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
1619
1620
1621
  			return -EPERM;
  
  	/*
  	 * Ensure there are no outstanding leases on the file.
  	 */
  	error = break_lease(inode, flag);
  	if (error)
  		return error;
  
  	if (flag & O_TRUNC) {
  		error = get_write_access(inode);
  		if (error)
  			return error;
  
  		/*
  		 * Refuse to truncate files with mandatory locks held on them.
  		 */
  		error = locks_verify_locked(inode);
  		if (!error) {
  			DQUOT_INIT(inode);
d139d7ffd   Miklos Szeredi   VFS: allow filesy...
1622
1623
1624
1625
  
  			error = do_truncate(dentry, 0,
  					    ATTR_MTIME|ATTR_CTIME|ATTR_OPEN,
  					    NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1626
1627
1628
1629
1630
1631
1632
1633
1634
1635
  		}
  		put_write_access(inode);
  		if (error)
  			return error;
  	} else
  		if (flag & FMODE_WRITE)
  			DQUOT_INIT(inode);
  
  	return 0;
  }
d57999e15   Dave Hansen   [PATCH] do namei_...
1636
1637
1638
1639
1640
1641
  /*
   * Be careful about ever adding any more callers of this
   * function.  Its flags must be in the namei format, not
   * what get passed to sys_open().
   */
  static int __open_namei_create(struct nameidata *nd, struct path *path,
aab520e2f   Dave Hansen   [PATCH] r/o bind ...
1642
1643
1644
  				int flag, int mode)
  {
  	int error;
4ac913785   Jan Blunck   Embed a struct pa...
1645
  	struct dentry *dir = nd->path.dentry;
aab520e2f   Dave Hansen   [PATCH] r/o bind ...
1646
1647
1648
1649
1650
  
  	if (!IS_POSIXACL(dir->d_inode))
  		mode &= ~current->fs->umask;
  	error = vfs_create(dir->d_inode, path->dentry, mode, nd);
  	mutex_unlock(&dir->d_inode->i_mutex);
4ac913785   Jan Blunck   Embed a struct pa...
1651
1652
  	dput(nd->path.dentry);
  	nd->path.dentry = path->dentry;
aab520e2f   Dave Hansen   [PATCH] r/o bind ...
1653
1654
1655
1656
1657
  	if (error)
  		return error;
  	/* Don't check for write permission, don't truncate */
  	return may_open(nd, 0, flag & ~O_TRUNC);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1658
  /*
d57999e15   Dave Hansen   [PATCH] do namei_...
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
1669
1670
1671
1672
1673
1674
1675
1676
1677
1678
1679
1680
   * Note that while the flag value (low two bits) for sys_open means:
   *	00 - read-only
   *	01 - write-only
   *	10 - read-write
   *	11 - special
   * it is changed into
   *	00 - no permissions needed
   *	01 - read-permission
   *	10 - write-permission
   *	11 - read-write
   * for the internal routines (ie open_namei()/follow_link() etc)
   * This is more logical, and also allows the 00 "no perm needed"
   * to be used for symlinks (where the permissions are checked
   * later).
   *
  */
  static inline int open_to_namei_flags(int flag)
  {
  	if ((flag+1) & O_ACCMODE)
  		flag++;
  	return flag;
  }
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1681
1682
1683
1684
1685
1686
1687
1688
1689
1690
  static int open_will_write_to_fs(int flag, struct inode *inode)
  {
  	/*
  	 * We'll never write to the fs underlying
  	 * a device file.
  	 */
  	if (special_file(inode->i_mode))
  		return 0;
  	return (flag & O_TRUNC);
  }
d57999e15   Dave Hansen   [PATCH] do namei_...
1691
  /*
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1692
1693
1694
   * Note that the low bits of the passed in "open_flag"
   * are not the same as in the local variable "flag". See
   * open_to_namei_flags() for more details.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1695
   */
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1696
1697
  struct file *do_filp_open(int dfd, const char *pathname,
  		int open_flag, int mode)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1698
  {
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1699
  	struct file *filp;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1700
  	struct nameidata nd;
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1701
  	int acc_mode, error;
4e7506e4d   Al Viro   [PATCH] namei fix...
1702
  	struct path path;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1703
1704
  	struct dentry *dir;
  	int count = 0;
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1705
  	int will_write;
d57999e15   Dave Hansen   [PATCH] do namei_...
1706
  	int flag = open_to_namei_flags(open_flag);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1707
1708
  
  	acc_mode = ACC_MODE(flag);
834f2a4a1   Trond Myklebust   VFS: Allow the fi...
1709
1710
1711
  	/* O_TRUNC implies we need access checks for write permissions */
  	if (flag & O_TRUNC)
  		acc_mode |= MAY_WRITE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1712
1713
1714
1715
  	/* Allow the LSM permission hook to distinguish append 
  	   access from general write access. */
  	if (flag & O_APPEND)
  		acc_mode |= MAY_APPEND;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1716
1717
1718
1719
  	/*
  	 * The simplest case - just a plain lookup.
  	 */
  	if (!(flag & O_CREAT)) {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
1720
  		error = path_lookup_open(dfd, pathname, lookup_flags(flag),
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1721
  					 &nd, flag);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1722
  		if (error)
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1723
  			return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1724
1725
1726
1727
1728
1729
  		goto ok;
  	}
  
  	/*
  	 * Create - we need to know the parent.
  	 */
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1730
1731
  	error = path_lookup_create(dfd, pathname, LOOKUP_PARENT,
  				   &nd, flag, mode);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1732
  	if (error)
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1733
  		return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1734
1735
1736
1737
1738
1739
1740
  
  	/*
  	 * We have the parent and last component. First of all, check
  	 * that we are not asked to creat(2) an obvious directory - that
  	 * will not do.
  	 */
  	error = -EISDIR;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1741
  	if (nd.last_type != LAST_NORM || nd.last.name[nd.last.len])
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1742
  		goto exit;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1743
1744
  	dir = nd.path.dentry;
  	nd.flags &= ~LOOKUP_PARENT;
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1745
  	mutex_lock(&dir->d_inode->i_mutex);
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1746
1747
  	path.dentry = lookup_hash(&nd);
  	path.mnt = nd.path.mnt;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1748
1749
  
  do_last:
4e7506e4d   Al Viro   [PATCH] namei fix...
1750
1751
  	error = PTR_ERR(path.dentry);
  	if (IS_ERR(path.dentry)) {
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1752
  		mutex_unlock(&dir->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1753
1754
  		goto exit;
  	}
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1755
  	if (IS_ERR(nd.intent.open.file)) {
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1756
  		error = PTR_ERR(nd.intent.open.file);
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1757
  		goto exit_mutex_unlock;
4af4c52f3   Oleg Drokin   [PATCH] Missed er...
1758
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1759
  	/* Negative dentry, just create the file */
4e7506e4d   Al Viro   [PATCH] namei fix...
1760
  	if (!path.dentry->d_inode) {
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1761
1762
1763
1764
1765
1766
1767
1768
  		/*
  		 * This write is needed to ensure that a
  		 * ro->rw transition does not occur between
  		 * the time when the file is created and when
  		 * a permanent write count is taken through
  		 * the 'struct file' in nameidata_to_filp().
  		 */
  		error = mnt_want_write(nd.path.mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1769
  		if (error)
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1770
1771
1772
1773
  			goto exit_mutex_unlock;
  		error = __open_namei_create(&nd, &path, flag, mode);
  		if (error) {
  			mnt_drop_write(nd.path.mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1774
  			goto exit;
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1775
1776
1777
1778
  		}
  		filp = nameidata_to_filp(&nd, open_flag);
  		mnt_drop_write(nd.path.mnt);
  		return filp;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1779
1780
1781
1782
1783
  	}
  
  	/*
  	 * It already exists.
  	 */
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1784
  	mutex_unlock(&dir->d_inode->i_mutex);
5a190ae69   Al Viro   [PATCH] pass dent...
1785
  	audit_inode(pathname, path.dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1786
1787
1788
1789
  
  	error = -EEXIST;
  	if (flag & O_EXCL)
  		goto exit_dput;
e13b210f6   Al Viro   [PATCH] namei fix...
1790
  	if (__follow_mount(&path)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1791
  		error = -ELOOP;
ba7a4c1a7   Al Viro   [PATCH] namei fix...
1792
1793
  		if (flag & O_NOFOLLOW)
  			goto exit_dput;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1794
  	}
3e2efce06   Amy Griffis   [PATCH] fix fault...
1795

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1796
  	error = -ENOENT;
4e7506e4d   Al Viro   [PATCH] namei fix...
1797
  	if (!path.dentry->d_inode)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1798
  		goto exit_dput;
4e7506e4d   Al Viro   [PATCH] namei fix...
1799
  	if (path.dentry->d_inode->i_op && path.dentry->d_inode->i_op->follow_link)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1800
  		goto do_link;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1801
  	path_to_nameidata(&path, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1802
  	error = -EISDIR;
4e7506e4d   Al Viro   [PATCH] namei fix...
1803
  	if (path.dentry->d_inode && S_ISDIR(path.dentry->d_inode->i_mode))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1804
1805
  		goto exit;
  ok:
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1806
1807
1808
1809
1810
1811
1812
1813
1814
1815
1816
1817
1818
1819
1820
1821
  	/*
  	 * Consider:
  	 * 1. may_open() truncates a file
  	 * 2. a rw->ro mount transition occurs
  	 * 3. nameidata_to_filp() fails due to
  	 *    the ro mount.
  	 * That would be inconsistent, and should
  	 * be avoided. Taking this mnt write here
  	 * ensures that (2) can not occur.
  	 */
  	will_write = open_will_write_to_fs(flag, nd.path.dentry->d_inode);
  	if (will_write) {
  		error = mnt_want_write(nd.path.mnt);
  		if (error)
  			goto exit;
  	}
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1822
  	error = may_open(&nd, acc_mode, flag);
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1823
1824
1825
  	if (error) {
  		if (will_write)
  			mnt_drop_write(nd.path.mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1826
  		goto exit;
4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1827
1828
1829
1830
1831
1832
1833
1834
1835
1836
  	}
  	filp = nameidata_to_filp(&nd, open_flag);
  	/*
  	 * It is now safe to drop the mnt write
  	 * because the filp has had a write taken
  	 * on its behalf.
  	 */
  	if (will_write)
  		mnt_drop_write(nd.path.mnt);
  	return filp;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1837

4a3fd211c   Dave Hansen   [PATCH] r/o bind ...
1838
1839
  exit_mutex_unlock:
  	mutex_unlock(&dir->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1840
  exit_dput:
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1841
  	path_put_conditional(&path, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1842
  exit:
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1843
1844
1845
1846
  	if (!IS_ERR(nd.intent.open.file))
  		release_open_intent(&nd);
  	path_put(&nd.path);
  	return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1847
1848
1849
1850
1851
1852
1853
1854
1855
1856
1857
1858
1859
1860
1861
  
  do_link:
  	error = -ELOOP;
  	if (flag & O_NOFOLLOW)
  		goto exit_dput;
  	/*
  	 * This is subtle. Instead of calling do_follow_link() we do the
  	 * thing by hands. The reason is that this way we have zero link_count
  	 * and path_walk() (called from ->follow_link) honoring LOOKUP_PARENT.
  	 * After that we have the parent and last component, i.e.
  	 * we are in the same situation as after the first path_walk().
  	 * Well, almost - if the last component is normal we get its copy
  	 * stored in nd->last.name and we will have to putname() it when we
  	 * are done. Procfs-like symlinks just set LAST_BIND.
  	 */
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1862
1863
  	nd.flags |= LOOKUP_PARENT;
  	error = security_inode_follow_link(path.dentry, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1864
1865
  	if (error)
  		goto exit_dput;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1866
  	error = __do_follow_link(&path, &nd);
de4592153   Kirill Korotaev   [PATCH] struct fi...
1867
1868
1869
1870
1871
  	if (error) {
  		/* Does someone understand code flow here? Or it is only
  		 * me so stupid? Anathema to whoever designed this non-sense
  		 * with "intent.open".
  		 */
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1872
1873
  		release_open_intent(&nd);
  		return ERR_PTR(error);
de4592153   Kirill Korotaev   [PATCH] struct fi...
1874
  	}
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1875
1876
  	nd.flags &= ~LOOKUP_PARENT;
  	if (nd.last_type == LAST_BIND)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1877
  		goto ok;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1878
  	error = -EISDIR;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1879
  	if (nd.last_type != LAST_NORM)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1880
  		goto exit;
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1881
1882
  	if (nd.last.name[nd.last.len]) {
  		__putname(nd.last.name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1883
1884
1885
1886
  		goto exit;
  	}
  	error = -ELOOP;
  	if (count++==32) {
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1887
  		__putname(nd.last.name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1888
1889
  		goto exit;
  	}
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1890
  	dir = nd.path.dentry;
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
1891
  	mutex_lock(&dir->d_inode->i_mutex);
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1892
1893
1894
  	path.dentry = lookup_hash(&nd);
  	path.mnt = nd.path.mnt;
  	__putname(nd.last.name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1895
1896
1897
1898
  	goto do_last;
  }
  
  /**
a70e65df8   Christoph Hellwig   [PATCH] merge ope...
1899
1900
1901
1902
1903
1904
1905
1906
1907
1908
1909
1910
1911
1912
1913
1914
1915
   * filp_open - open file and return file pointer
   *
   * @filename:	path to open
   * @flags:	open flags as per the open(2) second argument
   * @mode:	mode for the new file if O_CREAT is set, else ignored
   *
   * This is the helper to open a file from kernelspace if you really
   * have to.  But in generally you should not do this, so please move
   * along, nothing to see here..
   */
  struct file *filp_open(const char *filename, int flags, int mode)
  {
  	return do_filp_open(AT_FDCWD, filename, flags, mode);
  }
  EXPORT_SYMBOL(filp_open);
  
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1916
1917
1918
1919
1920
1921
   * lookup_create - lookup a dentry, creating it if it doesn't exist
   * @nd: nameidata info
   * @is_dir: directory flag
   *
   * Simple function to lookup and return a dentry and create it
   * if it doesn't exist.  Is SMP-safe.
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1922
   *
4ac913785   Jan Blunck   Embed a struct pa...
1923
   * Returns with nd->path.dentry->d_inode->i_mutex locked.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1924
1925
1926
   */
  struct dentry *lookup_create(struct nameidata *nd, int is_dir)
  {
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1927
  	struct dentry *dentry = ERR_PTR(-EEXIST);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1928

4ac913785   Jan Blunck   Embed a struct pa...
1929
  	mutex_lock_nested(&nd->path.dentry->d_inode->i_mutex, I_MUTEX_PARENT);
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1930
1931
1932
1933
  	/*
  	 * Yucky last component or no last component at all?
  	 * (foo/., foo/.., /////)
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1934
1935
1936
  	if (nd->last_type != LAST_NORM)
  		goto fail;
  	nd->flags &= ~LOOKUP_PARENT;
a634904a7   ASANO Masahiro   VFS: add lookup h...
1937
1938
  	nd->flags |= LOOKUP_CREATE;
  	nd->intent.open.flags = O_EXCL;
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1939
1940
1941
1942
  
  	/*
  	 * Do the final lookup.
  	 */
49705b774   Christoph Hellwig   [PATCH] sanitize ...
1943
  	dentry = lookup_hash(nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1944
1945
  	if (IS_ERR(dentry))
  		goto fail;
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1946

e9baf6e59   Al Viro   [PATCH] return to...
1947
1948
  	if (dentry->d_inode)
  		goto eexist;
c663e5d80   Christoph Hellwig   [PATCH] add some ...
1949
1950
1951
1952
1953
1954
  	/*
  	 * Special case - lookup gave negative, but... we had foo/bar/
  	 * From the vfs_mknod() POV we just have a negative dentry -
  	 * all is fine. Let's be bastards - you had / on the end, you've
  	 * been asking for (non-existent) directory. -ENOENT for you.
  	 */
e9baf6e59   Al Viro   [PATCH] return to...
1955
1956
1957
1958
  	if (unlikely(!is_dir && nd->last.name[nd->last.len])) {
  		dput(dentry);
  		dentry = ERR_PTR(-ENOENT);
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1959
  	return dentry;
e9baf6e59   Al Viro   [PATCH] return to...
1960
  eexist:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1961
  	dput(dentry);
e9baf6e59   Al Viro   [PATCH] return to...
1962
  	dentry = ERR_PTR(-EEXIST);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1963
1964
1965
  fail:
  	return dentry;
  }
f81a0bffa   Christoph Hellwig   [AF_UNIX]: Use lo...
1966
  EXPORT_SYMBOL_GPL(lookup_create);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1967
1968
1969
1970
1971
1972
1973
1974
1975
1976
1977
1978
1979
  
  int vfs_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev)
  {
  	int error = may_create(dir, dentry, NULL);
  
  	if (error)
  		return error;
  
  	if ((S_ISCHR(mode) || S_ISBLK(mode)) && !capable(CAP_MKNOD))
  		return -EPERM;
  
  	if (!dir->i_op || !dir->i_op->mknod)
  		return -EPERM;
08ce5f16e   Serge E. Hallyn   cgroups: implemen...
1980
1981
1982
  	error = devcgroup_inode_mknod(mode, dev);
  	if (error)
  		return error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1983
1984
1985
1986
1987
1988
  	error = security_inode_mknod(dir, dentry, mode, dev);
  	if (error)
  		return error;
  
  	DQUOT_INIT(dir);
  	error = dir->i_op->mknod(dir, dentry, mode, dev);
a74574aaf   Stephen Smalley   [PATCH] Remove se...
1989
  	if (!error)
f38aa9422   Amy Griffis   [PATCH] Pass dent...
1990
  		fsnotify_create(dir, dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1991
1992
  	return error;
  }
463c31972   Dave Hansen   [PATCH] r/o bind ...
1993
1994
1995
1996
1997
1998
1999
2000
2001
2002
2003
2004
2005
2006
2007
2008
  static int may_mknod(mode_t mode)
  {
  	switch (mode & S_IFMT) {
  	case S_IFREG:
  	case S_IFCHR:
  	case S_IFBLK:
  	case S_IFIFO:
  	case S_IFSOCK:
  	case 0: /* zero mode translates to S_IFREG */
  		return 0;
  	case S_IFDIR:
  		return -EPERM;
  	default:
  		return -EINVAL;
  	}
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2009
2010
  asmlinkage long sys_mknodat(int dfd, const char __user *filename, int mode,
  				unsigned dev)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2011
2012
2013
2014
2015
2016
2017
2018
2019
2020
2021
  {
  	int error = 0;
  	char * tmp;
  	struct dentry * dentry;
  	struct nameidata nd;
  
  	if (S_ISDIR(mode))
  		return -EPERM;
  	tmp = getname(filename);
  	if (IS_ERR(tmp))
  		return PTR_ERR(tmp);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2022
  	error = do_path_lookup(dfd, tmp, LOOKUP_PARENT, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2023
2024
2025
  	if (error)
  		goto out;
  	dentry = lookup_create(&nd, 0);
463c31972   Dave Hansen   [PATCH] r/o bind ...
2026
2027
2028
2029
  	if (IS_ERR(dentry)) {
  		error = PTR_ERR(dentry);
  		goto out_unlock;
  	}
4ac913785   Jan Blunck   Embed a struct pa...
2030
  	if (!IS_POSIXACL(nd.path.dentry->d_inode))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2031
  		mode &= ~current->fs->umask;
463c31972   Dave Hansen   [PATCH] r/o bind ...
2032
2033
2034
2035
2036
2037
2038
  	error = may_mknod(mode);
  	if (error)
  		goto out_dput;
  	error = mnt_want_write(nd.path.mnt);
  	if (error)
  		goto out_dput;
  	switch (mode & S_IFMT) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2039
  		case 0: case S_IFREG:
4ac913785   Jan Blunck   Embed a struct pa...
2040
  			error = vfs_create(nd.path.dentry->d_inode,dentry,mode,&nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2041
2042
  			break;
  		case S_IFCHR: case S_IFBLK:
4ac913785   Jan Blunck   Embed a struct pa...
2043
  			error = vfs_mknod(nd.path.dentry->d_inode,dentry,mode,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2044
2045
2046
  					new_decode_dev(dev));
  			break;
  		case S_IFIFO: case S_IFSOCK:
4ac913785   Jan Blunck   Embed a struct pa...
2047
  			error = vfs_mknod(nd.path.dentry->d_inode,dentry,mode,0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2048
  			break;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2049
  	}
463c31972   Dave Hansen   [PATCH] r/o bind ...
2050
2051
2052
2053
  	mnt_drop_write(nd.path.mnt);
  out_dput:
  	dput(dentry);
  out_unlock:
4ac913785   Jan Blunck   Embed a struct pa...
2054
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1d957f9bf   Jan Blunck   Introduce path_put()
2055
  	path_put(&nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2056
2057
2058
2059
2060
  out:
  	putname(tmp);
  
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2061
2062
2063
2064
  asmlinkage long sys_mknod(const char __user *filename, int mode, unsigned dev)
  {
  	return sys_mknodat(AT_FDCWD, filename, mode, dev);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2065
2066
2067
2068
2069
2070
2071
2072
2073
2074
2075
2076
2077
2078
2079
2080
2081
  int vfs_mkdir(struct inode *dir, struct dentry *dentry, int mode)
  {
  	int error = may_create(dir, dentry, NULL);
  
  	if (error)
  		return error;
  
  	if (!dir->i_op || !dir->i_op->mkdir)
  		return -EPERM;
  
  	mode &= (S_IRWXUGO|S_ISVTX);
  	error = security_inode_mkdir(dir, dentry, mode);
  	if (error)
  		return error;
  
  	DQUOT_INIT(dir);
  	error = dir->i_op->mkdir(dir, dentry, mode);
a74574aaf   Stephen Smalley   [PATCH] Remove se...
2082
  	if (!error)
f38aa9422   Amy Griffis   [PATCH] Pass dent...
2083
  		fsnotify_mkdir(dir, dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2084
2085
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2086
  asmlinkage long sys_mkdirat(int dfd, const char __user *pathname, int mode)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2087
2088
2089
  {
  	int error = 0;
  	char * tmp;
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2090
2091
  	struct dentry *dentry;
  	struct nameidata nd;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2092
2093
2094
  
  	tmp = getname(pathname);
  	error = PTR_ERR(tmp);
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2095
2096
  	if (IS_ERR(tmp))
  		goto out_err;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2097

6902d925d   Dave Hansen   [PATCH] r/o bind ...
2098
2099
2100
2101
2102
2103
2104
  	error = do_path_lookup(dfd, tmp, LOOKUP_PARENT, &nd);
  	if (error)
  		goto out;
  	dentry = lookup_create(&nd, 1);
  	error = PTR_ERR(dentry);
  	if (IS_ERR(dentry))
  		goto out_unlock;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2105

4ac913785   Jan Blunck   Embed a struct pa...
2106
  	if (!IS_POSIXACL(nd.path.dentry->d_inode))
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2107
  		mode &= ~current->fs->umask;
463c31972   Dave Hansen   [PATCH] r/o bind ...
2108
2109
2110
  	error = mnt_want_write(nd.path.mnt);
  	if (error)
  		goto out_dput;
4ac913785   Jan Blunck   Embed a struct pa...
2111
  	error = vfs_mkdir(nd.path.dentry->d_inode, dentry, mode);
463c31972   Dave Hansen   [PATCH] r/o bind ...
2112
2113
  	mnt_drop_write(nd.path.mnt);
  out_dput:
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2114
2115
  	dput(dentry);
  out_unlock:
4ac913785   Jan Blunck   Embed a struct pa...
2116
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1d957f9bf   Jan Blunck   Introduce path_put()
2117
  	path_put(&nd.path);
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2118
2119
2120
  out:
  	putname(tmp);
  out_err:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2121
2122
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2123
2124
2125
2126
  asmlinkage long sys_mkdir(const char __user *pathname, int mode)
  {
  	return sys_mkdirat(AT_FDCWD, pathname, mode);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2127
2128
2129
2130
2131
2132
2133
2134
2135
2136
2137
2138
2139
2140
2141
2142
2143
2144
  /*
   * We try to drop the dentry early: we should have
   * a usage count of 2 if we're the only user of this
   * dentry, and if that is true (possibly after pruning
   * the dcache), then we drop the dentry now.
   *
   * A low-level filesystem can, if it choses, legally
   * do a
   *
   *	if (!d_unhashed(dentry))
   *		return -EBUSY;
   *
   * if it cannot handle the case of removing a directory
   * that is still in use by something else..
   */
  void dentry_unhash(struct dentry *dentry)
  {
  	dget(dentry);
dc168427e   Vasily Averin   [PATCH] VFS: extr...
2145
  	shrink_dcache_parent(dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2146
2147
2148
2149
2150
2151
2152
2153
2154
2155
2156
2157
2158
2159
2160
2161
2162
2163
2164
  	spin_lock(&dcache_lock);
  	spin_lock(&dentry->d_lock);
  	if (atomic_read(&dentry->d_count) == 2)
  		__d_drop(dentry);
  	spin_unlock(&dentry->d_lock);
  	spin_unlock(&dcache_lock);
  }
  
  int vfs_rmdir(struct inode *dir, struct dentry *dentry)
  {
  	int error = may_delete(dir, dentry, 1);
  
  	if (error)
  		return error;
  
  	if (!dir->i_op || !dir->i_op->rmdir)
  		return -EPERM;
  
  	DQUOT_INIT(dir);
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2165
  	mutex_lock(&dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2166
2167
2168
2169
2170
2171
2172
2173
2174
2175
2176
  	dentry_unhash(dentry);
  	if (d_mountpoint(dentry))
  		error = -EBUSY;
  	else {
  		error = security_inode_rmdir(dir, dentry);
  		if (!error) {
  			error = dir->i_op->rmdir(dir, dentry);
  			if (!error)
  				dentry->d_inode->i_flags |= S_DEAD;
  		}
  	}
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2177
  	mutex_unlock(&dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2178
  	if (!error) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2179
2180
2181
2182
2183
2184
  		d_delete(dentry);
  	}
  	dput(dentry);
  
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2185
  static long do_rmdir(int dfd, const char __user *pathname)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2186
2187
2188
2189
2190
2191
2192
2193
2194
  {
  	int error = 0;
  	char * name;
  	struct dentry *dentry;
  	struct nameidata nd;
  
  	name = getname(pathname);
  	if(IS_ERR(name))
  		return PTR_ERR(name);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2195
  	error = do_path_lookup(dfd, name, LOOKUP_PARENT, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2196
2197
2198
2199
2200
2201
2202
2203
2204
2205
2206
2207
2208
2209
  	if (error)
  		goto exit;
  
  	switch(nd.last_type) {
  		case LAST_DOTDOT:
  			error = -ENOTEMPTY;
  			goto exit1;
  		case LAST_DOT:
  			error = -EINVAL;
  			goto exit1;
  		case LAST_ROOT:
  			error = -EBUSY;
  			goto exit1;
  	}
4ac913785   Jan Blunck   Embed a struct pa...
2210
  	mutex_lock_nested(&nd.path.dentry->d_inode->i_mutex, I_MUTEX_PARENT);
49705b774   Christoph Hellwig   [PATCH] sanitize ...
2211
  	dentry = lookup_hash(&nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2212
  	error = PTR_ERR(dentry);
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2213
2214
  	if (IS_ERR(dentry))
  		goto exit2;
0622753b8   Dave Hansen   [PATCH] r/o bind ...
2215
2216
2217
  	error = mnt_want_write(nd.path.mnt);
  	if (error)
  		goto exit3;
4ac913785   Jan Blunck   Embed a struct pa...
2218
  	error = vfs_rmdir(nd.path.dentry->d_inode, dentry);
0622753b8   Dave Hansen   [PATCH] r/o bind ...
2219
2220
  	mnt_drop_write(nd.path.mnt);
  exit3:
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2221
2222
  	dput(dentry);
  exit2:
4ac913785   Jan Blunck   Embed a struct pa...
2223
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2224
  exit1:
1d957f9bf   Jan Blunck   Introduce path_put()
2225
  	path_put(&nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2226
2227
2228
2229
  exit:
  	putname(name);
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2230
2231
2232
2233
  asmlinkage long sys_rmdir(const char __user *pathname)
  {
  	return do_rmdir(AT_FDCWD, pathname);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2234
2235
2236
2237
2238
2239
2240
2241
2242
2243
2244
  int vfs_unlink(struct inode *dir, struct dentry *dentry)
  {
  	int error = may_delete(dir, dentry, 0);
  
  	if (error)
  		return error;
  
  	if (!dir->i_op || !dir->i_op->unlink)
  		return -EPERM;
  
  	DQUOT_INIT(dir);
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2245
  	mutex_lock(&dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2246
2247
2248
2249
2250
2251
2252
  	if (d_mountpoint(dentry))
  		error = -EBUSY;
  	else {
  		error = security_inode_unlink(dir, dentry);
  		if (!error)
  			error = dir->i_op->unlink(dir, dentry);
  	}
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2253
  	mutex_unlock(&dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2254
2255
2256
  
  	/* We don't d_delete() NFS sillyrenamed files--they still exist. */
  	if (!error && !(dentry->d_flags & DCACHE_NFSFS_RENAMED)) {
ece95912d   Jan Kara   inotify: send IN_...
2257
  		fsnotify_link_count(dentry->d_inode);
e234f35c5   John McCutchan   [PATCH] inotify d...
2258
  		d_delete(dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2259
  	}
0eeca2830   Robert Love   [PATCH] inotify
2260

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2261
2262
2263
2264
2265
  	return error;
  }
  
  /*
   * Make sure that the actual truncation of the file will occur outside its
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2266
   * directory's i_mutex.  Truncate can take a long time if there is a lot of
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2267
2268
2269
   * writeout happening, and we don't want to prevent access to the directory
   * while waiting on the I/O.
   */
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2270
  static long do_unlinkat(int dfd, const char __user *pathname)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2271
2272
2273
2274
2275
2276
2277
2278
2279
2280
  {
  	int error = 0;
  	char * name;
  	struct dentry *dentry;
  	struct nameidata nd;
  	struct inode *inode = NULL;
  
  	name = getname(pathname);
  	if(IS_ERR(name))
  		return PTR_ERR(name);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2281
  	error = do_path_lookup(dfd, name, LOOKUP_PARENT, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2282
2283
2284
2285
2286
  	if (error)
  		goto exit;
  	error = -EISDIR;
  	if (nd.last_type != LAST_NORM)
  		goto exit1;
4ac913785   Jan Blunck   Embed a struct pa...
2287
  	mutex_lock_nested(&nd.path.dentry->d_inode->i_mutex, I_MUTEX_PARENT);
49705b774   Christoph Hellwig   [PATCH] sanitize ...
2288
  	dentry = lookup_hash(&nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2289
2290
2291
2292
2293
2294
2295
2296
  	error = PTR_ERR(dentry);
  	if (!IS_ERR(dentry)) {
  		/* Why not before? Because we want correct error value */
  		if (nd.last.name[nd.last.len])
  			goto slashes;
  		inode = dentry->d_inode;
  		if (inode)
  			atomic_inc(&inode->i_count);
0622753b8   Dave Hansen   [PATCH] r/o bind ...
2297
2298
2299
  		error = mnt_want_write(nd.path.mnt);
  		if (error)
  			goto exit2;
4ac913785   Jan Blunck   Embed a struct pa...
2300
  		error = vfs_unlink(nd.path.dentry->d_inode, dentry);
0622753b8   Dave Hansen   [PATCH] r/o bind ...
2301
  		mnt_drop_write(nd.path.mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2302
2303
2304
  	exit2:
  		dput(dentry);
  	}
4ac913785   Jan Blunck   Embed a struct pa...
2305
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2306
2307
2308
  	if (inode)
  		iput(inode);	/* truncate the inode here */
  exit1:
1d957f9bf   Jan Blunck   Introduce path_put()
2309
  	path_put(&nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2310
2311
2312
2313
2314
2315
2316
2317
2318
  exit:
  	putname(name);
  	return error;
  
  slashes:
  	error = !dentry->d_inode ? -ENOENT :
  		S_ISDIR(dentry->d_inode->i_mode) ? -EISDIR : -ENOTDIR;
  	goto exit2;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2319
2320
2321
2322
2323
2324
2325
2326
2327
2328
2329
2330
2331
2332
2333
  asmlinkage long sys_unlinkat(int dfd, const char __user *pathname, int flag)
  {
  	if ((flag & ~AT_REMOVEDIR) != 0)
  		return -EINVAL;
  
  	if (flag & AT_REMOVEDIR)
  		return do_rmdir(dfd, pathname);
  
  	return do_unlinkat(dfd, pathname);
  }
  
  asmlinkage long sys_unlink(const char __user *pathname)
  {
  	return do_unlinkat(AT_FDCWD, pathname);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2334
2335
2336
2337
2338
2339
2340
2341
2342
2343
2344
2345
2346
2347
2348
2349
  int vfs_symlink(struct inode *dir, struct dentry *dentry, const char *oldname, int mode)
  {
  	int error = may_create(dir, dentry, NULL);
  
  	if (error)
  		return error;
  
  	if (!dir->i_op || !dir->i_op->symlink)
  		return -EPERM;
  
  	error = security_inode_symlink(dir, dentry, oldname);
  	if (error)
  		return error;
  
  	DQUOT_INIT(dir);
  	error = dir->i_op->symlink(dir, dentry, oldname);
a74574aaf   Stephen Smalley   [PATCH] Remove se...
2350
  	if (!error)
f38aa9422   Amy Griffis   [PATCH] Pass dent...
2351
  		fsnotify_create(dir, dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2352
2353
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2354
2355
  asmlinkage long sys_symlinkat(const char __user *oldname,
  			      int newdfd, const char __user *newname)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2356
2357
2358
2359
  {
  	int error = 0;
  	char * from;
  	char * to;
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2360
2361
  	struct dentry *dentry;
  	struct nameidata nd;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2362
2363
2364
2365
2366
2367
  
  	from = getname(oldname);
  	if(IS_ERR(from))
  		return PTR_ERR(from);
  	to = getname(newname);
  	error = PTR_ERR(to);
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2368
2369
  	if (IS_ERR(to))
  		goto out_putname;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2370

6902d925d   Dave Hansen   [PATCH] r/o bind ...
2371
2372
2373
2374
2375
2376
2377
  	error = do_path_lookup(newdfd, to, LOOKUP_PARENT, &nd);
  	if (error)
  		goto out;
  	dentry = lookup_create(&nd, 0);
  	error = PTR_ERR(dentry);
  	if (IS_ERR(dentry))
  		goto out_unlock;
75c3f29de   Dave Hansen   [PATCH] r/o bind ...
2378
2379
2380
  	error = mnt_want_write(nd.path.mnt);
  	if (error)
  		goto out_dput;
4ac913785   Jan Blunck   Embed a struct pa...
2381
  	error = vfs_symlink(nd.path.dentry->d_inode, dentry, from, S_IALLUGO);
75c3f29de   Dave Hansen   [PATCH] r/o bind ...
2382
2383
  	mnt_drop_write(nd.path.mnt);
  out_dput:
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2384
2385
  	dput(dentry);
  out_unlock:
4ac913785   Jan Blunck   Embed a struct pa...
2386
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1d957f9bf   Jan Blunck   Introduce path_put()
2387
  	path_put(&nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2388
  out:
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2389
2390
  	putname(to);
  out_putname:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2391
2392
2393
  	putname(from);
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2394
2395
2396
2397
  asmlinkage long sys_symlink(const char __user *oldname, const char __user *newname)
  {
  	return sys_symlinkat(oldname, AT_FDCWD, newname);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2398
2399
2400
2401
2402
2403
2404
2405
2406
2407
2408
2409
2410
2411
2412
2413
2414
2415
2416
2417
2418
2419
2420
2421
2422
2423
2424
2425
  int vfs_link(struct dentry *old_dentry, struct inode *dir, struct dentry *new_dentry)
  {
  	struct inode *inode = old_dentry->d_inode;
  	int error;
  
  	if (!inode)
  		return -ENOENT;
  
  	error = may_create(dir, new_dentry, NULL);
  	if (error)
  		return error;
  
  	if (dir->i_sb != inode->i_sb)
  		return -EXDEV;
  
  	/*
  	 * A link to an append-only or immutable file cannot be created.
  	 */
  	if (IS_APPEND(inode) || IS_IMMUTABLE(inode))
  		return -EPERM;
  	if (!dir->i_op || !dir->i_op->link)
  		return -EPERM;
  	if (S_ISDIR(old_dentry->d_inode->i_mode))
  		return -EPERM;
  
  	error = security_inode_link(old_dentry, dir, new_dentry);
  	if (error)
  		return error;
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2426
  	mutex_lock(&old_dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2427
2428
  	DQUOT_INIT(dir);
  	error = dir->i_op->link(old_dentry, dir, new_dentry);
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2429
  	mutex_unlock(&old_dentry->d_inode->i_mutex);
e31e14ec3   Stephen Smalley   [PATCH] remove th...
2430
  	if (!error)
ece95912d   Jan Kara   inotify: send IN_...
2431
  		fsnotify_link(dir, old_dentry->d_inode, new_dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2432
2433
2434
2435
2436
2437
2438
2439
2440
2441
2442
2443
  	return error;
  }
  
  /*
   * Hardlinks are often used in delicate situations.  We avoid
   * security-related surprises by not following symlinks on the
   * newname.  --KAB
   *
   * We don't follow them on the oldname either to be compatible
   * with linux 2.0, and to avoid hard-linking to directories
   * and other special files.  --ADM
   */
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2444
  asmlinkage long sys_linkat(int olddfd, const char __user *oldname,
c04030e16   Ulrich Drepper   [PATCH] flags par...
2445
2446
  			   int newdfd, const char __user *newname,
  			   int flags)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2447
2448
2449
2450
2451
  {
  	struct dentry *new_dentry;
  	struct nameidata nd, old_nd;
  	int error;
  	char * to;
45c9b11a1   Ulrich Drepper   [PATCH] Implement...
2452
  	if ((flags & ~AT_SYMLINK_FOLLOW) != 0)
c04030e16   Ulrich Drepper   [PATCH] flags par...
2453
  		return -EINVAL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2454
2455
2456
  	to = getname(newname);
  	if (IS_ERR(to))
  		return PTR_ERR(to);
45c9b11a1   Ulrich Drepper   [PATCH] Implement...
2457
2458
2459
  	error = __user_walk_fd(olddfd, oldname,
  			       flags & AT_SYMLINK_FOLLOW ? LOOKUP_FOLLOW : 0,
  			       &old_nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2460
2461
  	if (error)
  		goto exit;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2462
  	error = do_path_lookup(newdfd, to, LOOKUP_PARENT, &nd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2463
2464
2465
  	if (error)
  		goto out;
  	error = -EXDEV;
4ac913785   Jan Blunck   Embed a struct pa...
2466
  	if (old_nd.path.mnt != nd.path.mnt)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2467
2468
2469
  		goto out_release;
  	new_dentry = lookup_create(&nd, 0);
  	error = PTR_ERR(new_dentry);
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2470
2471
  	if (IS_ERR(new_dentry))
  		goto out_unlock;
75c3f29de   Dave Hansen   [PATCH] r/o bind ...
2472
2473
2474
  	error = mnt_want_write(nd.path.mnt);
  	if (error)
  		goto out_dput;
4ac913785   Jan Blunck   Embed a struct pa...
2475
  	error = vfs_link(old_nd.path.dentry, nd.path.dentry->d_inode, new_dentry);
75c3f29de   Dave Hansen   [PATCH] r/o bind ...
2476
2477
  	mnt_drop_write(nd.path.mnt);
  out_dput:
6902d925d   Dave Hansen   [PATCH] r/o bind ...
2478
2479
  	dput(new_dentry);
  out_unlock:
4ac913785   Jan Blunck   Embed a struct pa...
2480
  	mutex_unlock(&nd.path.dentry->d_inode->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2481
  out_release:
1d957f9bf   Jan Blunck   Introduce path_put()
2482
  	path_put(&nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2483
  out:
1d957f9bf   Jan Blunck   Introduce path_put()
2484
  	path_put(&old_nd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2485
2486
2487
2488
2489
  exit:
  	putname(to);
  
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2490
2491
  asmlinkage long sys_link(const char __user *oldname, const char __user *newname)
  {
c04030e16   Ulrich Drepper   [PATCH] flags par...
2492
  	return sys_linkat(AT_FDCWD, oldname, AT_FDCWD, newname, 0);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2493
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2494
2495
2496
2497
2498
2499
2500
  /*
   * The worst of all namespace operations - renaming directory. "Perverted"
   * doesn't even start to describe it. Somebody in UCB had a heck of a trip...
   * Problems:
   *	a) we can get into loop creation. Check is done in is_subdir().
   *	b) race potential - two innocent renames can create a loop together.
   *	   That's where 4.4 screws up. Current fix: serialization on
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
2501
   *	   sb->s_vfs_rename_mutex. We might be more accurate, but that's another
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2502
2503
   *	   story.
   *	c) we have to lock _three_ objects - parents and victim (if it exists).
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2504
   *	   And that - after we got ->i_mutex on parents (until then we don't know
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2505
2506
   *	   whether the target exists).  Solution: try to be smart with locking
   *	   order for inodes.  We rely on the fact that tree topology may change
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
2507
   *	   only under ->s_vfs_rename_mutex _and_ that parent of the object we
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2508
2509
2510
   *	   move will be locked.  Thus we can rank directories by the tree
   *	   (ancestors first) and rank all non-directories after them.
   *	   That works since everybody except rename does "lock parent, lookup,
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
2511
   *	   lock child" and rename is under ->s_vfs_rename_mutex.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2512
2513
2514
2515
2516
2517
2518
2519
2520
   *	   HOWEVER, it relies on the assumption that any object with ->lookup()
   *	   has no more than 1 dentry.  If "hybrid" objects will ever appear,
   *	   we'd better make sure that there's no link(2) for them.
   *	d) some filesystems don't support opened-but-unlinked directories,
   *	   either because of layout or because they are not ready to deal with
   *	   all cases correctly. The latter will be fixed (taking this sort of
   *	   stuff into VFS), but the former is not going away. Solution: the same
   *	   trick as in rmdir().
   *	e) conversion from fhandle to dentry may come in the wrong moment - when
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2521
   *	   we are removing the target. Solution: we will have to grab ->i_mutex
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2522
   *	   in the fhandle_to_dentry code. [FIXME - current nfsfh.c relies on
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2523
   *	   ->i_mutex on parents, which works but leads to some truely excessive
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2524
2525
   *	   locking].
   */
75c96f858   Adrian Bunk   [PATCH] make some...
2526
2527
  static int vfs_rename_dir(struct inode *old_dir, struct dentry *old_dentry,
  			  struct inode *new_dir, struct dentry *new_dentry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2528
2529
2530
2531
2532
2533
2534
2535
2536
2537
2538
2539
2540
2541
2542
2543
2544
2545
2546
2547
  {
  	int error = 0;
  	struct inode *target;
  
  	/*
  	 * If we are going to change the parent - check write permissions,
  	 * we'll need to flip '..'.
  	 */
  	if (new_dir != old_dir) {
  		error = permission(old_dentry->d_inode, MAY_WRITE, NULL);
  		if (error)
  			return error;
  	}
  
  	error = security_inode_rename(old_dir, old_dentry, new_dir, new_dentry);
  	if (error)
  		return error;
  
  	target = new_dentry->d_inode;
  	if (target) {
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2548
  		mutex_lock(&target->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2549
2550
2551
2552
2553
2554
2555
2556
2557
  		dentry_unhash(new_dentry);
  	}
  	if (d_mountpoint(old_dentry)||d_mountpoint(new_dentry))
  		error = -EBUSY;
  	else 
  		error = old_dir->i_op->rename(old_dir, old_dentry, new_dir, new_dentry);
  	if (target) {
  		if (!error)
  			target->i_flags |= S_DEAD;
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2558
  		mutex_unlock(&target->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2559
2560
2561
2562
  		if (d_unhashed(new_dentry))
  			d_rehash(new_dentry);
  		dput(new_dentry);
  	}
e31e14ec3   Stephen Smalley   [PATCH] remove th...
2563
  	if (!error)
349457ccf   Mark Fasheh   [PATCH] Allow fil...
2564
2565
  		if (!(old_dir->i_sb->s_type->fs_flags & FS_RENAME_DOES_D_MOVE))
  			d_move(old_dentry,new_dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2566
2567
  	return error;
  }
75c96f858   Adrian Bunk   [PATCH] make some...
2568
2569
  static int vfs_rename_other(struct inode *old_dir, struct dentry *old_dentry,
  			    struct inode *new_dir, struct dentry *new_dentry)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2570
2571
2572
2573
2574
2575
2576
2577
2578
2579
2580
  {
  	struct inode *target;
  	int error;
  
  	error = security_inode_rename(old_dir, old_dentry, new_dir, new_dentry);
  	if (error)
  		return error;
  
  	dget(new_dentry);
  	target = new_dentry->d_inode;
  	if (target)
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2581
  		mutex_lock(&target->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2582
2583
2584
2585
2586
  	if (d_mountpoint(old_dentry)||d_mountpoint(new_dentry))
  		error = -EBUSY;
  	else
  		error = old_dir->i_op->rename(old_dir, old_dentry, new_dir, new_dentry);
  	if (!error) {
349457ccf   Mark Fasheh   [PATCH] Allow fil...
2587
  		if (!(old_dir->i_sb->s_type->fs_flags & FS_RENAME_DOES_D_MOVE))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2588
  			d_move(old_dentry, new_dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2589
2590
  	}
  	if (target)
1b1dcc1b5   Jes Sorensen   [PATCH] mutex sub...
2591
  		mutex_unlock(&target->i_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2592
2593
2594
2595
2596
2597
2598
2599
2600
  	dput(new_dentry);
  	return error;
  }
  
  int vfs_rename(struct inode *old_dir, struct dentry *old_dentry,
  	       struct inode *new_dir, struct dentry *new_dentry)
  {
  	int error;
  	int is_dir = S_ISDIR(old_dentry->d_inode->i_mode);
0eeca2830   Robert Love   [PATCH] inotify
2601
  	const char *old_name;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2602
2603
2604
2605
2606
2607
2608
2609
2610
2611
2612
2613
2614
2615
2616
2617
2618
2619
2620
2621
  
  	if (old_dentry->d_inode == new_dentry->d_inode)
   		return 0;
   
  	error = may_delete(old_dir, old_dentry, is_dir);
  	if (error)
  		return error;
  
  	if (!new_dentry->d_inode)
  		error = may_create(new_dir, new_dentry, NULL);
  	else
  		error = may_delete(new_dir, new_dentry, is_dir);
  	if (error)
  		return error;
  
  	if (!old_dir->i_op || !old_dir->i_op->rename)
  		return -EPERM;
  
  	DQUOT_INIT(old_dir);
  	DQUOT_INIT(new_dir);
0eeca2830   Robert Love   [PATCH] inotify
2622
  	old_name = fsnotify_oldname_init(old_dentry->d_name.name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2623
2624
2625
2626
2627
  	if (is_dir)
  		error = vfs_rename_dir(old_dir,old_dentry,new_dir,new_dentry);
  	else
  		error = vfs_rename_other(old_dir,old_dentry,new_dir,new_dentry);
  	if (!error) {
0eeca2830   Robert Love   [PATCH] inotify
2628
  		const char *new_name = old_dentry->d_name.name;
89204c40a   John McCutchan   [PATCH] inotify: ...
2629
  		fsnotify_move(old_dir, new_dir, old_name, new_name, is_dir,
5a190ae69   Al Viro   [PATCH] pass dent...
2630
  			      new_dentry->d_inode, old_dentry);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2631
  	}
0eeca2830   Robert Love   [PATCH] inotify
2632
  	fsnotify_oldname_free(old_name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2633
2634
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2635
2636
  static int do_rename(int olddfd, const char *oldname,
  			int newdfd, const char *newname)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2637
2638
2639
2640
2641
2642
  {
  	int error = 0;
  	struct dentry * old_dir, * new_dir;
  	struct dentry * old_dentry, *new_dentry;
  	struct dentry * trap;
  	struct nameidata oldnd, newnd;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2643
  	error = do_path_lookup(olddfd, oldname, LOOKUP_PARENT, &oldnd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2644
2645
  	if (error)
  		goto exit;
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2646
  	error = do_path_lookup(newdfd, newname, LOOKUP_PARENT, &newnd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2647
2648
2649
2650
  	if (error)
  		goto exit1;
  
  	error = -EXDEV;
4ac913785   Jan Blunck   Embed a struct pa...
2651
  	if (oldnd.path.mnt != newnd.path.mnt)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2652
  		goto exit2;
4ac913785   Jan Blunck   Embed a struct pa...
2653
  	old_dir = oldnd.path.dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2654
2655
2656
  	error = -EBUSY;
  	if (oldnd.last_type != LAST_NORM)
  		goto exit2;
4ac913785   Jan Blunck   Embed a struct pa...
2657
  	new_dir = newnd.path.dentry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2658
2659
2660
2661
  	if (newnd.last_type != LAST_NORM)
  		goto exit2;
  
  	trap = lock_rename(new_dir, old_dir);
49705b774   Christoph Hellwig   [PATCH] sanitize ...
2662
  	old_dentry = lookup_hash(&oldnd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2663
2664
2665
2666
2667
2668
2669
2670
2671
2672
2673
2674
2675
2676
2677
2678
2679
2680
2681
  	error = PTR_ERR(old_dentry);
  	if (IS_ERR(old_dentry))
  		goto exit3;
  	/* source must exist */
  	error = -ENOENT;
  	if (!old_dentry->d_inode)
  		goto exit4;
  	/* unless the source is a directory trailing slashes give -ENOTDIR */
  	if (!S_ISDIR(old_dentry->d_inode->i_mode)) {
  		error = -ENOTDIR;
  		if (oldnd.last.name[oldnd.last.len])
  			goto exit4;
  		if (newnd.last.name[newnd.last.len])
  			goto exit4;
  	}
  	/* source should not be ancestor of target */
  	error = -EINVAL;
  	if (old_dentry == trap)
  		goto exit4;
49705b774   Christoph Hellwig   [PATCH] sanitize ...
2682
  	new_dentry = lookup_hash(&newnd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2683
2684
2685
2686
2687
2688
2689
  	error = PTR_ERR(new_dentry);
  	if (IS_ERR(new_dentry))
  		goto exit4;
  	/* target should not be an ancestor of source */
  	error = -ENOTEMPTY;
  	if (new_dentry == trap)
  		goto exit5;
9079b1eb1   Dave Hansen   [PATCH] r/o bind ...
2690
2691
2692
  	error = mnt_want_write(oldnd.path.mnt);
  	if (error)
  		goto exit5;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2693
2694
  	error = vfs_rename(old_dir->d_inode, old_dentry,
  				   new_dir->d_inode, new_dentry);
9079b1eb1   Dave Hansen   [PATCH] r/o bind ...
2695
  	mnt_drop_write(oldnd.path.mnt);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2696
2697
2698
2699
2700
2701
2702
  exit5:
  	dput(new_dentry);
  exit4:
  	dput(old_dentry);
  exit3:
  	unlock_rename(new_dir, old_dir);
  exit2:
1d957f9bf   Jan Blunck   Introduce path_put()
2703
  	path_put(&newnd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2704
  exit1:
1d957f9bf   Jan Blunck   Introduce path_put()
2705
  	path_put(&oldnd.path);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2706
2707
2708
  exit:
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2709
2710
  asmlinkage long sys_renameat(int olddfd, const char __user *oldname,
  			     int newdfd, const char __user *newname)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2711
2712
2713
2714
2715
2716
2717
2718
2719
2720
2721
  {
  	int error;
  	char * from;
  	char * to;
  
  	from = getname(oldname);
  	if(IS_ERR(from))
  		return PTR_ERR(from);
  	to = getname(newname);
  	error = PTR_ERR(to);
  	if (!IS_ERR(to)) {
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2722
  		error = do_rename(olddfd, from, newdfd, to);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2723
2724
2725
2726
2727
  		putname(to);
  	}
  	putname(from);
  	return error;
  }
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2728
2729
2730
2731
  asmlinkage long sys_rename(const char __user *oldname, const char __user *newname)
  {
  	return sys_renameat(AT_FDCWD, oldname, AT_FDCWD, newname);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2732
2733
2734
2735
2736
2737
2738
2739
2740
2741
2742
2743
2744
2745
2746
2747
2748
2749
2750
2751
2752
2753
2754
2755
2756
  int vfs_readlink(struct dentry *dentry, char __user *buffer, int buflen, const char *link)
  {
  	int len;
  
  	len = PTR_ERR(link);
  	if (IS_ERR(link))
  		goto out;
  
  	len = strlen(link);
  	if (len > (unsigned) buflen)
  		len = buflen;
  	if (copy_to_user(buffer, link, len))
  		len = -EFAULT;
  out:
  	return len;
  }
  
  /*
   * A helper for ->readlink().  This should be used *ONLY* for symlinks that
   * have ->follow_link() touching nd only in nd_set_link().  Using (or not
   * using) it for any given inode is up to filesystem.
   */
  int generic_readlink(struct dentry *dentry, char __user *buffer, int buflen)
  {
  	struct nameidata nd;
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2757
  	void *cookie;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2758
  	nd.depth = 0;
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2759
2760
2761
  	cookie = dentry->d_inode->i_op->follow_link(dentry, &nd);
  	if (!IS_ERR(cookie)) {
  		int res = vfs_readlink(dentry, buffer, buflen, nd_get_link(&nd));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2762
  		if (dentry->d_inode->i_op->put_link)
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2763
2764
  			dentry->d_inode->i_op->put_link(dentry, &nd, cookie);
  		cookie = ERR_PTR(res);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2765
  	}
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2766
  	return PTR_ERR(cookie);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2767
2768
2769
2770
2771
2772
2773
2774
2775
2776
2777
2778
  }
  
  int vfs_follow_link(struct nameidata *nd, const char *link)
  {
  	return __vfs_follow_link(nd, link);
  }
  
  /* get the link contents into pagecache */
  static char *page_getlink(struct dentry * dentry, struct page **ppage)
  {
  	struct page * page;
  	struct address_space *mapping = dentry->d_inode->i_mapping;
090d2b185   Pekka Enberg   [PATCH] read_mapp...
2779
  	page = read_mapping_page(mapping, 0, NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2780
  	if (IS_ERR(page))
6fe6900e1   Nick Piggin   mm: make read_cac...
2781
  		return (char*)page;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2782
2783
  	*ppage = page;
  	return kmap(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2784
2785
2786
2787
2788
2789
2790
2791
2792
2793
2794
2795
2796
  }
  
  int page_readlink(struct dentry *dentry, char __user *buffer, int buflen)
  {
  	struct page *page = NULL;
  	char *s = page_getlink(dentry, &page);
  	int res = vfs_readlink(dentry,buffer,buflen,s);
  	if (page) {
  		kunmap(page);
  		page_cache_release(page);
  	}
  	return res;
  }
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2797
  void *page_follow_link_light(struct dentry *dentry, struct nameidata *nd)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2798
  {
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2799
  	struct page *page = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2800
  	nd_set_link(nd, page_getlink(dentry, &page));
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2801
  	return page;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2802
  }
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2803
  void page_put_link(struct dentry *dentry, struct nameidata *nd, void *cookie)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2804
  {
cc314eef0   Linus Torvalds   Fix nasty ncpfs s...
2805
2806
2807
  	struct page *page = cookie;
  
  	if (page) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2808
2809
  		kunmap(page);
  		page_cache_release(page);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2810
2811
  	}
  }
0adb25d2e   Kirill Korotaev   [PATCH] ext3: ext...
2812
2813
  int __page_symlink(struct inode *inode, const char *symname, int len,
  		gfp_t gfp_mask)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2814
2815
  {
  	struct address_space *mapping = inode->i_mapping;
0adb25d2e   Kirill Korotaev   [PATCH] ext3: ext...
2816
  	struct page *page;
afddba49d   Nick Piggin   fs: introduce wri...
2817
  	void *fsdata;
beb497ab4   Dmitriy Monakhov   [PATCH] __page_sy...
2818
  	int err;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2819
  	char *kaddr;
7e53cac41   NeilBrown   [PATCH] Honour AO...
2820
  retry:
afddba49d   Nick Piggin   fs: introduce wri...
2821
2822
  	err = pagecache_write_begin(NULL, mapping, 0, len-1,
  				AOP_FLAG_UNINTERRUPTIBLE, &page, &fsdata);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2823
  	if (err)
afddba49d   Nick Piggin   fs: introduce wri...
2824
  		goto fail;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2825
2826
2827
  	kaddr = kmap_atomic(page, KM_USER0);
  	memcpy(kaddr, symname, len-1);
  	kunmap_atomic(kaddr, KM_USER0);
afddba49d   Nick Piggin   fs: introduce wri...
2828
2829
2830
  
  	err = pagecache_write_end(NULL, mapping, 0, len-1, len-1,
  							page, fsdata);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2831
2832
  	if (err < 0)
  		goto fail;
afddba49d   Nick Piggin   fs: introduce wri...
2833
2834
  	if (err < len-1)
  		goto retry;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2835
2836
  	mark_inode_dirty(inode);
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2837
2838
2839
  fail:
  	return err;
  }
0adb25d2e   Kirill Korotaev   [PATCH] ext3: ext...
2840
2841
2842
2843
2844
  int page_symlink(struct inode *inode, const char *symname, int len)
  {
  	return __page_symlink(inode, symname, len,
  			mapping_gfp_mask(inode->i_mapping));
  }
92e1d5be9   Arjan van de Ven   [PATCH] mark stru...
2845
  const struct inode_operations page_symlink_inode_operations = {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2846
2847
2848
2849
2850
2851
  	.readlink	= generic_readlink,
  	.follow_link	= page_follow_link_light,
  	.put_link	= page_put_link,
  };
  
  EXPORT_SYMBOL(__user_walk);
5590ff0d5   Ulrich Drepper   [PATCH] vfs: *at ...
2852
  EXPORT_SYMBOL(__user_walk_fd);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2853
2854
2855
2856
2857
  EXPORT_SYMBOL(follow_down);
  EXPORT_SYMBOL(follow_up);
  EXPORT_SYMBOL(get_write_access); /* binfmt_aout */
  EXPORT_SYMBOL(getname);
  EXPORT_SYMBOL(lock_rename);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2858
2859
2860
2861
  EXPORT_SYMBOL(lookup_one_len);
  EXPORT_SYMBOL(page_follow_link_light);
  EXPORT_SYMBOL(page_put_link);
  EXPORT_SYMBOL(page_readlink);
0adb25d2e   Kirill Korotaev   [PATCH] ext3: ext...
2862
  EXPORT_SYMBOL(__page_symlink);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2863
2864
2865
  EXPORT_SYMBOL(page_symlink);
  EXPORT_SYMBOL(page_symlink_inode_operations);
  EXPORT_SYMBOL(path_lookup);
16f182002   Josef 'Jeff' Sipek   fs: introduce vfs...
2866
  EXPORT_SYMBOL(vfs_path_lookup);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2867
  EXPORT_SYMBOL(permission);
e4543eddf   Christoph Hellwig   [PATCH] add a vfs...
2868
  EXPORT_SYMBOL(vfs_permission);
8c744fb83   Christoph Hellwig   [PATCH] add a fil...
2869
  EXPORT_SYMBOL(file_permission);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2870
2871
2872
2873
2874
2875
2876
2877
2878
2879
2880
2881
2882
2883
  EXPORT_SYMBOL(unlock_rename);
  EXPORT_SYMBOL(vfs_create);
  EXPORT_SYMBOL(vfs_follow_link);
  EXPORT_SYMBOL(vfs_link);
  EXPORT_SYMBOL(vfs_mkdir);
  EXPORT_SYMBOL(vfs_mknod);
  EXPORT_SYMBOL(generic_permission);
  EXPORT_SYMBOL(vfs_readlink);
  EXPORT_SYMBOL(vfs_rename);
  EXPORT_SYMBOL(vfs_rmdir);
  EXPORT_SYMBOL(vfs_symlink);
  EXPORT_SYMBOL(vfs_unlink);
  EXPORT_SYMBOL(dentry_unhash);
  EXPORT_SYMBOL(generic_readlink);