Blame view

fs/super.c 22 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
  /*
   *  linux/fs/super.c
   *
   *  Copyright (C) 1991, 1992  Linus Torvalds
   *
   *  super.c contains code to handle: - mount structures
   *                                   - super-block tables
   *                                   - filesystem drivers list
   *                                   - mount system call
   *                                   - umount system call
   *                                   - ustat system call
   *
   * GK 2/5/95  -  Changed to support mounting the root fs via NFS
   *
   *  Added kerneld support: Jacques Gelinas and Bjorn Ekwall
   *  Added change_root: Werner Almesberger & Hans Lermen, Feb '96
   *  Added options to /proc/mounts:
96de0e252   Jan Engelhardt   Convert files to ...
18
   *    Torbjörn Lindh (torbjorn.lindh@gopta.se), April 14, 1996.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
   *  Added devfs support: Richard Gooch <rgooch@atnf.csiro.au>, 13-JAN-1998
   *  Heavily rewritten for 'one fs - one tree' dcache architecture. AV, Mar 2000
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
  #include <linux/module.h>
  #include <linux/slab.h>
  #include <linux/init.h>
  #include <linux/smp_lock.h>
  #include <linux/acct.h>
  #include <linux/blkdev.h>
  #include <linux/quotaops.h>
  #include <linux/namei.h>
  #include <linux/buffer_head.h>		/* for fsync_super() */
  #include <linux/mount.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
  #include <linux/vfs.h>
  #include <linux/writeback.h>		/* for the emergency remount stuff */
  #include <linux/idr.h>
  #include <linux/kobject.h>
353ab6e97   Ingo Molnar   [PATCH] sem2mutex...
38
  #include <linux/mutex.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
39
  #include <asm/uaccess.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
40
41
42
43
44
  /* List of all superblocks; entries are linked through super_block.s_list. */
  LIST_HEAD(super_blocks);
  /* Held in this file around walks of super_blocks and changes to s_count. */
  DEFINE_SPINLOCK(sb_lock);
  
  /**
   *	alloc_super	-	create new superblock
fe2bbc483   Henrik Kretzschmar   [PATCH] add missi...
45
   *	@type:	filesystem type superblock should belong to
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
46
47
48
49
   *
   *	Allocates and initializes a new &struct super_block.  alloc_super()
   *	returns a pointer to the new superblock or %NULL if allocation had failed.
   */
cf5162499   Ingo Molnar   [PATCH] lockdep: ...
50
  static struct super_block *alloc_super(struct file_system_type *type)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
51
  {
11b0b5abb   Oliver Neukum   [PATCH] use kzall...
52
  	struct super_block *s = kzalloc(sizeof(struct super_block),  GFP_USER);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
53
54
55
  	static struct super_operations default_op;
  
  	if (s) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
56
57
58
59
60
61
62
  		if (security_sb_alloc(s)) {
  			kfree(s);
  			s = NULL;
  			goto out;
  		}
  		INIT_LIST_HEAD(&s->s_dirty);
  		INIT_LIST_HEAD(&s->s_io);
0e0f4fc22   Ken Chen   writeback: fix pe...
63
  		INIT_LIST_HEAD(&s->s_more_io);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
64
65
66
67
68
  		INIT_LIST_HEAD(&s->s_files);
  		INIT_LIST_HEAD(&s->s_instances);
  		INIT_HLIST_HEAD(&s->s_anon);
  		INIT_LIST_HEAD(&s->s_inodes);
  		init_rwsem(&s->s_umount);
7892f2f48   Ingo Molnar   [PATCH] mutex sub...
69
  		mutex_init(&s->s_lock);
897c6ff95   Arjan van de Ven   [PATCH] lockdep: ...
70
  		lockdep_set_class(&s->s_umount, &type->s_umount_key);
cf5162499   Ingo Molnar   [PATCH] lockdep: ...
71
72
73
74
75
76
  		/*
  		 * The locking rules for s_lock are up to the
  		 * filesystem. For example ext3fs has different
  		 * lock ordering than usbfs:
  		 */
  		lockdep_set_class(&s->s_lock, &type->s_lock_key);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
77
78
79
  		down_write(&s->s_umount);
  		s->s_count = S_BIAS;
  		atomic_set(&s->s_active, 1);
a11f3a057   Arjan van de Ven   [PATCH] sem2mutex...
80
  		mutex_init(&s->s_vfs_rename_mutex);
d3be915fc   Ingo Molnar   [PATCH] sem2mutex...
81
82
  		mutex_init(&s->s_dquot.dqio_mutex);
  		mutex_init(&s->s_dquot.dqonoff_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
  		init_rwsem(&s->s_dquot.dqptr_sem);
  		init_waitqueue_head(&s->s_wait_unfrozen);
  		s->s_maxbytes = MAX_NON_LFS;
  		s->dq_op = sb_dquot_ops;
  		s->s_qcop = sb_quotactl_ops;
  		s->s_op = &default_op;
  		s->s_time_gran = 1000000000;
  	}
  out:
  	return s;
  }
  
  /**
   *	destroy_super	-	frees a superblock
   *	@s: superblock to free
   *
   *	Frees a superblock.
   */
  static inline void destroy_super(struct super_block *s)
  {
  	security_sb_free(s);
79c0b2df7   Miklos Szeredi   add filesystem su...
104
  	kfree(s->s_subtype);
b3b304a23   Miklos Szeredi   mount options: ad...
105
  	kfree(s->s_options);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
  	kfree(s);
  }
  
  /* Superblock refcounting  */
  
  /*
   * Drop a superblock's refcount.  Returns non-zero if the superblock was
   * destroyed.  The caller must hold sb_lock.
   */
  int __put_super(struct super_block *sb)
  {
  	/* Still referenced after dropping ours: nothing more to do. */
  	if (--sb->s_count)
  		return 0;

  	/* That was the last reference. */
  	destroy_super(sb);
  	return 1;
  }
  
  /*
   * Drop a superblock's refcount.
   * Returns non-zero if the superblock is about to be destroyed and
   * at least is already removed from super_blocks list, so if we are
   * making a loop through super blocks then we need to restart.
   * The caller must hold sb_lock.
   */
  int __put_super_and_need_restart(struct super_block *sb)
  {
  	if (!list_empty(&sb->s_list)) {
  		/* can't be the last, since s_list is still in use */
  		sb->s_count--;
  		BUG_ON(sb->s_count == 0);
  		return 0;
  	}

  	/*
  	 * Raced with generic_shutdown_super(): the super block has been
  	 * removed from the list, so the caller's walk must restart.
  	 */
  	__put_super(sb);
  	return 1;
  }
  
  /**
   *	put_super	-	drop a temporary reference to superblock
   *	@sb: superblock in question
   *
   *	Drops a temporary reference, frees superblock if there's no
   *	references left.
   */
  static void put_super(struct super_block *sb)
  {
  	/* __put_super() requires sb_lock; take it just for the drop. */
  	spin_lock(&sb_lock);
  	/* The "was destroyed" return value is not needed here. */
  	__put_super(sb);
  	spin_unlock(&sb_lock);
  }
  
  
  /**
   *	deactivate_super	-	drop an active reference to superblock
   *	@s: superblock to deactivate
   *
   *	Drops an active reference to superblock, acquiring a temporary one if
   *	there is no active references left.  In that case we lock superblock,
   *	tell fs driver to shut it down and drop the temporary reference we
   *	had just acquired.
   */
  void deactivate_super(struct super_block *s)
  {
  	struct file_system_type *fs = s->s_type;

  	/* Not the last active reference: just the decrement, no lock taken. */
  	if (!atomic_dec_and_lock(&s->s_active, &sb_lock))
  		return;

  	/*
  	 * Last active reference is gone (sb_lock is held here).  Remove the
  	 * bias from s_count but keep one temporary reference for ourselves.
  	 */
  	s->s_count -= S_BIAS-1;
  	spin_unlock(&sb_lock);

  	DQUOT_OFF(s);
  	down_write(&s->s_umount);
  	fs->kill_sb(s);
  	put_filesystem(fs);

  	/* Drop the temporary reference kept above. */
  	put_super(s);
  }
  
  EXPORT_SYMBOL(deactivate_super);
  
  /**
   *	grab_super - acquire an active reference
   *	@s: reference we are trying to make active
   *
   *	Tries to acquire an active reference.  grab_super() is used when we
   * 	had just found a superblock in super_blocks or fs_type->fs_supers
   *	and want to turn it into a full-blown active reference.  grab_super()
   *	is called with sb_lock held and drops it.  Returns 1 in case of
   *	success, 0 if we had failed (superblock contents was already dead or
   *	dying when grab_super() had been called).
   */
9c4dbee79   Josh Triplett   [PATCH] fs: add l...
198
  static int grab_super(struct super_block *s) __releases(sb_lock)
  {
  	int alive = 0;

  	/* Temporary reference so s stays around once sb_lock is dropped. */
  	s->s_count++;
  	spin_unlock(&sb_lock);
  	down_write(&s->s_umount);

  	if (s->s_root) {
  		spin_lock(&sb_lock);
  		alive = s->s_count > S_BIAS;
  		if (alive) {
  			/* Trade the temporary reference for an active one. */
  			atomic_inc(&s->s_active);
  			s->s_count--;
  		}
  		spin_unlock(&sb_lock);
  	}
  	if (alive)
  		return 1;	/* s_umount stays held for writing */

  	/* Dead or dying superblock: back out and let the caller retry. */
  	up_write(&s->s_umount);
  	put_super(s);
  	yield();
  	return 0;
  }
cf9a2ae8d   David Howells   [PATCH] BLOCK: Mo...
218
  /*
914e26379   Al Viro   [PATCH] severing ...
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
   * Superblock locking.  We really ought to get rid of these two.
   */
  /* Take the per-superblock s_lock mutex, calling get_fs_excl() first. */
  void lock_super(struct super_block * sb)
  {
  	get_fs_excl();
  	mutex_lock(&sb->s_lock);
  }
  
  /*
   * Counterpart of lock_super(): calls put_fs_excl() and then releases the
   * s_lock mutex.
   */
  void unlock_super(struct super_block * sb)
  {
  	put_fs_excl();
  	mutex_unlock(&sb->s_lock);
  }
  
  EXPORT_SYMBOL(lock_super);
  EXPORT_SYMBOL(unlock_super);
  
  /*
cf9a2ae8d   David Howells   [PATCH] BLOCK: Mo...
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
   * Write out and wait upon all dirty data associated with this
   * superblock.  Filesystem data as well as the underlying block
   * device.  Takes the superblock lock.  Requires a second blkdev
   * flush by the caller to complete the operation.
   */
  void __fsync_super(struct super_block *sb)
  {
  	sync_inodes_sb(sb, 0);
  	DQUOT_SYNC(sb);
  	lock_super(sb);
  	if (sb->s_dirt && sb->s_op->write_super)
  		sb->s_op->write_super(sb);
  	unlock_super(sb);
  	if (sb->s_op->sync_fs)
  		sb->s_op->sync_fs(sb, 1);
  	sync_blockdev(sb->s_bdev);
  	sync_inodes_sb(sb, 1);
  }
  
  /*
   * Write out and wait upon all dirty data associated with this
   * superblock.  Filesystem data as well as the underlying block
   * device.  Takes the superblock lock.
   */
  int fsync_super(struct super_block *sb)
  {
  	__fsync_super(sb);
  	/* Second block-device flush; its result is what the caller gets. */
  	return sync_blockdev(sb->s_bdev);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
266
267
268
269
270
271
272
273
274
  /**
   *	generic_shutdown_super	-	common helper for ->kill_sb()
   *	@sb: superblock to kill
   *
   *	generic_shutdown_super() does all fs-independent work on superblock
   *	shutdown.  Typical ->kill_sb() should pick all fs-specific objects
   *	that need destruction out of superblock, call generic_shutdown_super()
   *	and release aforementioned objects.  Note: dentries and inodes _are_
   *	taken care of and do not need specific handling.
c636ebdb1   David Howells   [PATCH] VFS: Dest...
275
276
277
278
   *
   *	Upon calling this function, the filesystem may no longer alter or
   *	rearrange the set of dentries belonging to this super_block, nor may it
   *	change the attachments of dentries to inodes.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
279
280
281
   */
  void generic_shutdown_super(struct super_block *sb)
  {
ee9b6d61a   Josef 'Jeff' Sipek   [PATCH] Mark stru...
282
  	const struct super_operations *sop = sb->s_op;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
283

c636ebdb1   David Howells   [PATCH] VFS: Dest...
284
285
  	if (sb->s_root) {
  		shrink_dcache_for_umount(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
286
287
288
289
290
291
292
293
294
295
296
297
298
299
  		fsync_super(sb);
  		lock_super(sb);
  		sb->s_flags &= ~MS_ACTIVE;
  		/* bad name - it should be evict_inodes() */
  		invalidate_inodes(sb);
  		lock_kernel();
  
  		if (sop->write_super && sb->s_dirt)
  			sop->write_super(sb);
  		if (sop->put_super)
  			sop->put_super(sb);
  
  		/* Forget any remaining inodes */
  		if (invalidate_inodes(sb)) {
7b4fe29e0   Dave Jones   [PATCH] More info...
300
301
302
303
  			printk("VFS: Busy inodes after unmount of %s. "
  			   "Self-destruct in 5 seconds.  Have a nice day...
  ",
  			   sb->s_id);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
  		}
  
  		unlock_kernel();
  		unlock_super(sb);
  	}
  	spin_lock(&sb_lock);
  	/* should be initialized for __put_super_and_need_restart() */
  	list_del_init(&sb->s_list);
  	list_del(&sb->s_instances);
  	spin_unlock(&sb_lock);
  	up_write(&sb->s_umount);
  }
  
  EXPORT_SYMBOL(generic_shutdown_super);
  
  /**
   *	sget	-	find or create a superblock
   *	@type:	filesystem type superblock should belong to
   *	@test:	comparison callback
   *	@set:	setup callback
   *	@data:	argument to each of them
   */
  struct super_block *sget(struct file_system_type *type,
  			int (*test)(struct super_block *,void *),
  			int (*set)(struct super_block *,void *),
  			void *data)
  {
  	struct super_block *s = NULL;
d47301271   Matthias Kaehlcke   fs/super.c: use l...
332
  	struct super_block *old;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
333
334
335
336
  	int err;
  
  retry:
  	spin_lock(&sb_lock);
d47301271   Matthias Kaehlcke   fs/super.c: use l...
337
338
339
340
341
342
343
344
345
346
  	if (test) {
  		list_for_each_entry(old, &type->fs_supers, s_instances) {
  			if (!test(old, data))
  				continue;
  			if (!grab_super(old))
  				goto retry;
  			if (s)
  				destroy_super(s);
  			return old;
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
347
348
349
  	}
  	if (!s) {
  		spin_unlock(&sb_lock);
cf5162499   Ingo Molnar   [PATCH] lockdep: ...
350
  		s = alloc_super(type);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
  		if (!s)
  			return ERR_PTR(-ENOMEM);
  		goto retry;
  	}
  		
  	err = set(s, data);
  	if (err) {
  		spin_unlock(&sb_lock);
  		destroy_super(s);
  		return ERR_PTR(err);
  	}
  	s->s_type = type;
  	strlcpy(s->s_id, type->name, sizeof(s->s_id));
  	list_add_tail(&s->s_list, &super_blocks);
  	list_add(&s->s_instances, &type->fs_supers);
  	spin_unlock(&sb_lock);
  	get_filesystem(type);
  	return s;
  }
  
  EXPORT_SYMBOL(sget);
  
  /*
   * Release a superblock as returned by get_super()/user_get_super(): those
   * return it with s_umount held for reading and s_count raised; both are
   * undone here.
   */
  void drop_super(struct super_block *sb)
  {
  	up_read(&sb->s_umount);
  	put_super(sb);
  }
  
  EXPORT_SYMBOL(drop_super);
  
  static inline void write_super(struct super_block *sb)
  {
  	lock_super(sb);
  	/* Needs a root, a dirty superblock and a ->write_super method. */
  	if (sb->s_root && sb->s_dirt && sb->s_op->write_super)
  		sb->s_op->write_super(sb);
  	unlock_super(sb);
  }
  
  /*
   * Note: check the dirty flag before waiting, so we don't
   * hold up the sync while mounting a device. (The newly
   * mounted device won't need syncing.)
   */
  void sync_supers(void)
  {
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
397
  	struct super_block *sb;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
398
  	spin_lock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
399
400
  restart:
  	list_for_each_entry(sb, &super_blocks, s_list) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
401
402
403
404
405
  		if (sb->s_dirt) {
  			sb->s_count++;
  			spin_unlock(&sb_lock);
  			down_read(&sb->s_umount);
  			write_super(sb);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
406
407
408
409
410
411
  			up_read(&sb->s_umount);
  			spin_lock(&sb_lock);
  			if (__put_super_and_need_restart(sb))
  				goto restart;
  		}
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
412
413
414
415
  	spin_unlock(&sb_lock);
  }
  
  /*
3a4fa0a25   Robert P. J. Day   Fix misspellings ...
416
   * Call the ->sync_fs super_op against all filesystems which are r/w and
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
417
418
419
420
421
422
423
   * which implement it.
   *
   * This operation is careful to avoid the livelock which could easily happen
   * if two or more filesystems are being continuously dirtied.  s_need_sync_fs
   * is used only here.  We set it against all filesystems and then clear it as
   * we sync them.  So redirtied filesystems are skipped.
   *
3a4fa0a25   Robert P. J. Day   Fix misspellings ...
424
   * But if process A is currently running sync_filesystems and then process B
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
425
426
427
428
429
430
431
432
433
   * calls sync_filesystems as well, process B will set all the s_need_sync_fs
   * flags again, which will cause process A to resync everything.  Fix that with
   * a local mutex.
   *
   * (Fabian) Avoid sync_fs with clean fs & wait mode 0
   */
  void sync_filesystems(int wait)
  {
  	struct super_block *sb;
353ab6e97   Ingo Molnar   [PATCH] sem2mutex...
434
  	static DEFINE_MUTEX(mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
435

353ab6e97   Ingo Molnar   [PATCH] sem2mutex...
436
  	mutex_lock(&mutex);		/* Could be down_interruptible */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
437
  	spin_lock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
438
  	list_for_each_entry(sb, &super_blocks, s_list) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
439
440
441
442
443
444
  		if (!sb->s_op->sync_fs)
  			continue;
  		if (sb->s_flags & MS_RDONLY)
  			continue;
  		sb->s_need_sync_fs = 1;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
445
446
  
  restart:
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
447
  	list_for_each_entry(sb, &super_blocks, s_list) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
448
449
450
451
452
453
454
455
456
457
  		if (!sb->s_need_sync_fs)
  			continue;
  		sb->s_need_sync_fs = 0;
  		if (sb->s_flags & MS_RDONLY)
  			continue;	/* hm.  Was remounted r/o meanwhile */
  		sb->s_count++;
  		spin_unlock(&sb_lock);
  		down_read(&sb->s_umount);
  		if (sb->s_root && (wait || sb->s_dirt))
  			sb->s_op->sync_fs(sb, wait);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
458
459
460
461
462
  		up_read(&sb->s_umount);
  		/* restart only when sb is no longer on the list */
  		spin_lock(&sb_lock);
  		if (__put_super_and_need_restart(sb))
  			goto restart;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
463
464
  	}
  	spin_unlock(&sb_lock);
353ab6e97   Ingo Molnar   [PATCH] sem2mutex...
465
  	mutex_unlock(&mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
466
467
468
469
470
471
472
473
474
475
476
477
  }
  
  /**
   *	get_super - get the superblock of a device
   *	@bdev: device to get the superblock for
   *	
   *	Scans the superblock list and finds the superblock of the file system
   *	mounted on the device given. %NULL is returned if no match is found.
   */
  
  struct super_block * get_super(struct block_device *bdev)
  {
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
478
  	struct super_block *sb;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
479
480
  	if (!bdev)
  		return NULL;
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
481

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
482
  	spin_lock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
483
484
485
486
  rescan:
  	list_for_each_entry(sb, &super_blocks, s_list) {
  		if (sb->s_bdev == bdev) {
  			sb->s_count++;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
487
  			spin_unlock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
488
489
490
491
492
493
494
495
  			down_read(&sb->s_umount);
  			if (sb->s_root)
  				return sb;
  			up_read(&sb->s_umount);
  			/* restart only when sb is no longer on the list */
  			spin_lock(&sb_lock);
  			if (__put_super_and_need_restart(sb))
  				goto rescan;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
496
497
498
499
500
501
502
503
504
505
  		}
  	}
  	spin_unlock(&sb_lock);
  	return NULL;
  }
  
  EXPORT_SYMBOL(get_super);
   
  /*
   * Like get_super(), but the superblock is looked up by its s_dev number.
   * On success it is returned with s_umount held for reading and s_count
   * raised; NULL means no live superblock has that device number.
   */
  struct super_block * user_get_super(dev_t dev)
  {
  	struct super_block *sb;

  	spin_lock(&sb_lock);
  rescan:
  	list_for_each_entry(sb, &super_blocks, s_list) {
  		if (sb->s_dev != dev)
  			continue;

  		sb->s_count++;
  		spin_unlock(&sb_lock);
  		down_read(&sb->s_umount);
  		if (sb->s_root)
  			return sb;
  		up_read(&sb->s_umount);

  		/* restart only when sb is no longer on the list */
  		spin_lock(&sb_lock);
  		if (__put_super_and_need_restart(sb))
  			goto rescan;
  	}
  	spin_unlock(&sb_lock);
  	return NULL;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
527
528
529
530
531
532
533
534
535
536
  /*
   * ustat system call: look up the superblock for @dev, query it with
   * vfs_statfs() and copy the free block/inode counts out to @ubuf.
   * Returns 0, -EINVAL if no superblock matches, the vfs_statfs() error,
   * or -EFAULT if the copy to user space fails.
   */
  asmlinkage long sys_ustat(unsigned dev, struct ustat __user * ubuf)
  {
  	struct super_block *sb;
  	struct kstatfs stats;
  	struct ustat reply;
  	int err;

  	sb = user_get_super(new_decode_dev(dev));
  	if (!sb)
  		return -EINVAL;

  	err = vfs_statfs(sb->s_root, &stats);
  	drop_super(sb);
  	if (err)
  		return err;

  	/* Only two fields are filled in; everything else stays zero. */
  	memset(&reply, 0, sizeof(reply));
  	reply.f_tfree = stats.f_bfree;
  	reply.f_tinode = stats.f_ffree;

  	if (copy_to_user(ubuf, &reply, sizeof(reply)))
  		return -EFAULT;
  	return 0;
  }
  
  /**
   *	mark_files_ro
   *	@sb: superblock in question
   *
   *	All files are marked read/only.  We don't care about pending
   *	delete files so this should be used in 'force' mode only
   */
  
  static void mark_files_ro(struct super_block *sb)
  {
  	struct file *f;
  
  	file_list_lock();
2f5120166   Eric Dumazet   [PATCH] reduce si...
564
  	list_for_each_entry(f, &sb->s_files, f_u.fu_list) {
0f7fc9e4d   Josef "Jeff" Sipek   [PATCH] VFS: chan...
565
  		if (S_ISREG(f->f_path.dentry->d_inode->i_mode) && file_count(f))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
  			f->f_mode &= ~FMODE_WRITE;
  	}
  	file_list_unlock();
  }
  
  /**
   *	do_remount_sb - asks filesystem to change mount options.
   *	@sb:	superblock in question
   *	@flags:	numeric part of options
   *	@data:	the rest of options
   *      @force: whether or not to force the change
   *
   *	Alters the mount options of a mounted file system.
   */
  int do_remount_sb(struct super_block *sb, int flags, void *data, int force)
  {
  	/* Captured before ->remount_fs() gets a chance to modify flags. */
  	const int want_ro = flags & MS_RDONLY;

  #ifdef CONFIG_BLOCK
  	/* A read/write mount of a read-only block device is refused. */
  	if (!want_ro && bdev_read_only(sb->s_bdev))
  		return -EACCES;
  #endif
  	if (want_ro)
  		acct_auto_close(sb);
  	shrink_dcache_sb(sb);
  	fsync_super(sb);

  	/* If we are remounting RDONLY and current sb is read/write,
  	   make sure there are no rw files opened */
  	if (want_ro && !(sb->s_flags & MS_RDONLY)) {
  		if (!force && !fs_may_remount_ro(sb))
  			return -EBUSY;
  		if (force)
  			mark_files_ro(sb);
  		DQUOT_OFF(sb);
  	}

  	if (sb->s_op->remount_fs) {
  		int retval;

  		lock_super(sb);
  		retval = sb->s_op->remount_fs(sb, &flags, data);
  		unlock_super(sb);
  		if (retval)
  			return retval;
  	}

  	/* Only the bits in MS_RMT_MASK are taken over from flags. */
  	sb->s_flags = (sb->s_flags & ~MS_RMT_MASK) | (flags & MS_RMT_MASK);
  	return 0;
  }
  
  /*
   * Force every mounted, writable, block-device-backed superblock read-only.
   * Passed to pdflush_operation() by emergency_remount(); @foo is unused.
   */
  static void do_emergency_remount(unsigned long foo)
  {
  	struct super_block *sb;

  	spin_lock(&sb_lock);
  restart:
  	list_for_each_entry(sb, &super_blocks, s_list) {
  		/* Pin sb while sb_lock is dropped. */
  		sb->s_count++;
  		spin_unlock(&sb_lock);
  		down_read(&sb->s_umount);
  		if (sb->s_root && sb->s_bdev && !(sb->s_flags & MS_RDONLY)) {
  			/*
  			 * ->remount_fs needs lock_kernel().
  			 *
  			 * What lock protects sb->s_flags??
  			 */
  			lock_kernel();
  			do_remount_sb(sb, MS_RDONLY, NULL, 1);
  			unlock_kernel();
  		}
  		up_read(&sb->s_umount);

  		/*
  		 * Drop our reference under sb_lock.  If sb was taken off
  		 * super_blocks meanwhile (it may even be freed by this put),
  		 * its s_list can no longer be used to continue the walk, so
  		 * start over; superblocks already made read-only are skipped
  		 * by the check above.
  		 */
  		spin_lock(&sb_lock);
  		if (__put_super_and_need_restart(sb))
  			goto restart;
  	}
  	spin_unlock(&sb_lock);
  	printk("Emergency Remount complete\n");
  }
  
  /*
   * Hand do_emergency_remount() to pdflush_operation() with argument 0.
   * The return value of pdflush_operation() is ignored.
   */
  void emergency_remount(void)
  {
  	pdflush_operation(do_emergency_remount, 0);
  }
  
  /*
   * Unnamed block devices are dummy devices used by virtual
   * filesystems which don't use real block-devices.  -- jrs
   */
  
  /* Source of the ids that set_anon_super() turns into minor numbers for s_dev. */
  static struct idr unnamed_dev_idr;
  static DEFINE_SPINLOCK(unnamed_dev_lock);/* protects the above */
  
  int set_anon_super(struct super_block *s, void *data)
  {
  	int dev;
  	int error;
  
   retry:
  	if (idr_pre_get(&unnamed_dev_idr, GFP_ATOMIC) == 0)
  		return -ENOMEM;
  	spin_lock(&unnamed_dev_lock);
  	error = idr_get_new(&unnamed_dev_idr, NULL, &dev);
  	spin_unlock(&unnamed_dev_lock);
  	if (error == -EAGAIN)
  		/* We raced and lost with another CPU. */
  		goto retry;
  	else if (error)
  		return -EAGAIN;
  
  	if ((dev & MAX_ID_MASK) == (1 << MINORBITS)) {
  		spin_lock(&unnamed_dev_lock);
  		idr_remove(&unnamed_dev_idr, dev);
  		spin_unlock(&unnamed_dev_lock);
  		return -EMFILE;
  	}
  	s->s_dev = MKDEV(0, dev & MINORMASK);
  	return 0;
  }
  
  EXPORT_SYMBOL(set_anon_super);
  
  /*
   * Shut down a superblock set up by set_anon_super() and return its
   * minor number to unnamed_dev_idr.
   */
  void kill_anon_super(struct super_block *sb)
  {
  	int minor;

  	/* Read the id before the superblock is shut down. */
  	minor = MINOR(sb->s_dev);
  	generic_shutdown_super(sb);

  	spin_lock(&unnamed_dev_lock);
  	idr_remove(&unnamed_dev_idr, minor);
  	spin_unlock(&unnamed_dev_lock);
  }
  
  EXPORT_SYMBOL(kill_anon_super);
  
  /* Boot-time (__init) setup of the idr used by set_anon_super(). */
  void __init unnamed_dev_init(void)
  {
  	idr_init(&unnamed_dev_idr);
  }
  
  /*
   * Like kill_anon_super(), but first calls d_genocide() on the root
   * dentry when the superblock has one.
   */
  void kill_litter_super(struct super_block *sb)
  {
  	if (sb->s_root)
  		d_genocide(sb->s_root);
  	kill_anon_super(sb);
  }
  
  EXPORT_SYMBOL(kill_litter_super);
9361401eb   David Howells   [PATCH] BLOCK: Ma...
708
  #ifdef CONFIG_BLOCK
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
709
710
711
712
713
714
715
716
717
718
719
  /*
   * sget() "set" callback used by get_sb_bdev(): @data is the block device;
   * record it in the superblock together with its device number.
   * Always returns 0.
   */
  static int set_bdev_super(struct super_block *s, void *data)
  {
  	s->s_bdev = data;
  	s->s_dev = s->s_bdev->bd_dev;
  	return 0;
  }
  
  /*
   * sget() "test" callback used by get_sb_bdev(): non-zero when @s is
   * already bound to the block device passed in @data.
   */
  static int test_bdev_super(struct super_block *s, void *data)
  {
  	return (void *)s->s_bdev == data;
  }
454e2398b   David Howells   [PATCH] VFS: Perm...
720
  int get_sb_bdev(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
721
  	int flags, const char *dev_name, void *data,
454e2398b   David Howells   [PATCH] VFS: Perm...
722
723
  	int (*fill_super)(struct super_block *, void *, int),
  	struct vfsmount *mnt)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
724
725
726
727
728
729
730
  {
  	struct block_device *bdev;
  	struct super_block *s;
  	int error = 0;
  
  	bdev = open_bdev_excl(dev_name, flags, fs_type);
  	if (IS_ERR(bdev))
454e2398b   David Howells   [PATCH] VFS: Perm...
731
  		return PTR_ERR(bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
732
733
734
735
736
737
  
  	/*
  	 * once the super is inserted into the list by sget, s_umount
  	 * will protect the lockfs code from trying to start a snapshot
  	 * while we are mounting
  	 */
f73ca1b76   David Chinner   [PATCH] Revert bd...
738
  	down(&bdev->bd_mount_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
739
  	s = sget(fs_type, test_bdev_super, set_bdev_super, bdev);
f73ca1b76   David Chinner   [PATCH] Revert bd...
740
  	up(&bdev->bd_mount_sem);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
741
  	if (IS_ERR(s))
454e2398b   David Howells   [PATCH] VFS: Perm...
742
  		goto error_s;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
743
744
745
746
747
  
  	if (s->s_root) {
  		if ((flags ^ s->s_flags) & MS_RDONLY) {
  			up_write(&s->s_umount);
  			deactivate_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
748
749
  			error = -EBUSY;
  			goto error_bdev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
750
  		}
454e2398b   David Howells   [PATCH] VFS: Perm...
751
752
  
  		close_bdev_excl(bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
753
754
755
756
757
  	} else {
  		char b[BDEVNAME_SIZE];
  
  		s->s_flags = flags;
  		strlcpy(s->s_id, bdevname(bdev, b), sizeof(s->s_id));
e78c9a004   Pekka Enberg   [PATCH] fs: remov...
758
  		sb_set_blocksize(s, block_size(bdev));
9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
759
  		error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
760
761
762
  		if (error) {
  			up_write(&s->s_umount);
  			deactivate_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
763
  			goto error;
fa675765a   Greg Kroah-Hartman   Revert mount/umou...
764
  		}
454e2398b   David Howells   [PATCH] VFS: Perm...
765
766
  
  		s->s_flags |= MS_ACTIVE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
767
  	}
454e2398b   David Howells   [PATCH] VFS: Perm...
768
  	return simple_set_mnt(mnt, s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
769

454e2398b   David Howells   [PATCH] VFS: Perm...
770
771
772
  error_s:
  	error = PTR_ERR(s);
  error_bdev:
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
773
  	close_bdev_excl(bdev);
454e2398b   David Howells   [PATCH] VFS: Perm...
774
775
  error:
  	return error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
776
777
778
779
780
781
782
  }
  
  EXPORT_SYMBOL(get_sb_bdev);
  
  /*
   * ->kill_sb() helper for block-device filesystems: shut the superblock
   * down, then sync the underlying device and close it.
   */
  void kill_block_super(struct super_block *sb)
  {
  	struct block_device *bdev;

  	/* Remember the device before the superblock is shut down. */
  	bdev = sb->s_bdev;

  	generic_shutdown_super(sb);
  	sync_blockdev(bdev);
  	close_bdev_excl(bdev);
  }
  
  EXPORT_SYMBOL(kill_block_super);
9361401eb   David Howells   [PATCH] BLOCK: Ma...
789
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
790

454e2398b   David Howells   [PATCH] VFS: Perm...
791
  int get_sb_nodev(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
792
  	int flags, void *data,
454e2398b   David Howells   [PATCH] VFS: Perm...
793
794
  	int (*fill_super)(struct super_block *, void *, int),
  	struct vfsmount *mnt)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
795
796
797
798
799
  {
  	int error;
  	struct super_block *s = sget(fs_type, NULL, set_anon_super, NULL);
  
  	if (IS_ERR(s))
454e2398b   David Howells   [PATCH] VFS: Perm...
800
  		return PTR_ERR(s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
801
802
  
  	s->s_flags = flags;
9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
803
  	error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
804
805
806
  	if (error) {
  		up_write(&s->s_umount);
  		deactivate_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
807
  		return error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
808
809
  	}
  	s->s_flags |= MS_ACTIVE;
454e2398b   David Howells   [PATCH] VFS: Perm...
810
  	return simple_set_mnt(mnt, s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
811
812
813
814
815
816
817
818
  }
  
  EXPORT_SYMBOL(get_sb_nodev);
  
  /*
   * sget() "test" callback used by get_sb_single(): matches any existing
   * superblock of the type, so at most one instance is ever created.
   */
  static int compare_single(struct super_block *s, void *p)
  {
  	return 1;
  }
454e2398b   David Howells   [PATCH] VFS: Perm...
819
  int get_sb_single(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
820
  	int flags, void *data,
454e2398b   David Howells   [PATCH] VFS: Perm...
821
822
  	int (*fill_super)(struct super_block *, void *, int),
  	struct vfsmount *mnt)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
823
824
825
826
827
828
  {
  	struct super_block *s;
  	int error;
  
  	s = sget(fs_type, compare_single, set_anon_super, NULL);
  	if (IS_ERR(s))
454e2398b   David Howells   [PATCH] VFS: Perm...
829
  		return PTR_ERR(s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
830
831
  	if (!s->s_root) {
  		s->s_flags = flags;
9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
832
  		error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
833
834
835
  		if (error) {
  			up_write(&s->s_umount);
  			deactivate_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
836
  			return error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
837
838
839
840
  		}
  		s->s_flags |= MS_ACTIVE;
  	}
  	do_remount_sb(s, flags, data, 0);
454e2398b   David Howells   [PATCH] VFS: Perm...
841
  	return simple_set_mnt(mnt, s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
842
843
844
845
846
  }
  
  EXPORT_SYMBOL(get_sb_single);
  
  struct vfsmount *
bb4a58bf4   Trond Myklebust   VFS: Add GPL_EXPO...
847
  vfs_kern_mount(struct file_system_type *type, int flags, const char *name, void *data)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
848
  {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
849
  	struct vfsmount *mnt;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
850
  	char *secdata = NULL;
454e2398b   David Howells   [PATCH] VFS: Perm...
851
  	int error;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
852
853
854
  
  	if (!type)
  		return ERR_PTR(-ENODEV);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
855

454e2398b   David Howells   [PATCH] VFS: Perm...
856
  	error = -ENOMEM;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
857
858
859
860
861
862
  	mnt = alloc_vfsmnt(name);
  	if (!mnt)
  		goto out;
  
  	if (data) {
  		secdata = alloc_secdata();
454e2398b   David Howells   [PATCH] VFS: Perm...
863
  		if (!secdata)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
864
  			goto out_mnt;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
865
866
  
  		error = security_sb_copy_data(type, data, secdata);
454e2398b   David Howells   [PATCH] VFS: Perm...
867
  		if (error)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
868
  			goto out_free_secdata;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
869
  	}
454e2398b   David Howells   [PATCH] VFS: Perm...
870
871
  	error = type->get_sb(type, flags, name, data, mnt);
  	if (error < 0)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
872
  		goto out_free_secdata;
b4c07bce7   Lee Schermerhorn   hugetlbfs: handle...
873
  	BUG_ON(!mnt->mnt_sb);
454e2398b   David Howells   [PATCH] VFS: Perm...
874
875
  
   	error = security_sb_kern_mount(mnt->mnt_sb, secdata);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
876
877
   	if (error)
   		goto out_sb;
454e2398b   David Howells   [PATCH] VFS: Perm...
878
879
  
  	mnt->mnt_mountpoint = mnt->mnt_root;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
880
  	mnt->mnt_parent = mnt;
454e2398b   David Howells   [PATCH] VFS: Perm...
881
  	up_write(&mnt->mnt_sb->s_umount);
8680e22f2   Gerald Schaefer   [PATCH] VFS: memo...
882
  	free_secdata(secdata);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
883
884
  	return mnt;
  out_sb:
454e2398b   David Howells   [PATCH] VFS: Perm...
885
886
887
  	dput(mnt->mnt_root);
  	up_write(&mnt->mnt_sb->s_umount);
  	deactivate_super(mnt->mnt_sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
888
889
890
891
892
  out_free_secdata:
  	free_secdata(secdata);
  out_mnt:
  	free_vfsmnt(mnt);
  out:
454e2398b   David Howells   [PATCH] VFS: Perm...
893
  	return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
894
  }
bb4a58bf4   Trond Myklebust   VFS: Add GPL_EXPO...
895
  EXPORT_SYMBOL_GPL(vfs_kern_mount);
79c0b2df7   Miklos Szeredi   add filesystem su...
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
  static struct vfsmount *fs_set_subtype(struct vfsmount *mnt, const char *fstype)
  {
  	int err;
  	const char *subtype = strchr(fstype, '.');
  	if (subtype) {
  		subtype++;
  		err = -EINVAL;
  		if (!subtype[0])
  			goto err;
  	} else
  		subtype = "";
  
  	mnt->mnt_sb->s_subtype = kstrdup(subtype, GFP_KERNEL);
  	err = -ENOMEM;
  	if (!mnt->mnt_sb->s_subtype)
  		goto err;
  	return mnt;
  
   err:
  	mntput(mnt);
  	return ERR_PTR(err);
  }
bb4a58bf4   Trond Myklebust   VFS: Add GPL_EXPO...
918
919
920
921
922
923
924
925
  struct vfsmount *
  do_kern_mount(const char *fstype, int flags, const char *name, void *data)
  {
  	struct file_system_type *type = get_fs_type(fstype);
  	struct vfsmount *mnt;
  	if (!type)
  		return ERR_PTR(-ENODEV);
  	mnt = vfs_kern_mount(type, flags, name, data);
79c0b2df7   Miklos Szeredi   add filesystem su...
926
927
928
  	if (!IS_ERR(mnt) && (type->fs_flags & FS_HAS_SUBTYPE) &&
  	    !mnt->mnt_sb->s_subtype)
  		mnt = fs_set_subtype(mnt, fstype);
bb4a58bf4   Trond Myklebust   VFS: Add GPL_EXPO...
929
930
931
  	put_filesystem(type);
  	return mnt;
  }
8bf9725c2   Pavel Emelyanov   pid namespaces: i...
932
  struct vfsmount *kern_mount_data(struct file_system_type *type, void *data)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
933
  {
8bf9725c2   Pavel Emelyanov   pid namespaces: i...
934
  	return vfs_kern_mount(type, MS_KERNMOUNT, type->name, data);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
935
  }
8bf9725c2   Pavel Emelyanov   pid namespaces: i...
936
  EXPORT_SYMBOL_GPL(kern_mount_data);