Blame view

fs/super.c 36.7 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
  /*
   *  linux/fs/super.c
   *
   *  Copyright (C) 1991, 1992  Linus Torvalds
   *
   *  super.c contains code to handle: - mount structures
   *                                   - super-block tables
   *                                   - filesystem drivers list
   *                                   - mount system call
   *                                   - umount system call
   *                                   - ustat system call
   *
   * GK 2/5/95  -  Changed to support mounting the root fs via NFS
   *
   *  Added kerneld support: Jacques Gelinas and Bjorn Ekwall
   *  Added change_root: Werner Almesberger & Hans Lermen, Feb '96
   *  Added options to /proc/mounts:
96de0e252   Jan Engelhardt   Convert files to ...
18
   *    Torbjörn Lindh (torbjorn.lindh@gopta.se), April 14, 1996.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
   *  Added devfs support: Richard Gooch <rgooch@atnf.csiro.au>, 13-JAN-1998
   *  Heavily rewritten for 'one fs - one tree' dcache architecture. AV, Mar 2000
   */
630d9c472   Paul Gortmaker   fs: reduce the us...
22
  #include <linux/export.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
23
  #include <linux/slab.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
24
  #include <linux/blkdev.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
25
26
  #include <linux/mount.h>
  #include <linux/security.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
27
28
  #include <linux/writeback.h>		/* for the emergency remount stuff */
  #include <linux/idr.h>
353ab6e97   Ingo Molnar   [PATCH] sem2mutex...
29
  #include <linux/mutex.h>
5477d0fac   Jens Axboe   fs: fs/super.c ne...
30
  #include <linux/backing-dev.h>
ceb5bdc2d   Nick Piggin   fs: dcache per-bu...
31
  #include <linux/rculist_bl.h>
c515e1fd3   Dan Magenheimer   mm/fs: add hooks ...
32
  #include <linux/cleancache.h>
404015308   Al Viro   security: trim se...
33
  #include <linux/fsnotify.h>
5accdf82b   Jan Kara   fs: Improve files...
34
  #include <linux/lockdep.h>
6e4eab577   Eric W. Biederman   fs: Add user name...
35
  #include <linux/user_namespace.h>
6d59e7f58   Al Viro   [PATCH] move a bu...
36
  #include "internal.h"
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
37

15d0f5ea3   Al Viro   Make super_blocks...
38
39
  static LIST_HEAD(super_blocks);
  static DEFINE_SPINLOCK(sb_lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
40

5accdf82b   Jan Kara   fs: Improve files...
41
42
43
44
45
  /*
   * Names handed to __percpu_init_rwsem() when alloc_super() sets up the
   * s_writers.rw_sem[] array of a new superblock; entry i names the
   * semaphore for freeze level index i (0 .. SB_FREEZE_LEVELS - 1).
   */
  static char *sb_writers_name[SB_FREEZE_LEVELS] = {
  	"sb_writers",
  	"sb_pagefaults",
  	"sb_internal",
  };
b0d40c92a   Dave Chinner   superblock: intro...
46
47
48
49
50
51
52
  /*
   * One thing we have to be careful of with a per-sb shrinker is that we don't
   * drop the last active reference to the superblock from within the shrinker.
   * If that happens we could trigger unregistering the shrinker from within the
   * shrinker path and that leads to deadlock on the shrinker_rwsem. Hence we
   * take a passive reference to the superblock to avoid this from occurring.
   */
0a234c6dc   Dave Chinner   shrinker: convert...
53
54
  static unsigned long super_cache_scan(struct shrinker *shrink,
  				      struct shrink_control *sc)
b0d40c92a   Dave Chinner   superblock: intro...
55
56
  {
  	struct super_block *sb;
0a234c6dc   Dave Chinner   shrinker: convert...
57
58
59
60
61
  	long	fs_objects = 0;
  	long	total_objects;
  	long	freed = 0;
  	long	dentries;
  	long	inodes;
b0d40c92a   Dave Chinner   superblock: intro...
62
63
64
65
66
67
68
  
  	sb = container_of(shrink, struct super_block, s_shrink);
  
  	/*
  	 * Deadlock avoidance.  We may hold various FS locks, and we don't want
  	 * to recurse into the FS that called us in clear_inode() and friends..
  	 */
0a234c6dc   Dave Chinner   shrinker: convert...
69
70
  	if (!(sc->gfp_mask & __GFP_FS))
  		return SHRINK_STOP;
b0d40c92a   Dave Chinner   superblock: intro...
71

eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
72
  	if (!trylock_super(sb))
0a234c6dc   Dave Chinner   shrinker: convert...
73
  		return SHRINK_STOP;
b0d40c92a   Dave Chinner   superblock: intro...
74

d04079039   Al Viro   prune_super(): sb...
75
  	if (sb->s_op->nr_cached_objects)
4101b6243   Vladimir Davydov   fs: consolidate {...
76
  		fs_objects = sb->s_op->nr_cached_objects(sb, sc);
0e1fdafd9   Dave Chinner   superblock: add f...
77

503c358cf   Vladimir Davydov   list_lru: introdu...
78
79
  	inodes = list_lru_shrink_count(&sb->s_inode_lru, sc);
  	dentries = list_lru_shrink_count(&sb->s_dentry_lru, sc);
f60415675   Dave Chinner   dcache: convert t...
80
  	total_objects = dentries + inodes + fs_objects + 1;
475d0db74   Tetsuo Handa   fs: Fix theoretic...
81
82
  	if (!total_objects)
  		total_objects = 1;
0e1fdafd9   Dave Chinner   superblock: add f...
83

0a234c6dc   Dave Chinner   shrinker: convert...
84
  	/* proportion the scan between the caches */
f60415675   Dave Chinner   dcache: convert t...
85
  	dentries = mult_frac(sc->nr_to_scan, dentries, total_objects);
bc3b14cb2   Dave Chinner   inode: convert in...
86
  	inodes = mult_frac(sc->nr_to_scan, inodes, total_objects);
503c358cf   Vladimir Davydov   list_lru: introdu...
87
  	fs_objects = mult_frac(sc->nr_to_scan, fs_objects, total_objects);
b0d40c92a   Dave Chinner   superblock: intro...
88

0a234c6dc   Dave Chinner   shrinker: convert...
89
90
91
  	/*
  	 * prune the dcache first as the icache is pinned by it, then
  	 * prune the icache, followed by the filesystem specific caches
49e7e7ff8   Vladimir Davydov   fs: shrinker: alw...
92
93
94
  	 *
  	 * Ensure that we always scan at least one object - memcg kmem
  	 * accounting uses this to fully empty the caches.
0a234c6dc   Dave Chinner   shrinker: convert...
95
  	 */
49e7e7ff8   Vladimir Davydov   fs: shrinker: alw...
96
  	sc->nr_to_scan = dentries + 1;
503c358cf   Vladimir Davydov   list_lru: introdu...
97
  	freed = prune_dcache_sb(sb, sc);
49e7e7ff8   Vladimir Davydov   fs: shrinker: alw...
98
  	sc->nr_to_scan = inodes + 1;
503c358cf   Vladimir Davydov   list_lru: introdu...
99
  	freed += prune_icache_sb(sb, sc);
0a234c6dc   Dave Chinner   shrinker: convert...
100
101
  
  	if (fs_objects) {
49e7e7ff8   Vladimir Davydov   fs: shrinker: alw...
102
  		sc->nr_to_scan = fs_objects + 1;
4101b6243   Vladimir Davydov   fs: consolidate {...
103
  		freed += sb->s_op->free_cached_objects(sb, sc);
b0d40c92a   Dave Chinner   superblock: intro...
104
  	}
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
105
  	up_read(&sb->s_umount);
0a234c6dc   Dave Chinner   shrinker: convert...
106
107
108
109
110
111
112
113
114
115
  	return freed;
  }
  
  static unsigned long super_cache_count(struct shrinker *shrink,
  				       struct shrink_control *sc)
  {
  	struct super_block *sb;
  	long	total_objects = 0;
  
  	sb = container_of(shrink, struct super_block, s_shrink);
d23da150a   Tim Chen   fs/superblock: av...
116
  	/*
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
117
  	 * Don't call trylock_super as it is a potential
d23da150a   Tim Chen   fs/superblock: av...
118
119
120
  	 * scalability bottleneck. The counts could get updated
  	 * between super_cache_count and super_cache_scan anyway.
  	 * Call to super_cache_count with shrinker_rwsem held
503c358cf   Vladimir Davydov   list_lru: introdu...
121
  	 * ensures the safety of call to list_lru_shrink_count() and
d23da150a   Tim Chen   fs/superblock: av...
122
123
  	 * s_op->nr_cached_objects().
  	 */
0a234c6dc   Dave Chinner   shrinker: convert...
124
  	if (sb->s_op && sb->s_op->nr_cached_objects)
4101b6243   Vladimir Davydov   fs: consolidate {...
125
  		total_objects = sb->s_op->nr_cached_objects(sb, sc);
0a234c6dc   Dave Chinner   shrinker: convert...
126

503c358cf   Vladimir Davydov   list_lru: introdu...
127
128
  	total_objects += list_lru_shrink_count(&sb->s_dentry_lru, sc);
  	total_objects += list_lru_shrink_count(&sb->s_inode_lru, sc);
0a234c6dc   Dave Chinner   shrinker: convert...
129

55f841ce9   Glauber Costa   super: fix calcul...
130
  	total_objects = vfs_pressure_ratio(total_objects);
0e1fdafd9   Dave Chinner   superblock: add f...
131
  	return total_objects;
b0d40c92a   Dave Chinner   superblock: intro...
132
  }
853b39a7c   Oleg Nesterov   shift percpu_coun...
133
134
135
136
137
138
139
  static void destroy_super_work(struct work_struct *work)
  {
  	struct super_block *s = container_of(work, struct super_block,
  							destroy_work);
  	int i;
  
  	for (i = 0; i < SB_FREEZE_LEVELS; i++)
8129ed296   Oleg Nesterov   change sb_writers...
140
  		percpu_free_rwsem(&s->s_writers.rw_sem[i]);
853b39a7c   Oleg Nesterov   shift percpu_coun...
141
142
143
144
145
146
147
148
149
  	kfree(s);
  }
  
  /*
   * RCU callback installed by destroy_super(): hands the final teardown of
   * the superblock over to destroy_super_work() via the system workqueue.
   */
  static void destroy_super_rcu(struct rcu_head *head)
  {
  	struct super_block *sb;

  	sb = container_of(head, struct super_block, rcu);
  	INIT_WORK(&sb->destroy_work, destroy_super_work);
  	schedule_work(&sb->destroy_work);
  }
7eb5e8826   Al Viro   uninline destroy_...
150
151
152
153
154
155
156
  /**
   *	destroy_super	-	frees a superblock
   *	@s: superblock to free
   *
   *	Frees a superblock.
   */
  static void destroy_super(struct super_block *s)
5accdf82b   Jan Kara   fs: Improve files...
157
  {
7eb5e8826   Al Viro   uninline destroy_...
158
159
  	list_lru_destroy(&s->s_dentry_lru);
  	list_lru_destroy(&s->s_inode_lru);
7eb5e8826   Al Viro   uninline destroy_...
160
161
  	security_sb_free(s);
  	WARN_ON(!list_empty(&s->s_mounts));
6e4eab577   Eric W. Biederman   fs: Add user name...
162
  	put_user_ns(s->s_user_ns);
7eb5e8826   Al Viro   uninline destroy_...
163
164
  	kfree(s->s_subtype);
  	kfree(s->s_options);
853b39a7c   Oleg Nesterov   shift percpu_coun...
165
  	call_rcu(&s->rcu, destroy_super_rcu);
5accdf82b   Jan Kara   fs: Improve files...
166
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
167
168
  /**
   *	alloc_super	-	create new superblock
fe2bbc483   Henrik Kretzschmar   [PATCH] add missi...
169
   *	@type:	filesystem type superblock should belong to
9249e17fe   David Howells   VFS: Pass mount f...
170
   *	@flags: the mount flags
6e4eab577   Eric W. Biederman   fs: Add user name...
171
   *	@user_ns: User namespace for the super_block
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
172
173
174
175
   *
   *	Allocates and initializes a new &struct super_block.  alloc_super()
   *	returns a pointer new superblock or %NULL if allocation had failed.
   */
6e4eab577   Eric W. Biederman   fs: Add user name...
176
177
  static struct super_block *alloc_super(struct file_system_type *type, int flags,
  				       struct user_namespace *user_ns)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
178
  {
11b0b5abb   Oliver Neukum   [PATCH] use kzall...
179
  	struct super_block *s = kzalloc(sizeof(struct super_block),  GFP_USER);
b87221de6   Alexey Dobriyan   const: mark remai...
180
  	static const struct super_operations default_op;
7eb5e8826   Al Viro   uninline destroy_...
181
182
183
184
  	int i;
  
  	if (!s)
  		return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
185

b5bd856a0   Vladimir Davydov   fs/super.c: fix W...
186
  	INIT_LIST_HEAD(&s->s_mounts);
6e4eab577   Eric W. Biederman   fs: Add user name...
187
  	s->s_user_ns = get_user_ns(user_ns);
b5bd856a0   Vladimir Davydov   fs/super.c: fix W...
188

7eb5e8826   Al Viro   uninline destroy_...
189
190
  	if (security_sb_alloc(s))
  		goto fail;
7b7a8665e   Christoph Hellwig   direct-io: Implem...
191

7eb5e8826   Al Viro   uninline destroy_...
192
  	for (i = 0; i < SB_FREEZE_LEVELS; i++) {
8129ed296   Oleg Nesterov   change sb_writers...
193
194
195
  		if (__percpu_init_rwsem(&s->s_writers.rw_sem[i],
  					sb_writers_name[i],
  					&type->s_writers_key[i]))
7eb5e8826   Al Viro   uninline destroy_...
196
  			goto fail;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
197
  	}
7eb5e8826   Al Viro   uninline destroy_...
198
  	init_waitqueue_head(&s->s_writers.wait_unfrozen);
df0ce26cb   Christoph Hellwig   fs: remove defaul...
199
  	s->s_bdi = &noop_backing_dev_info;
7eb5e8826   Al Viro   uninline destroy_...
200
  	s->s_flags = flags;
cc50a07a2   Eric W. Biederman   userns: Remove th...
201
  	if (s->s_user_ns != &init_user_ns)
67690f937   Eric W. Biederman   userns: Remove im...
202
  		s->s_iflags |= SB_I_NODEV;
7eb5e8826   Al Viro   uninline destroy_...
203
204
  	INIT_HLIST_NODE(&s->s_instances);
  	INIT_HLIST_BL_HEAD(&s->s_anon);
e97fedb9e   Dave Chinner   sync: serialise p...
205
  	mutex_init(&s->s_sync_lock);
7eb5e8826   Al Viro   uninline destroy_...
206
  	INIT_LIST_HEAD(&s->s_inodes);
74278da9f   Dave Chinner   inode: convert in...
207
  	spin_lock_init(&s->s_inode_list_lock);
6c60d2b57   Dave Chinner   fs/fs-writeback.c...
208
209
  	INIT_LIST_HEAD(&s->s_inodes_wb);
  	spin_lock_init(&s->s_inode_wblist_lock);
7eb5e8826   Al Viro   uninline destroy_...
210

2acb60a04   Vladimir Davydov   fs: make shrinker...
211
  	if (list_lru_init_memcg(&s->s_dentry_lru))
7eb5e8826   Al Viro   uninline destroy_...
212
  		goto fail;
2acb60a04   Vladimir Davydov   fs: make shrinker...
213
  	if (list_lru_init_memcg(&s->s_inode_lru))
7eb5e8826   Al Viro   uninline destroy_...
214
  		goto fail;
7eb5e8826   Al Viro   uninline destroy_...
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
  	init_rwsem(&s->s_umount);
  	lockdep_set_class(&s->s_umount, &type->s_umount_key);
  	/*
  	 * sget() can have s_umount recursion.
  	 *
  	 * When it cannot find a suitable sb, it allocates a new
  	 * one (this one), and tries again to find a suitable old
  	 * one.
  	 *
  	 * In case that succeeds, it will acquire the s_umount
  	 * lock of the old one. Since these are clearly distrinct
  	 * locks, and this object isn't exposed yet, there's no
  	 * risk of deadlocks.
  	 *
  	 * Annotate this by putting this lock in a different
  	 * subclass.
  	 */
  	down_write_nested(&s->s_umount, SINGLE_DEPTH_NESTING);
  	s->s_count = 1;
  	atomic_set(&s->s_active, 1);
  	mutex_init(&s->s_vfs_rename_mutex);
  	lockdep_set_class(&s->s_vfs_rename_mutex, &type->s_vfs_rename_key);
  	mutex_init(&s->s_dquot.dqio_mutex);
  	mutex_init(&s->s_dquot.dqonoff_mutex);
7eb5e8826   Al Viro   uninline destroy_...
239
240
241
  	s->s_maxbytes = MAX_NON_LFS;
  	s->s_op = &default_op;
  	s->s_time_gran = 1000000000;
3cb29d111   Vladimir Davydov   cleancache: remov...
242
  	s->cleancache_poolid = CLEANCACHE_NO_POOL;
7eb5e8826   Al Viro   uninline destroy_...
243
244
245
246
247
  
  	s->s_shrink.seeks = DEFAULT_SEEKS;
  	s->s_shrink.scan_objects = super_cache_scan;
  	s->s_shrink.count_objects = super_cache_count;
  	s->s_shrink.batch = 1024;
2acb60a04   Vladimir Davydov   fs: make shrinker...
248
  	s->s_shrink.flags = SHRINKER_NUMA_AWARE | SHRINKER_MEMCG_AWARE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
249
  	return s;
5ca302c8e   Glauber Costa   list_lru: dynamic...
250

7eb5e8826   Al Viro   uninline destroy_...
251
252
253
  fail:
  	destroy_super(s);
  	return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
254
255
256
257
258
  }
  
  /* Superblock refcounting  */
  
  /*
35cf7ba0b   Al Viro   Bury __put_super_...
259
   * Drop a superblock's refcount.  The caller must hold sb_lock.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
260
   */
f47ec3f28   Al Viro   trim fs/internal.h
261
  static void __put_super(struct super_block *sb)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
262
  {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
263
  	if (!--sb->s_count) {
551de6f34   Al Viro   Leave superblocks...
264
  		list_del_init(&sb->s_list);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
265
  		destroy_super(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
266
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
267
268
269
270
271
272
273
274
275
  }
  
  /**
   *	put_super	-	drop a temporary reference to superblock
   *	@sb: superblock in question
   *
   *	Drops a temporary reference, frees superblock if there's no
   *	references left.
   */
f47ec3f28   Al Viro   trim fs/internal.h
276
  static void put_super(struct super_block *sb)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
277
278
279
280
281
282
283
284
  {
  	spin_lock(&sb_lock);
  	__put_super(sb);
  	spin_unlock(&sb_lock);
  }
  
  
  /**
1712ac8fd   Al Viro   Saner locking aro...
285
   *	deactivate_locked_super	-	drop an active reference to superblock
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
286
287
   *	@s: superblock to deactivate
   *
bd7ced988   Masanari Iida   Doc: treewide : F...
288
   *	Drops an active reference to superblock, converting it into a temporary
1712ac8fd   Al Viro   Saner locking aro...
289
   *	one if there is no other active references left.  In that case we
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
290
291
   *	tell fs driver to shut it down and drop the temporary reference we
   *	had just acquired.
1712ac8fd   Al Viro   Saner locking aro...
292
293
   *
   *	Caller holds exclusive lock on superblock; that lock is released.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
294
   */
1712ac8fd   Al Viro   Saner locking aro...
295
  void deactivate_locked_super(struct super_block *s)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
296
297
  {
  	struct file_system_type *fs = s->s_type;
b20bd1a5e   Al Viro   get rid of S_BIAS
298
  	if (atomic_dec_and_test(&s->s_active)) {
3167760f8   Dan Magenheimer   mm: cleancache: s...
299
  		cleancache_invalidate_fs(s);
b0d40c92a   Dave Chinner   superblock: intro...
300
  		unregister_shrinker(&s->s_shrink);
28f2cd4f6   Dave Chinner   fs/superblock: un...
301
  		fs->kill_sb(s);
f5e1dd345   Glauber Costa   super: fix for de...
302

c0a5b5609   Vladimir Davydov   list_lru: organiz...
303
304
305
306
307
308
309
  		/*
  		 * Since list_lru_destroy() may sleep, we cannot call it from
  		 * put_super(), where we hold the sb_lock. Therefore we destroy
  		 * the lru lists right now.
  		 */
  		list_lru_destroy(&s->s_dentry_lru);
  		list_lru_destroy(&s->s_inode_lru);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
310
311
  		put_filesystem(fs);
  		put_super(s);
1712ac8fd   Al Viro   Saner locking aro...
312
313
  	} else {
  		up_write(&s->s_umount);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
314
315
  	}
  }
1712ac8fd   Al Viro   Saner locking aro...
316
  EXPORT_SYMBOL(deactivate_locked_super);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
317
318
  
  /**
1712ac8fd   Al Viro   Saner locking aro...
319
   *	deactivate_super	-	drop an active reference to superblock
74dbbdd7f   Al Viro   New helper: deact...
320
321
   *	@s: superblock to deactivate
   *
1712ac8fd   Al Viro   Saner locking aro...
322
323
324
   *	Variant of deactivate_locked_super(), except that superblock is *not*
   *	locked by caller.  If we are going to drop the final active reference,
   *	lock will be acquired prior to that.
74dbbdd7f   Al Viro   New helper: deact...
325
   */
1712ac8fd   Al Viro   Saner locking aro...
326
  void deactivate_super(struct super_block *s)
74dbbdd7f   Al Viro   New helper: deact...
327
  {
1712ac8fd   Al Viro   Saner locking aro...
328
329
330
          if (!atomic_add_unless(&s->s_active, -1, 1)) {
  		down_write(&s->s_umount);
  		deactivate_locked_super(s);
74dbbdd7f   Al Viro   New helper: deact...
331
332
  	}
  }
1712ac8fd   Al Viro   Saner locking aro...
333
  EXPORT_SYMBOL(deactivate_super);
74dbbdd7f   Al Viro   New helper: deact...
334
335
  
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
336
337
338
339
340
341
342
343
   *	grab_super - acquire an active reference
   *	@s: reference we are trying to make active
   *
   *	Tries to acquire an active reference.  grab_super() is used when we
   * 	had just found a superblock in super_blocks or fs_type->fs_supers
   *	and want to turn it into a full-blown active reference.  grab_super()
   *	is called with sb_lock held and drops it.  Returns 1 in case of
   *	success, 0 if we had failed (superblock contents was already dead or
acfec9a5a   Al Viro   livelock avoidanc...
344
345
346
   *	dying when grab_super() had been called).  Note that this is only
   *	called for superblocks not in rundown mode (== ones still on ->fs_supers
   *	of their type), so increment of ->s_count is OK here.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
347
   */
9c4dbee79   Josh Triplett   [PATCH] fs: add l...
348
  static int grab_super(struct super_block *s) __releases(sb_lock)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
349
350
351
352
  {
  	s->s_count++;
  	spin_unlock(&sb_lock);
  	down_write(&s->s_umount);
acfec9a5a   Al Viro   livelock avoidanc...
353
354
355
356
  	if ((s->s_flags & MS_BORN) && atomic_inc_not_zero(&s->s_active)) {
  		put_super(s);
  		return 1;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
357
358
  	up_write(&s->s_umount);
  	put_super(s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
359
360
  	return 0;
  }
cf9a2ae8d   David Howells   [PATCH] BLOCK: Mo...
361
  /*
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
362
   *	trylock_super - try to grab ->s_umount shared
331cbdeed   Wanpeng Li   writeback: Fix so...
363
   *	@sb: reference we are trying to grab
12ad3ab66   Dave Chinner   superblock: move ...
364
   *
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
365
   *	Try to prevent fs shutdown.  This is used in places where we
12ad3ab66   Dave Chinner   superblock: move ...
366
   *	cannot take an active reference but we need to ensure that the
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
367
368
369
370
371
372
373
374
375
376
   *	filesystem is not shut down while we are working on it. It returns
   *	false if we cannot acquire s_umount or if we lose the race and
   *	filesystem already got into shutdown, and returns true with the s_umount
   *	lock held in read mode in case of success. On successful return,
   *	the caller must drop the s_umount lock when done.
   *
   *	Note that unlike get_super() et.al. this one does *not* bump ->s_count.
   *	The reason why it's safe is that we are OK with doing trylock instead
   *	of down_read().  There's a couple of places that are OK with that, but
   *	it's very much not a general-purpose interface.
12ad3ab66   Dave Chinner   superblock: move ...
377
   */
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
378
  bool trylock_super(struct super_block *sb)
12ad3ab66   Dave Chinner   superblock: move ...
379
  {
12ad3ab66   Dave Chinner   superblock: move ...
380
  	if (down_read_trylock(&sb->s_umount)) {
eb6ef3df4   Konstantin Khlebnikov   trylock_super(): ...
381
382
  		if (!hlist_unhashed(&sb->s_instances) &&
  		    sb->s_root && (sb->s_flags & MS_BORN))
12ad3ab66   Dave Chinner   superblock: move ...
383
384
385
  			return true;
  		up_read(&sb->s_umount);
  	}
12ad3ab66   Dave Chinner   superblock: move ...
386
387
  	return false;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
388
389
390
391
392
393
394
395
396
  /**
   *	generic_shutdown_super	-	common helper for ->kill_sb()
   *	@sb: superblock to kill
   *
   *	generic_shutdown_super() does all fs-independent work on superblock
   *	shutdown.  Typical ->kill_sb() should pick all fs-specific objects
   *	that need destruction out of superblock, call generic_shutdown_super()
   *	and release aforementioned objects.  Note: dentries and inodes _are_
   *	taken care of and do not need specific handling.
c636ebdb1   David Howells   [PATCH] VFS: Dest...
397
398
399
400
   *
   *	Upon calling this function, the filesystem may no longer alter or
   *	rearrange the set of dentries belonging to this super_block, nor may it
   *	change the attachments of dentries to inodes.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
401
402
403
   */
  void generic_shutdown_super(struct super_block *sb)
  {
ee9b6d61a   Josef 'Jeff' Sipek   [PATCH] Mark stru...
404
  	const struct super_operations *sop = sb->s_op;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
405

c636ebdb1   David Howells   [PATCH] VFS: Dest...
406
407
  	if (sb->s_root) {
  		shrink_dcache_for_umount(sb);
60b0680fa   Jan Kara   vfs: Rename fsync...
408
  		sync_filesystem(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
409
  		sb->s_flags &= ~MS_ACTIVE;
efaee1920   Arjan van de Ven   async: make the f...
410

74278da9f   Dave Chinner   inode: convert in...
411
  		fsnotify_unmount_inodes(sb);
a1a0e23e4   Tejun Heo   writeback: flush ...
412
  		cgroup_writeback_umount();
63997e98a   Al Viro   split invalidate_...
413
414
  
  		evict_inodes(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
415

7b7a8665e   Christoph Hellwig   direct-io: Implem...
416
417
418
419
  		if (sb->s_dio_done_wq) {
  			destroy_workqueue(sb->s_dio_done_wq);
  			sb->s_dio_done_wq = NULL;
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
420
421
  		if (sop->put_super)
  			sop->put_super(sb);
63997e98a   Al Viro   split invalidate_...
422
  		if (!list_empty(&sb->s_inodes)) {
7b4fe29e0   Dave Jones   [PATCH] More info...
423
424
425
426
  			printk("VFS: Busy inodes after unmount of %s. "
  			   "Self-destruct in 5 seconds.  Have a nice day...
  ",
  			   sb->s_id);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
427
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
428
429
430
  	}
  	spin_lock(&sb_lock);
  	/* should be initialized for __put_super_and_need_restart() */
a5166169f   Al Viro   vfs: convert fs_s...
431
  	hlist_del_init(&sb->s_instances);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
432
433
434
435
436
437
438
  	spin_unlock(&sb_lock);
  	up_write(&sb->s_umount);
  }
  
  EXPORT_SYMBOL(generic_shutdown_super);
  
  /**
6e4eab577   Eric W. Biederman   fs: Add user name...
439
   *	sget_userns -	find or create a superblock
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
440
441
442
   *	@type:	filesystem type superblock should belong to
   *	@test:	comparison callback
   *	@set:	setup callback
9249e17fe   David Howells   VFS: Pass mount f...
443
   *	@flags:	mount flags
6e4eab577   Eric W. Biederman   fs: Add user name...
444
   *	@user_ns: User namespace for the super_block
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
445
446
   *	@data:	argument to each of them
   */
6e4eab577   Eric W. Biederman   fs: Add user name...
447
  struct super_block *sget_userns(struct file_system_type *type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
448
449
  			int (*test)(struct super_block *,void *),
  			int (*set)(struct super_block *,void *),
6e4eab577   Eric W. Biederman   fs: Add user name...
450
  			int flags, struct user_namespace *user_ns,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
451
452
453
  			void *data)
  {
  	struct super_block *s = NULL;
d47301271   Matthias Kaehlcke   fs/super.c: use l...
454
  	struct super_block *old;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
455
  	int err;
a001e74ce   Eric W. Biederman   mnt: Move the FS_...
456
457
458
459
  	if (!(flags & MS_KERNMOUNT) &&
  	    !(type->fs_flags & FS_USERNS_MOUNT) &&
  	    !capable(CAP_SYS_ADMIN))
  		return ERR_PTR(-EPERM);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
460
461
  retry:
  	spin_lock(&sb_lock);
d47301271   Matthias Kaehlcke   fs/super.c: use l...
462
  	if (test) {
b67bfe0d4   Sasha Levin   hlist: drop the n...
463
  		hlist_for_each_entry(old, &type->fs_supers, s_instances) {
d47301271   Matthias Kaehlcke   fs/super.c: use l...
464
465
  			if (!test(old, data))
  				continue;
6e4eab577   Eric W. Biederman   fs: Add user name...
466
467
468
469
470
471
472
473
  			if (user_ns != old->s_user_ns) {
  				spin_unlock(&sb_lock);
  				if (s) {
  					up_write(&s->s_umount);
  					destroy_super(s);
  				}
  				return ERR_PTR(-EBUSY);
  			}
d47301271   Matthias Kaehlcke   fs/super.c: use l...
474
475
  			if (!grab_super(old))
  				goto retry;
a3cfbb53b   Li Zefan   vfs: add missing ...
476
477
  			if (s) {
  				up_write(&s->s_umount);
d47301271   Matthias Kaehlcke   fs/super.c: use l...
478
  				destroy_super(s);
7a4dec538   Al Viro   Fix sget() race w...
479
  				s = NULL;
a3cfbb53b   Li Zefan   vfs: add missing ...
480
  			}
d47301271   Matthias Kaehlcke   fs/super.c: use l...
481
482
  			return old;
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
483
484
485
  	}
  	if (!s) {
  		spin_unlock(&sb_lock);
6e4eab577   Eric W. Biederman   fs: Add user name...
486
  		s = alloc_super(type, flags, user_ns);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
487
488
489
490
491
492
493
494
  		if (!s)
  			return ERR_PTR(-ENOMEM);
  		goto retry;
  	}
  		
  	err = set(s, data);
  	if (err) {
  		spin_unlock(&sb_lock);
a3cfbb53b   Li Zefan   vfs: add missing ...
495
  		up_write(&s->s_umount);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
496
497
498
499
500
501
  		destroy_super(s);
  		return ERR_PTR(err);
  	}
  	s->s_type = type;
  	strlcpy(s->s_id, type->name, sizeof(s->s_id));
  	list_add_tail(&s->s_list, &super_blocks);
a5166169f   Al Viro   vfs: convert fs_s...
502
  	hlist_add_head(&s->s_instances, &type->fs_supers);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
503
504
  	spin_unlock(&sb_lock);
  	get_filesystem(type);
b0d40c92a   Dave Chinner   superblock: intro...
505
  	register_shrinker(&s->s_shrink);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
506
507
  	return s;
  }
6e4eab577   Eric W. Biederman   fs: Add user name...
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
  EXPORT_SYMBOL(sget_userns);
  
  /**
   *	sget	-	find or create a superblock
   *	@type:	  filesystem type superblock should belong to
   *	@test:	  comparison callback
   *	@set:	  setup callback
   *	@flags:	  mount flags
   *	@data:	  argument to each of them
   *
   *	Wrapper around sget_userns() that uses the caller's current user
   *	namespace.  Returns ERR_PTR(-EPERM) when this is not a kernel mount
   *	and the caller lacks CAP_SYS_ADMIN in that namespace.
   */
  struct super_block *sget(struct file_system_type *type,
  			int (*test)(struct super_block *,void *),
  			int (*set)(struct super_block *,void *),
  			int flags,
  			void *data)
  {
  	struct user_namespace *user_ns = current_user_ns();

  	/* Ensure the requestor has permissions over the target filesystem */
  	if ((flags & MS_KERNMOUNT) || ns_capable(user_ns, CAP_SYS_ADMIN))
  		return sget_userns(type, test, set, flags, user_ns, data);

  	return ERR_PTR(-EPERM);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
532
533
534
535
536
537
538
539
540
  EXPORT_SYMBOL(sget);
  
  /*
   * drop_super - release a superblock held with s_umount taken for reading
   * @sb: superblock to release
   *
   * Releases the read side of sb->s_umount and then drops one temporary
   * reference through put_super().
   */
  void drop_super(struct super_block *sb)
  {
  	up_read(&sb->s_umount);
  	put_super(sb);
  }
  
  EXPORT_SYMBOL(drop_super);
e50047533   Christoph Hellwig   cleanup sync_supers
541
  /**
01a05b337   Al Viro   new helper: itera...
542
543
544
545
546
547
548
549
550
   *	iterate_supers - call function for all active superblocks
   *	@f: function to call
   *	@arg: argument to pass to it
   *
   *	Scans the superblock list and calls given function, passing it
   *	locked superblock and given argument.
   */
  void iterate_supers(void (*f)(struct super_block *, void *), void *arg)
  {
dca332528   Al Viro   no need for list_...
551
  	struct super_block *sb, *p = NULL;
01a05b337   Al Viro   new helper: itera...
552
553
  
  	spin_lock(&sb_lock);
dca332528   Al Viro   no need for list_...
554
  	list_for_each_entry(sb, &super_blocks, s_list) {
a5166169f   Al Viro   vfs: convert fs_s...
555
  		if (hlist_unhashed(&sb->s_instances))
01a05b337   Al Viro   new helper: itera...
556
557
558
559
560
  			continue;
  		sb->s_count++;
  		spin_unlock(&sb_lock);
  
  		down_read(&sb->s_umount);
dabe0dc19   Al Viro   vfs: fix the rest...
561
  		if (sb->s_root && (sb->s_flags & MS_BORN))
01a05b337   Al Viro   new helper: itera...
562
563
564
565
  			f(sb, arg);
  		up_read(&sb->s_umount);
  
  		spin_lock(&sb_lock);
dca332528   Al Viro   no need for list_...
566
567
568
  		if (p)
  			__put_super(p);
  		p = sb;
01a05b337   Al Viro   new helper: itera...
569
  	}
dca332528   Al Viro   no need for list_...
570
571
  	if (p)
  		__put_super(p);
01a05b337   Al Viro   new helper: itera...
572
573
574
575
  	spin_unlock(&sb_lock);
  }
  
  /**
43e15cdbe   Al Viro   new helper: itera...
576
577
578
579
580
581
582
583
584
585
586
587
588
589
   *	iterate_supers_type - call function for superblocks of given type
   *	@type: fs type
   *	@f: function to call
   *	@arg: argument to pass to it
   *
   *	Scans the superblock list and calls given function, passing it
   *	locked superblock and given argument.
   */
  void iterate_supers_type(struct file_system_type *type,
  	void (*f)(struct super_block *, void *), void *arg)
  {
  	struct super_block *sb, *p = NULL;
  
  	spin_lock(&sb_lock);
b67bfe0d4   Sasha Levin   hlist: drop the n...
590
  	hlist_for_each_entry(sb, &type->fs_supers, s_instances) {
43e15cdbe   Al Viro   new helper: itera...
591
592
593
594
  		sb->s_count++;
  		spin_unlock(&sb_lock);
  
  		down_read(&sb->s_umount);
dabe0dc19   Al Viro   vfs: fix the rest...
595
  		if (sb->s_root && (sb->s_flags & MS_BORN))
43e15cdbe   Al Viro   new helper: itera...
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
  			f(sb, arg);
  		up_read(&sb->s_umount);
  
  		spin_lock(&sb_lock);
  		if (p)
  			__put_super(p);
  		p = sb;
  	}
  	if (p)
  		__put_super(p);
  	spin_unlock(&sb_lock);
  }
  
  EXPORT_SYMBOL(iterate_supers_type);
  
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
612
613
614
615
616
617
   *	get_super - get the superblock of a device
   *	@bdev: device to get the superblock for
   *	
   *	Scans the superblock list and finds the superblock of the file system
   *	mounted on the device given. %NULL is returned if no match is found.
   */
df40c01a9   Al Viro   In get_super() an...
618
  struct super_block *get_super(struct block_device *bdev)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
619
  {
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
620
  	struct super_block *sb;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
621
622
  	if (!bdev)
  		return NULL;
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
623

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
624
  	spin_lock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
625
626
  rescan:
  	list_for_each_entry(sb, &super_blocks, s_list) {
a5166169f   Al Viro   vfs: convert fs_s...
627
  		if (hlist_unhashed(&sb->s_instances))
551de6f34   Al Viro   Leave superblocks...
628
  			continue;
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
629
630
  		if (sb->s_bdev == bdev) {
  			sb->s_count++;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
631
  			spin_unlock(&sb_lock);
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
632
  			down_read(&sb->s_umount);
df40c01a9   Al Viro   In get_super() an...
633
  			/* still alive? */
dabe0dc19   Al Viro   vfs: fix the rest...
634
  			if (sb->s_root && (sb->s_flags & MS_BORN))
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
635
636
  				return sb;
  			up_read(&sb->s_umount);
df40c01a9   Al Viro   In get_super() an...
637
  			/* nope, got unmounted */
618f06362   Kirill Korotaev   [PATCH] O(1) sb l...
638
  			spin_lock(&sb_lock);
df40c01a9   Al Viro   In get_super() an...
639
640
  			__put_super(sb);
  			goto rescan;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
641
642
643
644
645
646
647
  		}
  	}
  	spin_unlock(&sb_lock);
  	return NULL;
  }
  
  EXPORT_SYMBOL(get_super);
4504230a7   Christoph Hellwig   freeze_bdev: grab...
648
649
  
  /**
6b6dc836a   Jan Kara   vfs: Provide func...
650
651
652
653
654
655
656
657
658
659
660
661
   *	get_super_thawed - get thawed superblock of a device
   *	@bdev: device to get the superblock for
   *
   *	Scans the superblock list and finds the superblock of the file system
   *	mounted on the device. The superblock is returned once it is thawed
   *	(or immediately if it was not frozen). %NULL is returned if no match
   *	is found.
   */
  struct super_block *get_super_thawed(struct block_device *bdev)
  {
  	while (1) {
  		struct super_block *s = get_super(bdev);
5accdf82b   Jan Kara   fs: Improve files...
662
  		if (!s || s->s_writers.frozen == SB_UNFROZEN)
6b6dc836a   Jan Kara   vfs: Provide func...
663
664
  			return s;
  		up_read(&s->s_umount);
5accdf82b   Jan Kara   fs: Improve files...
665
666
  		wait_event(s->s_writers.wait_unfrozen,
  			   s->s_writers.frozen == SB_UNFROZEN);
6b6dc836a   Jan Kara   vfs: Provide func...
667
668
669
670
671
672
  		put_super(s);
  	}
  }
  EXPORT_SYMBOL(get_super_thawed);
  
  /**
4504230a7   Christoph Hellwig   freeze_bdev: grab...
673
674
675
676
677
   * get_active_super - get an active reference to the superblock of a device
   * @bdev: device to get the superblock for
   *
   * Scans the superblock list and finds the superblock of the file system
   * mounted on the device given.  Returns the superblock with an active
d3f214730   Al Viro   Move grabbing s_u...
678
   * reference or %NULL if none was found.
4504230a7   Christoph Hellwig   freeze_bdev: grab...
679
680
681
682
683
684
685
   */
  struct super_block *get_active_super(struct block_device *bdev)
  {
  	struct super_block *sb;
  
  	if (!bdev)
  		return NULL;
1494583de   Al Viro   fix get_active_su...
686
  restart:
4504230a7   Christoph Hellwig   freeze_bdev: grab...
687
688
  	spin_lock(&sb_lock);
  	list_for_each_entry(sb, &super_blocks, s_list) {
a5166169f   Al Viro   vfs: convert fs_s...
689
  		if (hlist_unhashed(&sb->s_instances))
551de6f34   Al Viro   Leave superblocks...
690
  			continue;
1494583de   Al Viro   fix get_active_su...
691
  		if (sb->s_bdev == bdev) {
acfec9a5a   Al Viro   livelock avoidanc...
692
  			if (!grab_super(sb))
1494583de   Al Viro   fix get_active_su...
693
  				goto restart;
acfec9a5a   Al Viro   livelock avoidanc...
694
695
  			up_write(&sb->s_umount);
  			return sb;
1494583de   Al Viro   fix get_active_su...
696
  		}
4504230a7   Christoph Hellwig   freeze_bdev: grab...
697
698
699
700
  	}
  	spin_unlock(&sb_lock);
  	return NULL;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
701
   
df40c01a9   Al Viro   In get_super() an...
702
  /*
   * user_get_super - find the superblock whose s_dev equals @dev.
   *
   * Same walk as get_super(), but keyed on the device number instead of
   * the block_device pointer.  On success the superblock is returned with
   * s_count raised and s_umount held for reading; %NULL is returned if no
   * live match is found.
   */
  struct super_block *user_get_super(dev_t dev)
  {
  	struct super_block *sb;
  
  	spin_lock(&sb_lock);
  rescan:
  	list_for_each_entry(sb, &super_blocks, s_list) {
  		if (hlist_unhashed(&sb->s_instances))
  			continue;
  		if (sb->s_dev ==  dev) {
  			sb->s_count++;
  			spin_unlock(&sb_lock);
  			down_read(&sb->s_umount);
  			/* still alive? */
  			if (sb->s_root && (sb->s_flags & MS_BORN))
  				return sb;
  			up_read(&sb->s_umount);
  			/* nope, got unmounted */
  			spin_lock(&sb_lock);
  			__put_super(sb);
  			/* sb_lock was dropped above, so start the walk over */
  			goto rescan;
  		}
  	}
  	spin_unlock(&sb_lock);
  	return NULL;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
728
  /**
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
729
730
731
732
733
734
735
736
737
738
739
   *	do_remount_sb - asks filesystem to change mount options.
   *	@sb:	superblock in question
   *	@flags:	numeric part of options
   *	@data:	the rest of options
   *      @force: whether or not to force the change
   *
   *	Alters the mount options of a mounted file system.
   */
  int do_remount_sb(struct super_block *sb, int flags, void *data, int force)
  {
  	int retval;
c79d967de   Christoph Hellwig   quota: move remou...
740
  	int remount_ro;
4504230a7   Christoph Hellwig   freeze_bdev: grab...
741

5accdf82b   Jan Kara   fs: Improve files...
742
  	if (sb->s_writers.frozen != SB_UNFROZEN)
4504230a7   Christoph Hellwig   freeze_bdev: grab...
743
  		return -EBUSY;
9361401eb   David Howells   [PATCH] BLOCK: Ma...
744
  #ifdef CONFIG_BLOCK
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
745
746
  	if (!(flags & MS_RDONLY) && bdev_read_only(sb->s_bdev))
  		return -EACCES;
9361401eb   David Howells   [PATCH] BLOCK: Ma...
747
  #endif
4504230a7   Christoph Hellwig   freeze_bdev: grab...
748

d208bbdda   Nick Piggin   fs: improve remou...
749
  	remount_ro = (flags & MS_RDONLY) && !(sb->s_flags & MS_RDONLY);
d208bbdda   Nick Piggin   fs: improve remou...
750

0aec09d04   Al Viro   drop ->s_umount a...
751
  	if (remount_ro) {
fdab684d7   Al Viro   allow attaching f...
752
  		if (!hlist_empty(&sb->s_pins)) {
0aec09d04   Al Viro   drop ->s_umount a...
753
  			up_write(&sb->s_umount);
fdab684d7   Al Viro   allow attaching f...
754
  			group_pin_kill(&sb->s_pins);
0aec09d04   Al Viro   drop ->s_umount a...
755
756
757
758
759
760
761
762
763
  			down_write(&sb->s_umount);
  			if (!sb->s_root)
  				return 0;
  			if (sb->s_writers.frozen != SB_UNFROZEN)
  				return -EBUSY;
  			remount_ro = (flags & MS_RDONLY) && !(sb->s_flags & MS_RDONLY);
  		}
  	}
  	shrink_dcache_sb(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
764
765
  	/* If we are remounting RDONLY and current sb is read/write,
  	   make sure there are no rw files opened */
d208bbdda   Nick Piggin   fs: improve remou...
766
  	if (remount_ro) {
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
767
  		if (force) {
eee5cc270   Al Viro   get rid of s_file...
768
769
  			sb->s_readonly_remount = 1;
  			smp_wmb();
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
770
771
772
773
  		} else {
  			retval = sb_prepare_remount_readonly(sb);
  			if (retval)
  				return retval;
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
774
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
775
776
777
  	}
  
  	if (sb->s_op->remount_fs) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
778
  		retval = sb->s_op->remount_fs(sb, &flags, data);
2833eb2b4   Miklos Szeredi   vfs: ignore error...
779
780
  		if (retval) {
  			if (!force)
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
781
  				goto cancel_readonly;
2833eb2b4   Miklos Szeredi   vfs: ignore error...
782
783
784
785
786
  			/* If forced remount, go ahead despite any errors */
  			WARN(1, "forced remount of a %s fs returned %i
  ",
  			     sb->s_type->name, retval);
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
787
788
  	}
  	sb->s_flags = (sb->s_flags & ~MS_RMT_MASK) | (flags & MS_RMT_MASK);
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
789
790
791
  	/* Needs to be ordered wrt mnt_is_readonly() */
  	smp_wmb();
  	sb->s_readonly_remount = 0;
c79d967de   Christoph Hellwig   quota: move remou...
792

d208bbdda   Nick Piggin   fs: improve remou...
793
794
795
796
797
798
799
800
801
802
  	/*
  	 * Some filesystems modify their metadata via some other path than the
  	 * bdev buffer cache (eg. use a private mapping, or directories in
  	 * pagecache, etc). Also file data modifications go via their own
  	 * mappings. So If we try to mount readonly then copy the filesystem
  	 * from bdev, we could get stale data, so invalidate it to give a best
  	 * effort at coherency.
  	 */
  	if (remount_ro && sb->s_bdev)
  		invalidate_bdev(sb->s_bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
803
  	return 0;
4ed5e82fe   Miklos Szeredi   vfs: protect remo...
804
805
806
807
  
  cancel_readonly:
  	sb->s_readonly_remount = 0;
  	return retval;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
808
  }
a2a9537ac   Jens Axboe   Get rid of pdflus...
809
  static void do_emergency_remount(struct work_struct *work)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
810
  {
dca332528   Al Viro   no need for list_...
811
  	struct super_block *sb, *p = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
812
813
  
  	spin_lock(&sb_lock);
dca332528   Al Viro   no need for list_...
814
  	list_for_each_entry(sb, &super_blocks, s_list) {
a5166169f   Al Viro   vfs: convert fs_s...
815
  		if (hlist_unhashed(&sb->s_instances))
551de6f34   Al Viro   Leave superblocks...
816
  			continue;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
817
818
  		sb->s_count++;
  		spin_unlock(&sb_lock);
443b94baa   Al Viro   Make sure that al...
819
  		down_write(&sb->s_umount);
dabe0dc19   Al Viro   vfs: fix the rest...
820
821
  		if (sb->s_root && sb->s_bdev && (sb->s_flags & MS_BORN) &&
  		    !(sb->s_flags & MS_RDONLY)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
822
  			/*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
823
824
  			 * What lock protects sb->s_flags??
  			 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
825
  			do_remount_sb(sb, MS_RDONLY, NULL, 1);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
826
  		}
443b94baa   Al Viro   Make sure that al...
827
  		up_write(&sb->s_umount);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
828
  		spin_lock(&sb_lock);
dca332528   Al Viro   no need for list_...
829
830
831
  		if (p)
  			__put_super(p);
  		p = sb;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
832
  	}
dca332528   Al Viro   no need for list_...
833
834
  	if (p)
  		__put_super(p);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
835
  	spin_unlock(&sb_lock);
a2a9537ac   Jens Axboe   Get rid of pdflus...
836
  	kfree(work);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
837
838
839
840
841
842
  	printk("Emergency Remount complete
  ");
  }
  
  void emergency_remount(void)
  {
a2a9537ac   Jens Axboe   Get rid of pdflus...
843
844
845
846
847
848
849
  	struct work_struct *work;
  
  	work = kmalloc(sizeof(*work), GFP_ATOMIC);
  	if (work) {
  		INIT_WORK(work, do_emergency_remount);
  		schedule_work(work);
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
850
851
852
853
854
855
  }
  
  /*
   * Unnamed block devices are dummy devices used by virtual
   * filesystems which don't use real block-devices.  -- jrs
   */
  
  static DEFINE_IDA(unnamed_dev_ida);
  static DEFINE_SPINLOCK(unnamed_dev_lock);/* protects the above */
  /* Many userspace utilities consider an FSID of 0 invalid.
   * Always return at least 1 from get_anon_bdev.
   */
  static int unnamed_dev_start = 1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
862

0ee5dc676   Al Viro   btrfs: kill magic...
863
  /*
   * get_anon_bdev - allocate an anonymous (major 0) device number.
   * @p: where to store the allocated dev_t
   *
   * Allocates an id at or above unnamed_dev_start from unnamed_dev_ida
   * and stores MKDEV(0, id) in *@p.
   *
   * Returns 0 on success, -ENOMEM if ida_pre_get() fails, -EAGAIN for any
   * ida_get_new_above() error other than the retried -EAGAIN race, and
   * -EMFILE if the id does not fit in MINORBITS (the id is released again
   * in that case).
   */
  int get_anon_bdev(dev_t *p)
  {
  	int dev;
  	int error;
  
   retry:
  	if (ida_pre_get(&unnamed_dev_ida, GFP_ATOMIC) == 0)
  		return -ENOMEM;
  	spin_lock(&unnamed_dev_lock);
  	error = ida_get_new_above(&unnamed_dev_ida, unnamed_dev_start, &dev);
  	if (!error)
  		unnamed_dev_start = dev + 1;
  	spin_unlock(&unnamed_dev_lock);
  	if (error == -EAGAIN)
  		/* We raced and lost with another CPU. */
  		goto retry;
  	else if (error)
  		return -EAGAIN;
  
  	if (dev >= (1 << MINORBITS)) {
  		/* Out of minor numbers: give the id back and undo the hint. */
  		spin_lock(&unnamed_dev_lock);
  		ida_remove(&unnamed_dev_ida, dev);
  		if (unnamed_dev_start > dev)
  			unnamed_dev_start = dev;
  		spin_unlock(&unnamed_dev_lock);
  		return -EMFILE;
  	}
  	*p = MKDEV(0, dev & MINORMASK);
  	return 0;
  }
0ee5dc676   Al Viro   btrfs: kill magic...
892
  EXPORT_SYMBOL(get_anon_bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
893

0ee5dc676   Al Viro   btrfs: kill magic...
894
  /*
   * free_anon_bdev - release a device number obtained from get_anon_bdev().
   * @dev: device number whose minor is the id to release
   *
   * Removes the id from unnamed_dev_ida and lowers unnamed_dev_start to it
   * if it is below the current search start.
   */
  void free_anon_bdev(dev_t dev)
  {
  	int slot = MINOR(dev);
  
  	spin_lock(&unnamed_dev_lock);
  	ida_remove(&unnamed_dev_ida, slot);
  	if (slot < unnamed_dev_start)
  		unnamed_dev_start = slot;
  	spin_unlock(&unnamed_dev_lock);
  }
0ee5dc676   Al Viro   btrfs: kill magic...
903
904
905
906
  EXPORT_SYMBOL(free_anon_bdev);
  
  int set_anon_super(struct super_block *s, void *data)
  {
df0ce26cb   Christoph Hellwig   fs: remove defaul...
907
  	return get_anon_bdev(&s->s_dev);
0ee5dc676   Al Viro   btrfs: kill magic...
908
909
910
911
912
913
914
915
916
917
  }
  
  EXPORT_SYMBOL(set_anon_super);
  
  /*
   * kill_anon_super - shut down a superblock that uses an anonymous
   * device number and release that number.
   */
  void kill_anon_super(struct super_block *sb)
  {
  	/*
  	 * s_dev is read before the shutdown and only freed afterwards;
  	 * presumably sb must not be dereferenced once
  	 * generic_shutdown_super() has run -- TODO confirm.
  	 */
  	dev_t dev = sb->s_dev;
  	generic_shutdown_super(sb);
  	free_anon_bdev(dev);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
918
919
  
  EXPORT_SYMBOL(kill_anon_super);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
920
921
922
923
924
925
926
927
  void kill_litter_super(struct super_block *sb)
  {
  	if (sb->s_root)
  		d_genocide(sb->s_root);
  	kill_anon_super(sb);
  }
  
  EXPORT_SYMBOL(kill_litter_super);
909e6d947   Serge E. Hallyn   namespaces: move ...
928
929
930
931
932
933
934
935
936
937
  /*
   * "test" callback handed to sget_userns() by mount_ns(): a superblock
   * matches when its s_fs_info pointer equals @data (the namespace pointer
   * mount_ns() passes in).
   */
  static int ns_test_super(struct super_block *sb, void *data)
  {
  	return sb->s_fs_info == data;
  }
  
  /*
   * "set" callback handed to sget_userns() by mount_ns(): records @data in
   * s_fs_info, then assigns an anonymous device number.  Returns the
   * result of set_anon_super().
   */
  static int ns_set_super(struct super_block *sb, void *data)
  {
  	sb->s_fs_info = data;
  	return set_anon_super(sb, NULL);
  }
d91ee87d8   Eric W. Biederman   vfs: Pass data, n...
938
939
940
  struct dentry *mount_ns(struct file_system_type *fs_type,
  	int flags, void *data, void *ns, struct user_namespace *user_ns,
  	int (*fill_super)(struct super_block *, void *, int))
909e6d947   Serge E. Hallyn   namespaces: move ...
941
942
  {
  	struct super_block *sb;
d91ee87d8   Eric W. Biederman   vfs: Pass data, n...
943
944
945
946
947
  	/* Don't allow mounting unless the caller has CAP_SYS_ADMIN
  	 * over the namespace.
  	 */
  	if (!(flags & MS_KERNMOUNT) && !ns_capable(user_ns, CAP_SYS_ADMIN))
  		return ERR_PTR(-EPERM);
6e4eab577   Eric W. Biederman   fs: Add user name...
948
949
  	sb = sget_userns(fs_type, ns_test_super, ns_set_super, flags,
  			 user_ns, ns);
909e6d947   Serge E. Hallyn   namespaces: move ...
950
  	if (IS_ERR(sb))
ceefda693   Al Viro   switch get_sb_ns(...
951
  		return ERR_CAST(sb);
909e6d947   Serge E. Hallyn   namespaces: move ...
952
953
954
  
  	if (!sb->s_root) {
  		int err;
909e6d947   Serge E. Hallyn   namespaces: move ...
955
956
  		err = fill_super(sb, data, flags & MS_SILENT ? 1 : 0);
  		if (err) {
74dbbdd7f   Al Viro   New helper: deact...
957
  			deactivate_locked_super(sb);
ceefda693   Al Viro   switch get_sb_ns(...
958
  			return ERR_PTR(err);
909e6d947   Serge E. Hallyn   namespaces: move ...
959
960
961
962
  		}
  
  		sb->s_flags |= MS_ACTIVE;
  	}
ceefda693   Al Viro   switch get_sb_ns(...
963
  	return dget(sb->s_root);
909e6d947   Serge E. Hallyn   namespaces: move ...
964
  }
ceefda693   Al Viro   switch get_sb_ns(...
965
  EXPORT_SYMBOL(mount_ns);
909e6d947   Serge E. Hallyn   namespaces: move ...
966

9361401eb   David Howells   [PATCH] BLOCK: Ma...
967
  #ifdef CONFIG_BLOCK
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
968
969
970
971
  /*
   * "set" callback handed to sget() by mount_bdev(): binds the superblock
   * to the block device passed as @data.  Always returns 0.
   */
  static int set_bdev_super(struct super_block *s, void *data)
  {
  	s->s_bdev = data;
  	s->s_dev = s->s_bdev->bd_dev;
  
  	/*
  	 * We set the bdi here to the queue backing, file systems can
  	 * overwrite this in ->fill_super()
  	 */
  	s->s_bdi = &bdev_get_queue(s->s_bdev)->backing_dev_info;
  	return 0;
  }
  
  /*
   * "test" callback handed to sget() by mount_bdev(): a superblock matches
   * when its s_bdev is the block device passed as @data.
   */
  static int test_bdev_super(struct super_block *s, void *data)
  {
  	return (void *)s->s_bdev == data;
  }
152a08366   Al Viro   new helper: mount...
985
  struct dentry *mount_bdev(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
986
  	int flags, const char *dev_name, void *data,
152a08366   Al Viro   new helper: mount...
987
  	int (*fill_super)(struct super_block *, void *, int))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
988
989
990
  {
  	struct block_device *bdev;
  	struct super_block *s;
d4d776299   Tejun Heo   block: clean up b...
991
  	fmode_t mode = FMODE_READ | FMODE_EXCL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
992
  	int error = 0;
30c40d2c0   Al Viro   [PATCH] propagate...
993
994
  	if (!(flags & MS_RDONLY))
  		mode |= FMODE_WRITE;
d4d776299   Tejun Heo   block: clean up b...
995
  	bdev = blkdev_get_by_path(dev_name, mode, fs_type);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
996
  	if (IS_ERR(bdev))
152a08366   Al Viro   new helper: mount...
997
  		return ERR_CAST(bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
998
999
1000
1001
1002
1003
  
  	/*
  	 * once the super is inserted into the list by sget, s_umount
  	 * will protect the lockfs code from trying to start a snapshot
  	 * while we are mounting
  	 */
4fadd7bb2   Christoph Hellwig   freeze_bdev: kill...
1004
1005
1006
1007
1008
1009
  	mutex_lock(&bdev->bd_fsfreeze_mutex);
  	if (bdev->bd_fsfreeze_count > 0) {
  		mutex_unlock(&bdev->bd_fsfreeze_mutex);
  		error = -EBUSY;
  		goto error_bdev;
  	}
9249e17fe   David Howells   VFS: Pass mount f...
1010
1011
  	s = sget(fs_type, test_bdev_super, set_bdev_super, flags | MS_NOSEC,
  		 bdev);
4fadd7bb2   Christoph Hellwig   freeze_bdev: kill...
1012
  	mutex_unlock(&bdev->bd_fsfreeze_mutex);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1013
  	if (IS_ERR(s))
454e2398b   David Howells   [PATCH] VFS: Perm...
1014
  		goto error_s;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1015
1016
1017
  
  	if (s->s_root) {
  		if ((flags ^ s->s_flags) & MS_RDONLY) {
74dbbdd7f   Al Viro   New helper: deact...
1018
  			deactivate_locked_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
1019
1020
  			error = -EBUSY;
  			goto error_bdev;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1021
  		}
454e2398b   David Howells   [PATCH] VFS: Perm...
1022

4f331f01b   Tejun Heo   vfs: don't hold s...
1023
1024
  		/*
  		 * s_umount nests inside bd_mutex during
e525fd89d   Tejun Heo   block: make blkde...
1025
1026
1027
1028
  		 * __invalidate_device().  blkdev_put() acquires
  		 * bd_mutex and can't be called under s_umount.  Drop
  		 * s_umount temporarily.  This is safe as we're
  		 * holding an active reference.
4f331f01b   Tejun Heo   vfs: don't hold s...
1029
1030
  		 */
  		up_write(&s->s_umount);
d4d776299   Tejun Heo   block: clean up b...
1031
  		blkdev_put(bdev, mode);
4f331f01b   Tejun Heo   vfs: don't hold s...
1032
  		down_write(&s->s_umount);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1033
  	} else {
30c40d2c0   Al Viro   [PATCH] propagate...
1034
  		s->s_mode = mode;
a1c6f0573   Dmitry Monakhov   fs: use block_dev...
1035
  		snprintf(s->s_id, sizeof(s->s_id), "%pg", bdev);
e78c9a004   Pekka Enberg   [PATCH] fs: remov...
1036
  		sb_set_blocksize(s, block_size(bdev));
9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
1037
  		error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1038
  		if (error) {
74dbbdd7f   Al Viro   New helper: deact...
1039
  			deactivate_locked_super(s);
454e2398b   David Howells   [PATCH] VFS: Perm...
1040
  			goto error;
fa675765a   Greg Kroah-Hartman   Revert mount/umou...
1041
  		}
454e2398b   David Howells   [PATCH] VFS: Perm...
1042
1043
  
  		s->s_flags |= MS_ACTIVE;
87d8fe1ee   Theodore Ts'o   add releasepage h...
1044
  		bdev->bd_super = s;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1045
  	}
152a08366   Al Viro   new helper: mount...
1046
  	return dget(s->s_root);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1047

454e2398b   David Howells   [PATCH] VFS: Perm...
1048
1049
1050
  error_s:
  	error = PTR_ERR(s);
  error_bdev:
d4d776299   Tejun Heo   block: clean up b...
1051
  	blkdev_put(bdev, mode);
454e2398b   David Howells   [PATCH] VFS: Perm...
1052
  error:
152a08366   Al Viro   new helper: mount...
1053
1054
1055
  	return ERR_PTR(error);
  }
  EXPORT_SYMBOL(mount_bdev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1056
1057
1058
  void kill_block_super(struct super_block *sb)
  {
  	struct block_device *bdev = sb->s_bdev;
30c40d2c0   Al Viro   [PATCH] propagate...
1059
  	fmode_t mode = sb->s_mode;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1060

ddbaaf302   H Hartley Sweeten   NULL noise in fs/...
1061
  	bdev->bd_super = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1062
1063
  	generic_shutdown_super(sb);
  	sync_blockdev(bdev);
d4d776299   Tejun Heo   block: clean up b...
1064
  	WARN_ON_ONCE(!(mode & FMODE_EXCL));
e525fd89d   Tejun Heo   block: make blkde...
1065
  	blkdev_put(bdev, mode | FMODE_EXCL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1066
1067
1068
  }
  
  EXPORT_SYMBOL(kill_block_super);
9361401eb   David Howells   [PATCH] BLOCK: Ma...
1069
  #endif
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1070

3c26ff6e4   Al Viro   convert get_sb_no...
1071
  struct dentry *mount_nodev(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1072
  	int flags, void *data,
3c26ff6e4   Al Viro   convert get_sb_no...
1073
  	int (*fill_super)(struct super_block *, void *, int))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1074
1075
  {
  	int error;
9249e17fe   David Howells   VFS: Pass mount f...
1076
  	struct super_block *s = sget(fs_type, NULL, set_anon_super, flags, NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1077
1078
  
  	if (IS_ERR(s))
3c26ff6e4   Al Viro   convert get_sb_no...
1079
  		return ERR_CAST(s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1080

9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
1081
  	error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1082
  	if (error) {
74dbbdd7f   Al Viro   New helper: deact...
1083
  		deactivate_locked_super(s);
3c26ff6e4   Al Viro   convert get_sb_no...
1084
  		return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1085
1086
  	}
  	s->s_flags |= MS_ACTIVE;
3c26ff6e4   Al Viro   convert get_sb_no...
1087
  	return dget(s->s_root);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1088
  }
3c26ff6e4   Al Viro   convert get_sb_no...
1089
  EXPORT_SYMBOL(mount_nodev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1090
1091
1092
1093
  /*
   * "test" callback handed to sget() by mount_single(): reports a match
   * for every superblock it is asked about; both arguments are ignored.
   */
  static int compare_single(struct super_block *s, void *p)
  {
  	return 1;
  }
fc14f2fef   Al Viro   convert get_sb_si...
1094
  struct dentry *mount_single(struct file_system_type *fs_type,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1095
  	int flags, void *data,
fc14f2fef   Al Viro   convert get_sb_si...
1096
  	int (*fill_super)(struct super_block *, void *, int))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1097
1098
1099
  {
  	struct super_block *s;
  	int error;
9249e17fe   David Howells   VFS: Pass mount f...
1100
  	s = sget(fs_type, compare_single, set_anon_super, flags, NULL);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1101
  	if (IS_ERR(s))
fc14f2fef   Al Viro   convert get_sb_si...
1102
  		return ERR_CAST(s);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1103
  	if (!s->s_root) {
9b04c997b   Theodore Ts'o   [PATCH] vfs: MS_V...
1104
  		error = fill_super(s, data, flags & MS_SILENT ? 1 : 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1105
  		if (error) {
74dbbdd7f   Al Viro   New helper: deact...
1106
  			deactivate_locked_super(s);
fc14f2fef   Al Viro   convert get_sb_si...
1107
  			return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1108
1109
  		}
  		s->s_flags |= MS_ACTIVE;
9329d1bea   Kay Sievers   vfs: get_sb_singl...
1110
1111
  	} else {
  		do_remount_sb(s, flags, data, 0);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1112
  	}
fc14f2fef   Al Viro   convert get_sb_si...
1113
1114
1115
  	return dget(s->s_root);
  }
  EXPORT_SYMBOL(mount_single);
9d412a43c   Al Viro   vfs: split off vf...
1116
1117
  struct dentry *
  mount_fs(struct file_system_type *type, int flags, const char *name, void *data)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1118
  {
c96e41e92   Al Viro   beginning of tran...
1119
  	struct dentry *root;
9d412a43c   Al Viro   vfs: split off vf...
1120
  	struct super_block *sb;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1121
  	char *secdata = NULL;
9d412a43c   Al Viro   vfs: split off vf...
1122
  	int error = -ENOMEM;
8089352a1   Al Viro   Mirror MS_KERNMOU...
1123

e00075298   Eric Paris   LSM/SELinux: Inte...
1124
  	if (data && !(type->fs_flags & FS_BINARY_MOUNTDATA)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1125
  		secdata = alloc_secdata();
454e2398b   David Howells   [PATCH] VFS: Perm...
1126
  		if (!secdata)
9d412a43c   Al Viro   vfs: split off vf...
1127
  			goto out;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1128

e00075298   Eric Paris   LSM/SELinux: Inte...
1129
  		error = security_sb_copy_data(data, secdata);
454e2398b   David Howells   [PATCH] VFS: Perm...
1130
  		if (error)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1131
  			goto out_free_secdata;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1132
  	}
1a102ff92   Al Viro   vfs: bury ->get_sb()
1133
1134
1135
1136
  	root = type->mount(type, flags, name, data);
  	if (IS_ERR(root)) {
  		error = PTR_ERR(root);
  		goto out_free_secdata;
c96e41e92   Al Viro   beginning of tran...
1137
  	}
9d412a43c   Al Viro   vfs: split off vf...
1138
1139
1140
1141
  	sb = root->d_sb;
  	BUG_ON(!sb);
  	WARN_ON(!sb->s_bdi);
  	sb->s_flags |= MS_BORN;
454e2398b   David Howells   [PATCH] VFS: Perm...
1142

9d412a43c   Al Viro   vfs: split off vf...
1143
  	error = security_sb_kern_mount(sb, flags, secdata);
5129a469a   Jörn Engel   Catch filesystems...
1144
1145
  	if (error)
  		goto out_sb;
454e2398b   David Howells   [PATCH] VFS: Perm...
1146

42cb56ae2   Jeff Layton   vfs: change sb->s...
1147
1148
1149
1150
  	/*
  	 * filesystems should never set s_maxbytes larger than MAX_LFS_FILESIZE
  	 * but s_maxbytes was an unsigned long long for many releases. Throw
  	 * this warning for a little while to try and catch filesystems that
4358b5678   Jeff Layton   VFS: trivial: fix...
1151
  	 * violate this rule.
42cb56ae2   Jeff Layton   vfs: change sb->s...
1152
  	 */
9d412a43c   Al Viro   vfs: split off vf...
1153
1154
1155
  	WARN((sb->s_maxbytes < 0), "%s set sb->s_maxbytes to "
  		"negative value (%lld)
  ", type->name, sb->s_maxbytes);
42cb56ae2   Jeff Layton   vfs: change sb->s...
1156

9d412a43c   Al Viro   vfs: split off vf...
1157
  	up_write(&sb->s_umount);
8680e22f2   Gerald Schaefer   [PATCH] VFS: memo...
1158
  	free_secdata(secdata);
9d412a43c   Al Viro   vfs: split off vf...
1159
  	return root;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1160
  out_sb:
9d412a43c   Al Viro   vfs: split off vf...
1161
1162
  	dput(root);
  	deactivate_locked_super(sb);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1163
1164
  out_free_secdata:
  	free_secdata(secdata);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1165
  out:
454e2398b   David Howells   [PATCH] VFS: Perm...
1166
  	return ERR_PTR(error);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1167
  }
5accdf82b   Jan Kara   fs: Improve files...
1168
1169
1170
1171
1172
1173
  /*
   * This is an internal function, please use sb_end_{write,pagefault,intwrite}
   * instead.
   */
  void __sb_end_write(struct super_block *sb, int level)
  {
8129ed296   Oleg Nesterov   change sb_writers...
1174
  	percpu_up_read(sb->s_writers.rw_sem + level-1);
5accdf82b   Jan Kara   fs: Improve files...
1175
1176
  }
  EXPORT_SYMBOL(__sb_end_write);
f4b554af9   Oleg Nesterov   fix the broken lo...
1177
1178
1179
1180
1181
1182
1183
  /*
   * Take the read side of the freeze-protection semaphore for @level
   * (1-based: level N uses sb->s_writers.rw_sem[N - 1]).
   *
   * If @wait is true the call blocks until the lock is available, otherwise
   * only a trylock is attempted.
   *
   * Returns 1 if the protection was obtained, or the result of
   * percpu_down_read_trylock() when the trylock path was used.
   *
   * This is an internal function, please use sb_start_{write,pagefault,intwrite}
   * instead.
   */
  int __sb_start_write(struct super_block *sb, int level, bool wait)
  {
  	bool force_trylock = false;
  	int ret = 1;

  #ifdef CONFIG_LOCKDEP
  	/*
  	 * We want lockdep to tell us about possible deadlocks with freezing
  	 * but it's a bit tricky to properly instrument it. Getting a freeze
  	 * protection works as getting a read lock but there are subtle
  	 * problems. XFS for example gets freeze protection on internal level
  	 * twice in some cases, which is OK only because we already hold a
  	 * freeze protection also on higher level. Due to these cases we have
  	 * to use wait == F (trylock mode) which must not fail.
  	 */
  	if (wait) {
  		int i;

  		/* Is any level below the requested one already held? */
  		for (i = 0; i < level - 1; i++)
  			if (percpu_rwsem_is_held(sb->s_writers.rw_sem + i)) {
  				force_trylock = true;
  				break;
  			}
  	}
  #endif
  	if (wait && !force_trylock)
  		percpu_down_read(sb->s_writers.rw_sem + level-1);
  	else
  		ret = percpu_down_read_trylock(sb->s_writers.rw_sem + level-1);

  	/* A forced trylock is expected to always succeed (see above). */
  	WARN_ON(force_trylock && !ret);
  	return ret;
  }
  EXPORT_SYMBOL(__sb_start_write);
  
  /**
   * sb_wait_write - wait until all writers to given file system finish
   * @sb: the super for which we wait
   * @level: type of writers we wait for (normal vs page fault)
   *
   * This function waits until there are no writers of given type to given file
8129ed296   Oleg Nesterov   change sb_writers...
1221
   * system.
5accdf82b   Jan Kara   fs: Improve files...
1222
1223
1224
   */
  static void sb_wait_write(struct super_block *sb, int level)
  {
8129ed296   Oleg Nesterov   change sb_writers...
1225
  	percpu_down_write(sb->s_writers.rw_sem + level-1);
8129ed296   Oleg Nesterov   change sb_writers...
1226
  }
5accdf82b   Jan Kara   fs: Improve files...
1227

f1a962203   Oleg Nesterov   fs/super.c: don't...
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
  /*
   * Tell lockdep that every freeze-level semaphore is released, highest level
   * first.  We are about to return to userspace without these locks being
   * tracked any further; ownership passes to whoever calls thaw_super(), which
   * performs the real unlock.
   */
  static void lockdep_sb_freeze_release(struct super_block *sb)
  {
  	int level = SB_FREEZE_LEVELS;

  	while (level-- > 0)
  		percpu_rwsem_release(sb->s_writers.rw_sem + level, 0, _THIS_IP_);
  }
  
  /*
   * Tell lockdep we are holding these locks before we call ->unfreeze_fs(sb).
   */
  static void lockdep_sb_freeze_acquire(struct super_block *sb)
8129ed296   Oleg Nesterov   change sb_writers...
1244
1245
  {
  	int level;
5accdf82b   Jan Kara   fs: Improve files...
1246

8129ed296   Oleg Nesterov   change sb_writers...
1247
1248
  	for (level = 0; level < SB_FREEZE_LEVELS; ++level)
  		percpu_rwsem_acquire(sb->s_writers.rw_sem + level, 0, _THIS_IP_);
f1a962203   Oleg Nesterov   fs/super.c: don't...
1249
1250
1251
1252
1253
  }
  
  static void sb_freeze_unlock(struct super_block *sb)
  {
  	int level;
5accdf82b   Jan Kara   fs: Improve files...
1254

8129ed296   Oleg Nesterov   change sb_writers...
1255
1256
  	for (level = SB_FREEZE_LEVELS - 1; level >= 0; level--)
  		percpu_up_write(sb->s_writers.rw_sem + level);
5accdf82b   Jan Kara   fs: Improve files...
1257
  }
18e9e5104   Josef Bacik   Introduce freeze_...
1258
  /**
7000d3c42   Randy Dunlap   fs/super: fix ker...
1259
1260
   * freeze_super - lock the filesystem and force it into a consistent state
   * @sb: the super to lock
18e9e5104   Josef Bacik   Introduce freeze_...
1261
1262
1263
1264
   *
   * Syncs the super to make sure the filesystem is consistent and calls the fs's
   * freeze_fs.  Subsequent calls to this without first thawing the fs will return
   * -EBUSY.
5accdf82b   Jan Kara   fs: Improve files...
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
   *
   * During this function, sb->s_writers.frozen goes through these values:
   *
   * SB_UNFROZEN: File system is normal, all writes progress as usual.
   *
   * SB_FREEZE_WRITE: The file system is in the process of being frozen.  New
   * writes should be blocked, though page faults are still allowed. We wait for
   * all writes to complete and then proceed to the next stage.
   *
   * SB_FREEZE_PAGEFAULT: Freezing continues. Now also page faults are blocked
   * but internal fs threads can still modify the filesystem (although they
   * should not dirty new pages or inodes), writeback can run etc. After waiting
   * for all running page faults we sync the filesystem which will clean all
   * dirty pages and inodes (no new dirty pages or inodes can be created when
   * sync is running).
   *
   * SB_FREEZE_FS: The file system is frozen. Now all internal sources of fs
   * modification are blocked (e.g. XFS preallocation truncation on inode
   * reclaim). This is usually implemented by blocking new transactions for
   * filesystems that have them and need this additional guard. After all
   * internal writers are finished we call ->freeze_fs() to finish filesystem
   * freezing. Then we transition to SB_FREEZE_COMPLETE state. This state is
   * mostly auxiliary for filesystems to verify they do not modify frozen fs.
   *
   * sb->s_writers.frozen is protected by sb->s_umount.
18e9e5104   Josef Bacik   Introduce freeze_...
1290
1291
1292
1293
1294
1295
1296
   */
  int freeze_super(struct super_block *sb)
  {
  	int ret;
  
  	atomic_inc(&sb->s_active);
  	down_write(&sb->s_umount);
5accdf82b   Jan Kara   fs: Improve files...
1297
  	if (sb->s_writers.frozen != SB_UNFROZEN) {
18e9e5104   Josef Bacik   Introduce freeze_...
1298
1299
1300
  		deactivate_locked_super(sb);
  		return -EBUSY;
  	}
dabe0dc19   Al Viro   vfs: fix the rest...
1301
1302
1303
1304
  	if (!(sb->s_flags & MS_BORN)) {
  		up_write(&sb->s_umount);
  		return 0;	/* sic - it's "nothing to do" */
  	}
18e9e5104   Josef Bacik   Introduce freeze_...
1305
  	if (sb->s_flags & MS_RDONLY) {
5accdf82b   Jan Kara   fs: Improve files...
1306
1307
  		/* Nothing to do really... */
  		sb->s_writers.frozen = SB_FREEZE_COMPLETE;
18e9e5104   Josef Bacik   Introduce freeze_...
1308
1309
1310
  		up_write(&sb->s_umount);
  		return 0;
  	}
5accdf82b   Jan Kara   fs: Improve files...
1311
  	sb->s_writers.frozen = SB_FREEZE_WRITE;
5accdf82b   Jan Kara   fs: Improve files...
1312
1313
  	/* Release s_umount to preserve sb_start_write -> s_umount ordering */
  	up_write(&sb->s_umount);
5accdf82b   Jan Kara   fs: Improve files...
1314
  	sb_wait_write(sb, SB_FREEZE_WRITE);
8129ed296   Oleg Nesterov   change sb_writers...
1315
  	down_write(&sb->s_umount);
5accdf82b   Jan Kara   fs: Improve files...
1316
1317
  
  	/* Now we go and block page faults... */
5accdf82b   Jan Kara   fs: Improve files...
1318
  	sb->s_writers.frozen = SB_FREEZE_PAGEFAULT;
5accdf82b   Jan Kara   fs: Improve files...
1319
1320
1321
  	sb_wait_write(sb, SB_FREEZE_PAGEFAULT);
  
  	/* All writers are done so after syncing there won't be dirty data */
18e9e5104   Josef Bacik   Introduce freeze_...
1322
  	sync_filesystem(sb);
5accdf82b   Jan Kara   fs: Improve files...
1323
1324
  	/* Now wait for internal filesystem counter */
  	sb->s_writers.frozen = SB_FREEZE_FS;
5accdf82b   Jan Kara   fs: Improve files...
1325
  	sb_wait_write(sb, SB_FREEZE_FS);
18e9e5104   Josef Bacik   Introduce freeze_...
1326

18e9e5104   Josef Bacik   Introduce freeze_...
1327
1328
1329
1330
1331
1332
  	if (sb->s_op->freeze_fs) {
  		ret = sb->s_op->freeze_fs(sb);
  		if (ret) {
  			printk(KERN_ERR
  				"VFS:Filesystem freeze failed
  ");
5accdf82b   Jan Kara   fs: Improve files...
1333
  			sb->s_writers.frozen = SB_UNFROZEN;
8129ed296   Oleg Nesterov   change sb_writers...
1334
  			sb_freeze_unlock(sb);
5accdf82b   Jan Kara   fs: Improve files...
1335
  			wake_up(&sb->s_writers.wait_unfrozen);
18e9e5104   Josef Bacik   Introduce freeze_...
1336
1337
1338
1339
  			deactivate_locked_super(sb);
  			return ret;
  		}
  	}
5accdf82b   Jan Kara   fs: Improve files...
1340
  	/*
89f39af12   Oleg Nesterov   fs/super.c: fix r...
1341
1342
  	 * For debugging purposes so that fs can warn if it sees write activity
  	 * when frozen is set to SB_FREEZE_COMPLETE, and for thaw_super().
5accdf82b   Jan Kara   fs: Improve files...
1343
1344
  	 */
  	sb->s_writers.frozen = SB_FREEZE_COMPLETE;
f1a962203   Oleg Nesterov   fs/super.c: don't...
1345
  	lockdep_sb_freeze_release(sb);
18e9e5104   Josef Bacik   Introduce freeze_...
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
  	up_write(&sb->s_umount);
  	return 0;
  }
  EXPORT_SYMBOL(freeze_super);
  
  /**
   * thaw_super -- unlock filesystem
   * @sb: the super to thaw
   *
   * Unlocks the filesystem and marks it writeable again after freeze_super().
   */
  int thaw_super(struct super_block *sb)
  {
  	int error;
  
  	down_write(&sb->s_umount);
89f39af12   Oleg Nesterov   fs/super.c: fix r...
1362
  	if (sb->s_writers.frozen != SB_FREEZE_COMPLETE) {
18e9e5104   Josef Bacik   Introduce freeze_...
1363
1364
1365
  		up_write(&sb->s_umount);
  		return -EINVAL;
  	}
8129ed296   Oleg Nesterov   change sb_writers...
1366
1367
  	if (sb->s_flags & MS_RDONLY) {
  		sb->s_writers.frozen = SB_UNFROZEN;
18e9e5104   Josef Bacik   Introduce freeze_...
1368
  		goto out;
8129ed296   Oleg Nesterov   change sb_writers...
1369
  	}
18e9e5104   Josef Bacik   Introduce freeze_...
1370

f1a962203   Oleg Nesterov   fs/super.c: don't...
1371
  	lockdep_sb_freeze_acquire(sb);
18e9e5104   Josef Bacik   Introduce freeze_...
1372
1373
1374
1375
1376
1377
  	if (sb->s_op->unfreeze_fs) {
  		error = sb->s_op->unfreeze_fs(sb);
  		if (error) {
  			printk(KERN_ERR
  				"VFS:Filesystem thaw failed
  ");
f1a962203   Oleg Nesterov   fs/super.c: don't...
1378
  			lockdep_sb_freeze_release(sb);
18e9e5104   Josef Bacik   Introduce freeze_...
1379
1380
1381
1382
  			up_write(&sb->s_umount);
  			return error;
  		}
  	}
5accdf82b   Jan Kara   fs: Improve files...
1383
  	sb->s_writers.frozen = SB_UNFROZEN;
8129ed296   Oleg Nesterov   change sb_writers...
1384
1385
  	sb_freeze_unlock(sb);
  out:
5accdf82b   Jan Kara   fs: Improve files...
1386
  	wake_up(&sb->s_writers.wait_unfrozen);
18e9e5104   Josef Bacik   Introduce freeze_...
1387
  	deactivate_locked_super(sb);
18e9e5104   Josef Bacik   Introduce freeze_...
1388
1389
1390
  	return 0;
  }
  EXPORT_SYMBOL(thaw_super);