Blame view

block/genhd.c 58 KB
3dcf60bcb   Christoph Hellwig   block: add SPDX t...
1
  // SPDX-License-Identifier: GPL-2.0
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2
3
4
  /*
   *  gendisk handling
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
5
  #include <linux/module.h>
3ad5cee5c   Christoph Hellwig   block: move sysfs...
6
  #include <linux/ctype.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
7
8
  #include <linux/fs.h>
  #include <linux/genhd.h>
b446b60e4   Andrew Morton   [PATCH] rework re...
9
  #include <linux/kdev_t.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
11
  #include <linux/kernel.h>
  #include <linux/blkdev.h>
66114cad6   Tejun Heo   writeback: separa...
12
  #include <linux/backing-dev.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
13
14
  #include <linux/init.h>
  #include <linux/spinlock.h>
f500975a3   Alexey Dobriyan   proc: move rest o...
15
  #include <linux/proc_fs.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
16
17
18
19
  #include <linux/seq_file.h>
  #include <linux/slab.h>
  #include <linux/kmod.h>
  #include <linux/kobj_map.h>
58383af62   Jes Sorensen   [PATCH] kobj_map ...
20
  #include <linux/mutex.h>
bcce3de1b   Tejun Heo   block: implement ...
21
  #include <linux/idr.h>
77ea887e4   Tejun Heo   implement in-kern...
22
  #include <linux/log2.h>
25e823c8c   Ming Lei   block/genhd.c: ap...
23
  #include <linux/pm_runtime.h>
99e6608c9   Vishal Verma   block: Add badblo...
24
  #include <linux/badblocks.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
25

ff88972c8   Adrian Bunk   proper prototype ...
26
  #include "blk.h"
edfaa7c36   Kay Sievers   Driver core: conv...
27
  static DEFINE_MUTEX(block_class_lock);
31eb61867   Christoph Hellwig   block: mark block...
28
  static struct kobject *block_depr;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
29

bcce3de1b   Tejun Heo   block: implement ...
30
  /* for extended dynamic devt allocation, currently only one major is used */
ce23bba84   Tejun Heo   block: fix synchr...
31
  #define NR_EXT_DEVT		(1 << MINORBITS)
bcce3de1b   Tejun Heo   block: implement ...
32

2da78092d   Keith Busch   block: Fix dev_t ...
33
  /* For extended devt allocation.  ext_devt_lock prevents look up
bcce3de1b   Tejun Heo   block: implement ...
34
35
   * results from going away underneath its user.
   */
2da78092d   Keith Busch   block: Fix dev_t ...
36
  static DEFINE_SPINLOCK(ext_devt_lock);
bcce3de1b   Tejun Heo   block: implement ...
37
  static DEFINE_IDR(ext_devt_idr);
12c2bdb23   Derek Basehore   block: prevent ra...
38
39
  static void disk_check_events(struct disk_events *ev,
  			      unsigned int *clearing_ptr);
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
40
  static void disk_alloc_events(struct gendisk *disk);
77ea887e4   Tejun Heo   implement in-kern...
41
42
43
  static void disk_add_events(struct gendisk *disk);
  static void disk_del_events(struct gendisk *disk);
  static void disk_release_events(struct gendisk *disk);
e598a72fa   Balbir Singh   block/genhd: Noti...
44
45
46
47
  /*
   * Set disk capacity and notify if the size is not currently
   * zero and will not be set to zero
   */
7e890c37c   Christoph Hellwig   block: add a retu...
48
  bool set_capacity_revalidate_and_notify(struct gendisk *disk, sector_t size,
b8086d3f5   Christoph Hellwig   block: use revali...
49
  					bool update_bdev)
e598a72fa   Balbir Singh   block/genhd: Noti...
50
51
52
53
  {
  	sector_t capacity = get_capacity(disk);
  
  	set_capacity(disk, size);
b8086d3f5   Christoph Hellwig   block: use revali...
54
55
  	if (update_bdev)
  		revalidate_disk_size(disk, true);
e598a72fa   Balbir Singh   block/genhd: Noti...
56
57
58
59
60
  
  	if (capacity != size && capacity != 0 && size != 0) {
  		char *envp[] = { "RESIZE=1", NULL };
  
  		kobject_uevent_env(&disk_to_dev(disk)->kobj, KOBJ_CHANGE, envp);
7e890c37c   Christoph Hellwig   block: add a retu...
61
  		return true;
e598a72fa   Balbir Singh   block/genhd: Noti...
62
  	}
7e890c37c   Christoph Hellwig   block: add a retu...
63
64
  
  	return false;
e598a72fa   Balbir Singh   block/genhd: Noti...
65
66
67
  }
  
  EXPORT_SYMBOL_GPL(set_capacity_revalidate_and_notify);
5cbd28e3c   Christoph Hellwig   block: move disk_...
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
  /*
   * Format the device name of the indicated disk into the supplied buffer and
   * return a pointer to that same buffer for convenience.
   *
   * @hd:     disk whose ->disk_name supplies the base name
   * @partno: partition number; 0 selects the whole disk
   * @buf:    output buffer; at most BDEVNAME_SIZE bytes are written
   *
   * For partition 0 the base name is copied unchanged.  Otherwise the
   * partition number is appended, separated by a 'p' when the base name
   * already ends in a digit so that the two numbers do not run together.
   */
  char *disk_name(struct gendisk *hd, int partno, char *buf)
  {
  	size_t len = strlen(hd->disk_name);

  	if (!partno)
  		snprintf(buf, BDEVNAME_SIZE, "%s", hd->disk_name);
  	/* check len first: an empty name must not index disk_name[-1] */
  	else if (len && isdigit(hd->disk_name[len - 1]))
  		snprintf(buf, BDEVNAME_SIZE, "%sp%d", hd->disk_name, partno);
  	else
  		snprintf(buf, BDEVNAME_SIZE, "%s%d", hd->disk_name, partno);

  	return buf;
  }
  
  const char *bdevname(struct block_device *bdev, char *buf)
  {
8a63a86e1   Christoph Hellwig   block: use bd_par...
86
  	return disk_name(bdev->bd_disk, bdev->bd_partno, buf);
5cbd28e3c   Christoph Hellwig   block: move disk_...
87
88
  }
  EXPORT_SYMBOL(bdevname);
e598a72fa   Balbir Singh   block/genhd: Noti...
89

ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
  /*
   * Sum the per-CPU statistics of @part into @stat.  @stat is zeroed
   * first, then every possible CPU's nsecs/sectors/ios/merges counters
   * (per stat group) and io_ticks are added to it.
   */
  static void part_stat_read_all(struct hd_struct *part, struct disk_stats *stat)
  {
  	int cpu;
  	int grp;

  	memset(stat, 0, sizeof(struct disk_stats));

  	for_each_possible_cpu(cpu) {
  		struct disk_stats *pcpu = per_cpu_ptr(part->dkstats, cpu);

  		for (grp = 0; grp < NR_STAT_GROUPS; grp++) {
  			stat->nsecs[grp] += pcpu->nsecs[grp];
  			stat->sectors[grp] += pcpu->sectors[grp];
  			stat->ios[grp] += pcpu->ios[grp];
  			stat->merges[grp] += pcpu->merges[grp];
  		}

  		stat->io_ticks += pcpu->io_ticks;
  	}
  }
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
109

1f06959bd   Christoph Hellwig   block: remove the...
110
  static unsigned int part_in_flight(struct hd_struct *part)
f299b7c7a   Jens Axboe   blk-mq: provide i...
111
  {
b2f609e19   Christoph Hellwig   block: move the b...
112
  	unsigned int inflight = 0;
1226b8dd0   Mikulas Patocka   block: switch to ...
113
  	int cpu;
f299b7c7a   Jens Axboe   blk-mq: provide i...
114

1226b8dd0   Mikulas Patocka   block: switch to ...
115
  	for_each_possible_cpu(cpu) {
e016b7820   Mikulas Patocka   block: return jus...
116
117
  		inflight += part_stat_local_read_cpu(part, in_flight[0], cpu) +
  			    part_stat_local_read_cpu(part, in_flight[1], cpu);
1226b8dd0   Mikulas Patocka   block: switch to ...
118
  	}
e016b7820   Mikulas Patocka   block: return jus...
119
120
  	if ((int)inflight < 0)
  		inflight = 0;
1226b8dd0   Mikulas Patocka   block: switch to ...
121

e016b7820   Mikulas Patocka   block: return jus...
122
  	return inflight;
f299b7c7a   Jens Axboe   blk-mq: provide i...
123
  }
1f06959bd   Christoph Hellwig   block: remove the...
124
  static void part_in_flight_rw(struct hd_struct *part, unsigned int inflight[2])
bf0ddaba6   Omar Sandoval   blk-mq: fix sysfs...
125
  {
1226b8dd0   Mikulas Patocka   block: switch to ...
126
  	int cpu;
1226b8dd0   Mikulas Patocka   block: switch to ...
127
128
129
130
131
132
133
134
135
136
  	inflight[0] = 0;
  	inflight[1] = 0;
  	for_each_possible_cpu(cpu) {
  		inflight[0] += part_stat_local_read_cpu(part, in_flight[0], cpu);
  		inflight[1] += part_stat_local_read_cpu(part, in_flight[1], cpu);
  	}
  	if ((int)inflight[0] < 0)
  		inflight[0] = 0;
  	if ((int)inflight[1] < 0)
  		inflight[1] = 0;
bf0ddaba6   Omar Sandoval   blk-mq: fix sysfs...
137
  }
807d4af2f   Christoph Hellwig   block: add a __di...
138
139
140
141
142
143
144
145
  /*
   * Look up partition @partno in the partition table of @disk.  Both the
   * table and the slot are read with rcu_dereference().  Returns NULL
   * when @partno is outside [0, table length); no reference is taken here.
   */
  struct hd_struct *__disk_get_part(struct gendisk *disk, int partno)
  {
  	struct disk_part_tbl *tbl = rcu_dereference(disk->part_tbl);

  	if (likely(partno >= 0 && partno < tbl->len))
  		return rcu_dereference(tbl->part[partno]);

  	return NULL;
  }
e71bf0d0e   Tejun Heo   block: fix disk->...
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
  /**
   * disk_get_part - get partition
   * @disk: disk to look partition from
   * @partno: partition number
   *
   * Look for partition @partno from @disk.  If found, increment
   * reference count and return it.
   *
   * CONTEXT:
   * Don't care.
   *
   * RETURNS:
   * Pointer to the found partition on success, NULL if not found.
   */
  struct hd_struct *disk_get_part(struct gendisk *disk, int partno)
  {
807d4af2f   Christoph Hellwig   block: add a __di...
162
  	struct hd_struct *part;
540eed563   Tejun Heo   block: make parti...
163

e71bf0d0e   Tejun Heo   block: fix disk->...
164
  	rcu_read_lock();
807d4af2f   Christoph Hellwig   block: add a __di...
165
166
167
  	part = __disk_get_part(disk, partno);
  	if (part)
  		get_device(part_to_dev(part));
e71bf0d0e   Tejun Heo   block: fix disk->...
168
169
170
171
  	rcu_read_unlock();
  
  	return part;
  }
e71bf0d0e   Tejun Heo   block: fix disk->...
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
  
  /**
   * disk_part_iter_init - initialize partition iterator
   * @piter: iterator to initialize
   * @disk: disk to iterate over
   * @flags: DISK_PITER_* flags
   *
   * Initialize @piter so that it iterates over partitions of @disk.
   *
   * CONTEXT:
   * Don't care.
   */
  void disk_part_iter_init(struct disk_part_iter *piter, struct gendisk *disk,
  			  unsigned int flags)
  {
540eed563   Tejun Heo   block: make parti...
187
188
189
190
  	struct disk_part_tbl *ptbl;
  
  	rcu_read_lock();
  	ptbl = rcu_dereference(disk->part_tbl);
e71bf0d0e   Tejun Heo   block: fix disk->...
191
192
193
194
  	piter->disk = disk;
  	piter->part = NULL;
  
  	if (flags & DISK_PITER_REVERSE)
540eed563   Tejun Heo   block: make parti...
195
  		piter->idx = ptbl->len - 1;
71982a409   Tejun Heo   block: include em...
196
  	else if (flags & (DISK_PITER_INCL_PART0 | DISK_PITER_INCL_EMPTY_PART0))
e71bf0d0e   Tejun Heo   block: fix disk->...
197
  		piter->idx = 0;
b5d0b9df0   Tejun Heo   block: introduce ...
198
199
  	else
  		piter->idx = 1;
e71bf0d0e   Tejun Heo   block: fix disk->...
200
201
  
  	piter->flags = flags;
540eed563   Tejun Heo   block: make parti...
202
203
  
  	rcu_read_unlock();
e71bf0d0e   Tejun Heo   block: fix disk->...
204
205
206
207
208
209
210
211
212
213
214
215
216
217
  }
  EXPORT_SYMBOL_GPL(disk_part_iter_init);
  
  /**
   * disk_part_iter_next - proceed iterator to the next partition and return it
   * @piter: iterator of interest
   *
   * Proceed @piter to the next partition and return it.
   *
   * CONTEXT:
   * Don't care.
   */
  struct hd_struct *disk_part_iter_next(struct disk_part_iter *piter)
  {
540eed563   Tejun Heo   block: make parti...
218
  	struct disk_part_tbl *ptbl;
e71bf0d0e   Tejun Heo   block: fix disk->...
219
220
221
222
223
  	int inc, end;
  
  	/* put the last partition */
  	disk_put_part(piter->part);
  	piter->part = NULL;
540eed563   Tejun Heo   block: make parti...
224
  	/* get part_tbl */
e71bf0d0e   Tejun Heo   block: fix disk->...
225
  	rcu_read_lock();
540eed563   Tejun Heo   block: make parti...
226
  	ptbl = rcu_dereference(piter->disk->part_tbl);
e71bf0d0e   Tejun Heo   block: fix disk->...
227
228
229
230
  
  	/* determine iteration parameters */
  	if (piter->flags & DISK_PITER_REVERSE) {
  		inc = -1;
71982a409   Tejun Heo   block: include em...
231
232
  		if (piter->flags & (DISK_PITER_INCL_PART0 |
  				    DISK_PITER_INCL_EMPTY_PART0))
b5d0b9df0   Tejun Heo   block: introduce ...
233
234
235
  			end = -1;
  		else
  			end = 0;
e71bf0d0e   Tejun Heo   block: fix disk->...
236
237
  	} else {
  		inc = 1;
540eed563   Tejun Heo   block: make parti...
238
  		end = ptbl->len;
e71bf0d0e   Tejun Heo   block: fix disk->...
239
240
241
242
243
  	}
  
  	/* iterate to the next partition */
  	for (; piter->idx != end; piter->idx += inc) {
  		struct hd_struct *part;
540eed563   Tejun Heo   block: make parti...
244
  		part = rcu_dereference(ptbl->part[piter->idx]);
e71bf0d0e   Tejun Heo   block: fix disk->...
245
246
  		if (!part)
  			continue;
c83f6bf98   Vivek Goyal   block: add partit...
247
  		if (!part_nr_sects_read(part) &&
71982a409   Tejun Heo   block: include em...
248
249
250
  		    !(piter->flags & DISK_PITER_INCL_EMPTY) &&
  		    !(piter->flags & DISK_PITER_INCL_EMPTY_PART0 &&
  		      piter->idx == 0))
e71bf0d0e   Tejun Heo   block: fix disk->...
251
  			continue;
ed9e19823   Tejun Heo   block: implement ...
252
  		get_device(part_to_dev(part));
e71bf0d0e   Tejun Heo   block: fix disk->...
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
  		piter->part = part;
  		piter->idx += inc;
  		break;
  	}
  
  	rcu_read_unlock();
  
  	return piter->part;
  }
  EXPORT_SYMBOL_GPL(disk_part_iter_next);
  
  /**
   * disk_part_iter_exit - finish up partition iteration
   * @piter: iter of interest
   *
   * Called when iteration is over.  Puts the partition @piter currently
   * holds (via disk_put_part()) and clears the pointer.
   *
   * CONTEXT:
   * Don't care.
   */
  void disk_part_iter_exit(struct disk_part_iter *piter)
  {
  	struct hd_struct *held = piter->part;

  	disk_put_part(held);
  	piter->part = NULL;
  }
  EXPORT_SYMBOL_GPL(disk_part_iter_exit);
a6f23657d   Jens Axboe   block: add one-hi...
279
280
281
  /*
   * Return non-zero when @sector lies inside @part, i.e. in
   * [start_sect, start_sect + number of sectors), and 0 otherwise.
   */
  static inline int sector_in_part(struct hd_struct *part, sector_t sector)
  {
  	sector_t first = part->start_sect;

  	if (sector < first)
  		return 0;

  	return sector < first + part_nr_sects_read(part);
  }
e71bf0d0e   Tejun Heo   block: fix disk->...
284
285
286
287
288
289
290
291
292
  /**
   * disk_map_sector_rcu - map sector to partition
   * @disk: gendisk of interest
   * @sector: sector to map
   *
   * Find out which partition @sector maps to on @disk.  The cached
   * last_lookup entry is tried first, then partitions 1..len-1 are
   * scanned.  A matching partition is only returned after
   * hd_struct_try_get() succeeded on it, and a partition found by the
   * scan becomes the new last_lookup entry.
   *
   * CONTEXT:
   * The lookup runs inside its own rcu_read_lock()/rcu_read_unlock() pair.
   *
   * RETURNS:
   * Found partition on success, part0 is returned if no partition matches
   * or hd_struct_try_get() fails on the partition matched by the scan.
   */
  struct hd_struct *disk_map_sector_rcu(struct gendisk *disk, sector_t sector)
  {
  	struct disk_part_tbl *tbl;
  	struct hd_struct *part;
  	int idx;

  	rcu_read_lock();
  	tbl = rcu_dereference(disk->part_tbl);

  	/* fast path: the partition hit by the previous lookup */
  	part = rcu_dereference(tbl->last_lookup);
  	if (part && sector_in_part(part, sector) && hd_struct_try_get(part))
  		goto out_unlock;

  	for (idx = 1; idx < tbl->len; idx++) {
  		part = rcu_dereference(tbl->part[idx]);
  		if (!part || !sector_in_part(part, sector))
  			continue;

  		/*
  		 * only live partition can be cached for lookup,
  		 * so use-after-free on cached & deleting partition
  		 * can be avoided
  		 */
  		if (!hd_struct_try_get(part))
  			break;

  		rcu_assign_pointer(tbl->last_lookup, part);
  		goto out_unlock;
  	}

  	part = &disk->part0;
  out_unlock:
  	rcu_read_unlock();
  	return part;
  }
e71bf0d0e   Tejun Heo   block: fix disk->...
333

b53df2e74   Shin'ichiro Kawasaki   block: Fix partit...
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
  /**
   * disk_has_partitions
   * @disk: gendisk of interest
   *
   * Walk the partition table under rcu_read_lock() and report whether any
   * slot other than index 0 (the whole device) holds a partition.
   *
   * CONTEXT:
   * Don't care.
   *
   * RETURNS:
   * True if at least one partition slot beyond index 0 is populated.
   * Otherwise false.
   */
  bool disk_has_partitions(struct gendisk *disk)
  {
  	struct disk_part_tbl *tbl;
  	bool found = false;
  	int idx = 1;	/* index 0 is the whole device */

  	rcu_read_lock();
  	tbl = rcu_dereference(disk->part_tbl);

  	while (!found && idx < tbl->len) {
  		if (rcu_dereference(tbl->part[idx]))
  			found = true;
  		idx++;
  	}

  	rcu_read_unlock();

  	return found;
  }
  EXPORT_SYMBOL_GPL(disk_has_partitions);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
369
370
371
372
  /*
   * Can be deleted altogether. Later.
   *
   */
133d55cdb   Logan Gunthorpe   block: order /pro...
373
  #define BLKDEV_MAJOR_HASH_SIZE 255
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
374
375
376
377
  /* One registered block major: chain link, major number and driver name. */
  struct blk_major_name {
  	struct blk_major_name *next;
  	int major;
  	char name[16];
  };

  /* Table of chains, indexed by major_to_index(). */
  static struct blk_major_name *major_names[BLKDEV_MAJOR_HASH_SIZE];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
379
380
  
  /* index in the above - for now: assume no multimajor ranges */
e61eb2e93   Yang Zhang   fs/block: type si...
381
  static inline int major_to_index(unsigned major)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
382
  {
68eef3b47   Joe Korty   [PATCH] Simplify ...
383
  	return major % BLKDEV_MAJOR_HASH_SIZE;
7170be5f5   Neil Horman   [PATCH] convert /...
384
  }
68eef3b47   Joe Korty   [PATCH] Simplify ...
385
  #ifdef CONFIG_PROC_FS
  /*
   * Print every registered block major equal to @offset to @seqf, one
   * "<major> <name>" line per entry.  The chain for @offset is walked
   * with block_class_lock held.
   */
  void blkdev_show(struct seq_file *seqf, off_t offset)
  {
  	struct blk_major_name *dp;

  	mutex_lock(&block_class_lock);
  	for (dp = major_names[major_to_index(offset)]; dp; dp = dp->next)
  		if (dp->major == offset)
  			seq_printf(seqf, "%3d %s\n", dp->major, dp->name);
  	mutex_unlock(&block_class_lock);
  }
  #endif /* CONFIG_PROC_FS */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
398

9e8c0bccd   Márton Németh   block: add docume...
399
400
401
  /**
   * register_blkdev - register a new block device
   *
f33ff110e   Srivatsa S. Bhat   block, char_dev: ...
402
403
   * @major: the requested major device number [1..BLKDEV_MAJOR_MAX-1]. If
   *         @major = 0, try to allocate any unused major number.
9e8c0bccd   Márton Németh   block: add docume...
404
405
406
407
   * @name: the name of the new block device as a zero terminated string
   *
   * The @name must be unique within the system.
   *
0e056eb55   mchehab@s-opensource.com   kernel-api.rst: f...
408
409
   * The return value depends on the @major input parameter:
   *
f33ff110e   Srivatsa S. Bhat   block, char_dev: ...
410
411
   *  - if a major device number was requested in range [1..BLKDEV_MAJOR_MAX-1]
   *    then the function returns zero on success, or a negative error code
0e056eb55   mchehab@s-opensource.com   kernel-api.rst: f...
412
   *  - if any unused major number was requested with @major = 0 parameter
9e8c0bccd   Márton Németh   block: add docume...
413
   *    then the return value is the allocated major number in range
f33ff110e   Srivatsa S. Bhat   block, char_dev: ...
414
415
416
417
   *    [1..BLKDEV_MAJOR_MAX-1] or a negative error code otherwise
   *
   * See Documentation/admin-guide/devices.txt for the list of allocated
   * major numbers.
9e8c0bccd   Márton Németh   block: add docume...
418
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
419
420
421
422
  int register_blkdev(unsigned int major, const char *name)
  {
  	struct blk_major_name **n, *p;
  	int index, ret = 0;
edfaa7c36   Kay Sievers   Driver core: conv...
423
  	mutex_lock(&block_class_lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
424
425
426
427
428
429
430
431
432
  
  	/* temporary */
  	if (major == 0) {
  		for (index = ARRAY_SIZE(major_names)-1; index > 0; index--) {
  			if (major_names[index] == NULL)
  				break;
  		}
  
  		if (index == 0) {
dfc76d11d   Keyur Patel   block: Replace fu...
433
434
435
  			printk("%s: failed to get major for %s
  ",
  			       __func__, name);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
436
437
438
439
440
441
  			ret = -EBUSY;
  			goto out;
  		}
  		major = index;
  		ret = major;
  	}
133d55cdb   Logan Gunthorpe   block: order /pro...
442
  	if (major >= BLKDEV_MAJOR_MAX) {
dfc76d11d   Keyur Patel   block: Replace fu...
443
444
445
  		pr_err("%s: major requested (%u) is greater than the maximum (%u) for %s
  ",
  		       __func__, major, BLKDEV_MAJOR_MAX-1, name);
133d55cdb   Logan Gunthorpe   block: order /pro...
446
447
448
449
  
  		ret = -EINVAL;
  		goto out;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
  	p = kmalloc(sizeof(struct blk_major_name), GFP_KERNEL);
  	if (p == NULL) {
  		ret = -ENOMEM;
  		goto out;
  	}
  
  	p->major = major;
  	strlcpy(p->name, name, sizeof(p->name));
  	p->next = NULL;
  	index = major_to_index(major);
  
  	for (n = &major_names[index]; *n; n = &(*n)->next) {
  		if ((*n)->major == major)
  			break;
  	}
  	if (!*n)
  		*n = p;
  	else
  		ret = -EBUSY;
  
  	if (ret < 0) {
f33ff110e   Srivatsa S. Bhat   block, char_dev: ...
471
472
  		printk("register_blkdev: cannot get major %u for %s
  ",
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
473
474
475
476
  		       major, name);
  		kfree(p);
  	}
  out:
edfaa7c36   Kay Sievers   Driver core: conv...
477
  	mutex_unlock(&block_class_lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
478
479
480
481
  	return ret;
  }
  
  EXPORT_SYMBOL(register_blkdev);
f4480240f   Akinobu Mita   unregister_blkdev...
482
  void unregister_blkdev(unsigned int major, const char *name)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
483
484
485
486
  {
  	struct blk_major_name **n;
  	struct blk_major_name *p = NULL;
  	int index = major_to_index(major);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
487

edfaa7c36   Kay Sievers   Driver core: conv...
488
  	mutex_lock(&block_class_lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
489
490
491
  	for (n = &major_names[index]; *n; n = &(*n)->next)
  		if ((*n)->major == major)
  			break;
294462a5c   Akinobu Mita   unregister_blkdev...
492
493
  	if (!*n || strcmp((*n)->name, name)) {
  		WARN_ON(1);
294462a5c   Akinobu Mita   unregister_blkdev...
494
  	} else {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
495
496
497
  		p = *n;
  		*n = p->next;
  	}
edfaa7c36   Kay Sievers   Driver core: conv...
498
  	mutex_unlock(&block_class_lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
499
  	kfree(p);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
500
501
502
503
504
  }
  
  EXPORT_SYMBOL(unregister_blkdev);
  
  static struct kobj_map *bdev_map;
bcce3de1b   Tejun Heo   block: implement ...
505
  /**
   * blk_mangle_minor - scatter minor numbers apart
   * @minor: minor number to mangle
   *
   * When CONFIG_DEBUG_BLOCK_EXT_DEVT is enabled, mirror the low MINORBITS
   * bits of @minor: bit i trades places with bit MINORBITS - 1 - i.
   * Mangling twice gives the original value.  Without that option @minor
   * is returned unchanged.
   *
   * RETURNS:
   * Mangled value.
   *
   * CONTEXT:
   * Don't care.
   */
  static int blk_mangle_minor(int minor)
  {
  #ifdef CONFIG_DEBUG_BLOCK_EXT_DEVT
  	int bit = 0;

  	while (bit < MINORBITS / 2) {
  		int mirror = MINORBITS - 1 - bit;
  		int shift = mirror - bit;
  		int lo = minor & (1 << bit);
  		int hi = minor & (1 << mirror);

  		/* drop both bits, then put each back at the other's position */
  		minor ^= lo | hi;
  		minor |= (lo << shift) | (hi >> shift);
  		bit++;
  	}
  #endif
  	return minor;
  }
  
  /**
   * blk_alloc_devt - allocate a dev_t for a partition
   * @part: partition to allocate dev_t for
   * @devt: out parameter for resulting dev_t
   *
   * Allocate a dev_t for block device.  A partition number below the
   * disk's ->minors maps directly onto the disk's own major/minor range;
   * any other partition gets an index from ext_devt_idr and a dev_t under
   * BLOCK_EXT_MAJOR.
   *
   * RETURNS:
   * 0 on success, allocated dev_t is returned in *@devt.  -errno on
   * failure; an -ENOSPC from the IDR is reported as -EBUSY.
   *
   * CONTEXT:
   * Might sleep.
   */
  int blk_alloc_devt(struct hd_struct *part, dev_t *devt)
  {
  	struct gendisk *disk = part_to_disk(part);
  	int id;

  	/* in consecutive minor range? */
  	if (part->partno < disk->minors) {
  		*devt = MKDEV(disk->major, disk->first_minor + part->partno);
  		return 0;
  	}

  	/* allocate ext devt; preload so the locked allocation can be NOWAIT */
  	idr_preload(GFP_KERNEL);

  	spin_lock_bh(&ext_devt_lock);
  	id = idr_alloc(&ext_devt_idr, part, 0, NR_EXT_DEVT, GFP_NOWAIT);
  	spin_unlock_bh(&ext_devt_lock);

  	idr_preload_end();

  	if (id < 0) {
  		if (id == -ENOSPC)
  			return -EBUSY;
  		return id;
  	}

  	*devt = MKDEV(BLOCK_EXT_MAJOR, blk_mangle_minor(id));
  	return 0;
  }
  
  /**
   * blk_free_devt - free a dev_t
   * @devt: dev_t to free
   *
   * Free @devt which was allocated using blk_alloc_devt().  Only dev_t
   * values under BLOCK_EXT_MAJOR have an entry in ext_devt_idr to remove;
   * MKDEV(0, 0) and every other major are left alone.
   */
  void blk_free_devt(dev_t devt)
  {
  	if (devt == MKDEV(0, 0))
  		return;

  	if (MAJOR(devt) != BLOCK_EXT_MAJOR)
  		return;

  	spin_lock_bh(&ext_devt_lock);
  	idr_remove(&ext_devt_idr, blk_mangle_minor(MINOR(devt)));
  	spin_unlock_bh(&ext_devt_lock);
  }
33c826ef1   Bart Van Assche   block: Convert bl...
596
597
  /*
   * We invalidate devt by assigning NULL pointer for devt in idr.
   * Only dev_t values under BLOCK_EXT_MAJOR are affected.
   */
  void blk_invalidate_devt(dev_t devt)
  {
  	if (MAJOR(devt) != BLOCK_EXT_MAJOR)
  		return;

  	spin_lock_bh(&ext_devt_lock);
  	idr_replace(&ext_devt_idr, NULL, blk_mangle_minor(MINOR(devt)));
  	spin_unlock_bh(&ext_devt_lock);
  }
1f0142905   Tejun Heo   block: adjust for...
607
608
609
610
611
612
613
614
615
616
617
  /*
   * Render @devt in hex into @buf (at most BDEVT_SIZE bytes) and return
   * @buf.  When major and minor both fit in one byte the compact "MMmm"
   * form is used, left-justified in a 9-character field; otherwise the
   * wide "MMM:mmmmm" form is used.
   */
  static char *bdevt_str(dev_t devt, char *buf)
  {
  	char tbuf[BDEVT_SIZE];

  	if (MAJOR(devt) > 0xff || MINOR(devt) > 0xff) {
  		snprintf(buf, BDEVT_SIZE, "%03x:%05x", MAJOR(devt), MINOR(devt));
  		return buf;
  	}

  	snprintf(tbuf, BDEVT_SIZE, "%02x%02x", MAJOR(devt), MINOR(devt));
  	snprintf(buf, BDEVT_SIZE, "%-9s", tbuf);

  	return buf;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
618
619
620
621
622
  /*
   * Register device numbers dev..(dev+range-1)
   * range must be nonzero
   * The hash chain is sorted on range, so that subranges can override.
   */
edfaa7c36   Kay Sievers   Driver core: conv...
623
  void blk_register_region(dev_t devt, unsigned long range, struct module *module,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
624
625
626
  			 struct kobject *(*probe)(dev_t, int *, void *),
  			 int (*lock)(dev_t, void *), void *data)
  {
edfaa7c36   Kay Sievers   Driver core: conv...
627
  	kobj_map(bdev_map, devt, range, module, probe, lock, data);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
628
629
630
  }
  
  EXPORT_SYMBOL(blk_register_region);
edfaa7c36   Kay Sievers   Driver core: conv...
631
  /*
   * Drop the mapping for device numbers devt..(devt+range-1) from
   * bdev_map via kobj_unmap().
   */
  void blk_unregister_region(dev_t devt, unsigned long range)
  {
  	kobj_unmap(bdev_map, devt, range);
  }

  EXPORT_SYMBOL(blk_unregister_region);
cf771cb5a   Tejun Heo   block: make varia...
637
  /*
   * Probe callback: @data is the gendisk; return the kobject embedded in
   * its device.  @devt and @partno are not used.
   */
  static struct kobject *exact_match(dev_t devt, int *partno, void *data)
  {
  	struct gendisk *disk = data;
  	struct device *dev = disk_to_dev(disk);

  	return &dev->kobj;
  }
edfaa7c36   Kay Sievers   Driver core: conv...
643
  /*
   * Lock callback: @data is the gendisk.  Returns 0 when
   * get_disk_and_module() succeeds on it and -1 otherwise.  @devt is not
   * used.
   */
  static int exact_lock(dev_t devt, void *data)
  {
  	struct gendisk *disk = data;

  	return get_disk_and_module(disk) ? 0 : -1;
  }
9301fe734   Christoph Hellwig   block: cleanup pa...
650
651
652
653
654
655
656
657
658
659
660
661
  /*
   * Trigger a partition scan of @disk: flag the disk with
   * GD_NEED_PART_SCAN, then open the whole device read-only and close it
   * again.  Does nothing for a zero-capacity disk or when partition
   * scanning is disabled for it.
   */
  static void disk_scan_partitions(struct gendisk *disk)
  {
  	struct block_device *bdev;

  	if (!get_capacity(disk))
  		return;
  	if (!disk_part_scan_enabled(disk))
  		return;

  	set_bit(GD_NEED_PART_SCAN, &disk->state);

  	bdev = blkdev_get_by_dev(disk_devt(disk), FMODE_READ, NULL);
  	if (IS_ERR(bdev))
  		return;

  	blkdev_put(bdev, FMODE_READ);
  }
fef912bf8   Hannes Reinecke   block: genhd: add...
662
663
  static void register_disk(struct device *parent, struct gendisk *disk,
  			  const struct attribute_group **groups)
d2bf1b672   Tejun Heo   block: move regis...
664
665
  {
  	struct device *ddev = disk_to_dev(disk);
d2bf1b672   Tejun Heo   block: move regis...
666
667
668
  	struct disk_part_iter piter;
  	struct hd_struct *part;
  	int err;
e63a46bef   Dan Williams   block: introduce ...
669
  	ddev->parent = parent;
d2bf1b672   Tejun Heo   block: move regis...
670

ffc8b3086   Kees Cook   block: do not pas...
671
  	dev_set_name(ddev, "%s", disk->disk_name);
d2bf1b672   Tejun Heo   block: move regis...
672
673
674
  
  	/* delay uevents, until we scanned partition table */
  	dev_set_uevent_suppress(ddev, 1);
fef912bf8   Hannes Reinecke   block: genhd: add...
675
676
677
678
  	if (groups) {
  		WARN_ON(ddev->groups);
  		ddev->groups = groups;
  	}
d2bf1b672   Tejun Heo   block: move regis...
679
680
681
682
683
684
685
686
687
688
  	if (device_add(ddev))
  		return;
  	if (!sysfs_deprecated) {
  		err = sysfs_create_link(block_depr, &ddev->kobj,
  					kobject_name(&ddev->kobj));
  		if (err) {
  			device_del(ddev);
  			return;
  		}
  	}
25e823c8c   Ming Lei   block/genhd.c: ap...
689
690
691
692
693
694
695
  
  	/*
  	 * avoid probable deadlock caused by allocating memory with
  	 * GFP_KERNEL in runtime_resume callback of its all ancestor
  	 * devices
  	 */
  	pm_runtime_set_memalloc_noio(ddev, true);
d2bf1b672   Tejun Heo   block: move regis...
696
697
  	disk->part0.holder_dir = kobject_create_and_add("holders", &ddev->kobj);
  	disk->slave_dir = kobject_create_and_add("slaves", &ddev->kobj);
8ddcd6532   Christoph Hellwig   block: introduce ...
698
699
700
701
  	if (disk->flags & GENHD_FL_HIDDEN) {
  		dev_set_uevent_suppress(ddev, 0);
  		return;
  	}
9301fe734   Christoph Hellwig   block: cleanup pa...
702
  	disk_scan_partitions(disk);
d2bf1b672   Tejun Heo   block: move regis...
703

d2bf1b672   Tejun Heo   block: move regis...
704
705
706
707
708
709
710
711
712
  	/* announce disk after possible partitions are created */
  	dev_set_uevent_suppress(ddev, 0);
  	kobject_uevent(&ddev->kobj, KOBJ_ADD);
  
  	/* announce possible partitions */
  	disk_part_iter_init(&piter, disk, 0);
  	while ((part = disk_part_iter_next(&piter)))
  		kobject_uevent(&part_to_dev(part)->kobj, KOBJ_ADD);
  	disk_part_iter_exit(&piter);
8ddcd6532   Christoph Hellwig   block: introduce ...
713

4d7c1d3fd   zhengbin   block: fix NULL p...
714
715
716
717
718
719
  	if (disk->queue->backing_dev_info->dev) {
  		err = sysfs_create_link(&ddev->kobj,
  			  &disk->queue->backing_dev_info->dev->kobj,
  			  "bdi");
  		WARN_ON(err);
  	}
d2bf1b672   Tejun Heo   block: move regis...
720
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
721
  /**
fa70d2e2c   Mike Snitzer   block: allow gend...
722
   * __device_add_disk - add disk information to kernel list
e63a46bef   Dan Williams   block: introduce ...
723
   * @parent: parent device for the disk
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
724
   * @disk: per-device partitioning information
fef912bf8   Hannes Reinecke   block: genhd: add...
725
   * @groups: Additional per-device sysfs groups
fa70d2e2c   Mike Snitzer   block: allow gend...
726
   * @register_queue: register the queue if set to true
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
727
728
729
   *
   * This function registers the partitioning information in @disk
   * with the kernel.
3e1a7ff8a   Tejun Heo   block: allow disk...
730
731
   *
   * FIXME: error handling
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
732
   */
fa70d2e2c   Mike Snitzer   block: allow gend...
733
  static void __device_add_disk(struct device *parent, struct gendisk *disk,
fef912bf8   Hannes Reinecke   block: genhd: add...
734
  			      const struct attribute_group **groups,
fa70d2e2c   Mike Snitzer   block: allow gend...
735
  			      bool register_queue)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
736
  {
3e1a7ff8a   Tejun Heo   block: allow disk...
737
  	dev_t devt;
6ffeea77f   Greg Kroah-Hartman   block: fix compil...
738
  	int retval;
cf0ca9fe5   Peter Zijlstra   mm: bdi: export B...
739

737eb78e8   Damien Le Moal   block: Delay defa...
740
741
742
743
744
745
746
747
  	/*
  	 * The disk queue should now be all set with enough information about
  	 * the device for the elevator code to pick an adequate default
  	 * elevator if one is needed, that is, for devices requesting queue
  	 * registration.
  	 */
  	if (register_queue)
  		elevator_init_mq(disk->queue);
3e1a7ff8a   Tejun Heo   block: allow disk...
748
749
750
751
752
  	/* minors == 0 indicates to use ext devt from part0 and should
  	 * be accompanied with EXT_DEVT flag.  Make sure all
  	 * parameters make sense.
  	 */
  	WARN_ON(disk->minors && !(disk->major || disk->first_minor));
8ddcd6532   Christoph Hellwig   block: introduce ...
753
754
  	WARN_ON(!disk->minors &&
  		!(disk->flags & (GENHD_FL_EXT_DEVT | GENHD_FL_HIDDEN)));
3e1a7ff8a   Tejun Heo   block: allow disk...
755

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
756
  	disk->flags |= GENHD_FL_UP;
3e1a7ff8a   Tejun Heo   block: allow disk...
757
758
759
760
761
762
  
  	retval = blk_alloc_devt(&disk->part0, &devt);
  	if (retval) {
  		WARN_ON(1);
  		return;
  	}
3e1a7ff8a   Tejun Heo   block: allow disk...
763
764
  	disk->major = MAJOR(devt);
  	disk->first_minor = MINOR(devt);
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
765
  	disk_alloc_events(disk);
8ddcd6532   Christoph Hellwig   block: introduce ...
766
767
768
769
770
771
772
773
  	if (disk->flags & GENHD_FL_HIDDEN) {
  		/*
  		 * Don't let hidden disks show up in /proc/partitions,
  		 * and don't bother scanning for partitions either.
  		 */
  		disk->flags |= GENHD_FL_SUPPRESS_PARTITION_INFO;
  		disk->flags |= GENHD_FL_NO_PART_SCAN;
  	} else {
3c5d202b5   Christoph Hellwig   bdi: remove bdi_r...
774
775
  		struct backing_dev_info *bdi = disk->queue->backing_dev_info;
  		struct device *dev = disk_to_dev(disk);
3a92168bc   weiping zhang   block: add WARN_O...
776
  		int ret;
8ddcd6532   Christoph Hellwig   block: introduce ...
777
  		/* Register BDI before referencing it from bdev */
3c5d202b5   Christoph Hellwig   bdi: remove bdi_r...
778
779
  		dev->devt = devt;
  		ret = bdi_register(bdi, "%u:%u", MAJOR(devt), MINOR(devt));
3a92168bc   weiping zhang   block: add WARN_O...
780
  		WARN_ON(ret);
3c5d202b5   Christoph Hellwig   bdi: remove bdi_r...
781
  		bdi_set_owner(bdi, dev);
8ddcd6532   Christoph Hellwig   block: introduce ...
782
783
784
  		blk_register_region(disk_devt(disk), disk->minors, NULL,
  				    exact_match, exact_lock, disk);
  	}
fef912bf8   Hannes Reinecke   block: genhd: add...
785
  	register_disk(parent, disk, groups);
fa70d2e2c   Mike Snitzer   block: allow gend...
786
787
  	if (register_queue)
  		blk_register_queue(disk);
cf0ca9fe5   Peter Zijlstra   mm: bdi: export B...
788

523e1d399   Tejun Heo   block: make gendi...
789
790
791
792
  	/*
  	 * Take an extra ref on queue which will be put on disk_release()
  	 * so that it sticks around as long as @disk is there.
  	 */
09ac46c42   Tejun Heo   block: misc updat...
793
  	WARN_ON_ONCE(!blk_get_queue(disk->queue));
523e1d399   Tejun Heo   block: make gendi...
794

77ea887e4   Tejun Heo   implement in-kern...
795
  	disk_add_events(disk);
25520d55c   Martin K. Petersen   block: Inline blk...
796
  	blk_integrity_add(disk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
797
  }
fa70d2e2c   Mike Snitzer   block: allow gend...
798

fef912bf8   Hannes Reinecke   block: genhd: add...
799
800
  void device_add_disk(struct device *parent, struct gendisk *disk,
  		     const struct attribute_group **groups)
fa70d2e2c   Mike Snitzer   block: allow gend...
801
  {
fef912bf8   Hannes Reinecke   block: genhd: add...
802
  	__device_add_disk(parent, disk, groups, true);
fa70d2e2c   Mike Snitzer   block: allow gend...
803
  }
e63a46bef   Dan Williams   block: introduce ...
804
  EXPORT_SYMBOL(device_add_disk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
805

fa70d2e2c   Mike Snitzer   block: allow gend...
806
807
  void device_add_disk_no_queue_reg(struct device *parent, struct gendisk *disk)
  {
fef912bf8   Hannes Reinecke   block: genhd: add...
808
  	__device_add_disk(parent, disk, NULL, false);
fa70d2e2c   Mike Snitzer   block: allow gend...
809
810
  }
  EXPORT_SYMBOL(device_add_disk_no_queue_reg);
02d33b677   Christoph Hellwig   block: mark inval...
811
812
813
814
815
816
817
818
819
820
  static void invalidate_partition(struct gendisk *disk, int partno)
  {
  	struct block_device *bdev;
  
  	bdev = bdget_disk(disk, partno);
  	if (!bdev)
  		return;
  
  	fsync_bdev(bdev);
  	__invalidate_device(bdev, true);
9bc5c397d   Christoph Hellwig   block: fold bdev_...
821
822
823
824
825
826
  
  	/*
  	 * Unhash the bdev inode for this device so that it gets evicted as soon
  	 * as last inode reference is dropped.
  	 */
  	remove_inode_hash(bdev->bd_inode);
02d33b677   Christoph Hellwig   block: mark inval...
827
828
  	bdput(bdev);
  }
b5bd357cf   Luis Chamberlain   block: add docs f...
829
830
831
832
833
834
835
836
837
838
839
840
841
  /**
   * del_gendisk - remove the gendisk
   * @disk: the struct gendisk to remove
   *
   * Removes the gendisk and all its associated resources. This deletes the
   * partitions associated with the gendisk, and unregisters the associated
   * request_queue.
   *
   * This is the counter to the respective __device_add_disk() call.
   *
   * The final removal of the struct gendisk happens when its refcount reaches 0
   * with put_disk(), which should be called after del_gendisk(), if
   * __device_add_disk() was used.
e8c7d14ac   Luis Chamberlain   block: revert bac...
842
843
844
845
846
   *
   * Drivers exist which depend on the release of the gendisk to be synchronous,
   * it should not be deferred.
   *
   * Context: can sleep
b5bd357cf   Luis Chamberlain   block: add docs f...
847
   */
d2bf1b672   Tejun Heo   block: move regis...
848
  void del_gendisk(struct gendisk *disk)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
849
  {
d2bf1b672   Tejun Heo   block: move regis...
850
851
  	struct disk_part_iter piter;
  	struct hd_struct *part;
e8c7d14ac   Luis Chamberlain   block: revert bac...
852
  	might_sleep();
25520d55c   Martin K. Petersen   block: Inline blk...
853
  	blk_integrity_del(disk);
77ea887e4   Tejun Heo   implement in-kern...
854
  	disk_del_events(disk);
56c0908c8   Jan Kara   genhd: Fix BUG in...
855
856
857
858
859
  	/*
  	 * Block lookups of the disk until all bdevs are unhashed and the
  	 * disk is marked as dead (GENHD_FL_UP cleared).
  	 */
  	down_write(&disk->lookup_sem);
d2bf1b672   Tejun Heo   block: move regis...
860
861
862
863
864
  	/* invalidate stuff */
  	disk_part_iter_init(&piter, disk,
  			     DISK_PITER_INCL_EMPTY | DISK_PITER_REVERSE);
  	while ((part = disk_part_iter_next(&piter))) {
  		invalidate_partition(disk, part->partno);
8328eb283   Christoph Hellwig   block: remove the...
865
  		delete_partition(part);
d2bf1b672   Tejun Heo   block: move regis...
866
867
868
869
  	}
  	disk_part_iter_exit(&piter);
  
  	invalidate_partition(disk, 0);
d2bf1b672   Tejun Heo   block: move regis...
870
871
  	set_capacity(disk, 0);
  	disk->flags &= ~GENHD_FL_UP;
56c0908c8   Jan Kara   genhd: Fix BUG in...
872
  	up_write(&disk->lookup_sem);
d2bf1b672   Tejun Heo   block: move regis...
873

8ddcd6532   Christoph Hellwig   block: introduce ...
874
875
  	if (!(disk->flags & GENHD_FL_HIDDEN))
  		sysfs_remove_link(&disk_to_dev(disk)->kobj, "bdi");
90f16fddc   Jan Kara   block: Make del_g...
876
877
878
879
880
  	if (disk->queue) {
  		/*
  		 * Unregister bdi before releasing device numbers (as they can
  		 * get reused and we'd get clashes in sysfs).
  		 */
bc8d062c3   Mike Snitzer   block: only bdi_u...
881
882
  		if (!(disk->flags & GENHD_FL_HIDDEN))
  			bdi_unregister(disk->queue->backing_dev_info);
90f16fddc   Jan Kara   block: Make del_g...
883
884
885
886
  		blk_unregister_queue(disk);
  	} else {
  		WARN_ON(1);
  	}
d2bf1b672   Tejun Heo   block: move regis...
887

17eac0996   Hannes Reinecke   block: create 'sl...
888
  	if (!(disk->flags & GENHD_FL_HIDDEN))
8ddcd6532   Christoph Hellwig   block: introduce ...
889
  		blk_unregister_region(disk_devt(disk), disk->minors);
6fcc44d1d   Yufen Yu   block: fix use-af...
890
891
892
893
894
895
896
  	/*
  	 * Remove gendisk pointer from idr so that it cannot be looked up
  	 * while RCU period before freeing gendisk is running to prevent
  	 * use-after-free issues. Note that the device number stays
  	 * "in-use" until we really free the gendisk.
  	 */
  	blk_invalidate_devt(disk_devt(disk));
d2bf1b672   Tejun Heo   block: move regis...
897
898
899
  
  	kobject_put(disk->part0.holder_dir);
  	kobject_put(disk->slave_dir);
d2bf1b672   Tejun Heo   block: move regis...
900
901
902
  
  	part_stat_set_all(&disk->part0, 0);
  	disk->part0.stamp = 0;
d2bf1b672   Tejun Heo   block: move regis...
903
904
  	if (!sysfs_deprecated)
  		sysfs_remove_link(block_depr, dev_name(disk_to_dev(disk)));
25e823c8c   Ming Lei   block/genhd.c: ap...
905
  	pm_runtime_set_memalloc_noio(disk_to_dev(disk), false);
d2bf1b672   Tejun Heo   block: move regis...
906
  	device_del(disk_to_dev(disk));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
907
  }
d2bf1b672   Tejun Heo   block: move regis...
908
  EXPORT_SYMBOL(del_gendisk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
909

99e6608c9   Vishal Verma   block: Add badblo...
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
  /* sysfs access to bad-blocks list. */
  
  /*
   * Show callback: writes the disk's bad-block list into @page through
   * badblocks_show().  When the disk has no bad-block table (disk->bb is
   * NULL) only a newline is written.
   *
   * Returns the value of sprintf() or badblocks_show() respectively.
   */
  static ssize_t disk_badblocks_show(struct device *dev,
  					struct device_attribute *attr,
  					char *page)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	if (!disk->bb)
  		return sprintf(page, "\n");
  
  	return badblocks_show(disk->bb, page, 0);
  }
  
  /*
   * Store callback: hands the @len bytes in @page to badblocks_store() for
   * the disk's bad-block table.
   *
   * Returns -ENXIO when the disk has no table (disk->bb is NULL), otherwise
   * whatever badblocks_store() returns.
   */
  static ssize_t disk_badblocks_store(struct device *dev,
  					struct device_attribute *attr,
  					const char *page, size_t len)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	if (disk->bb)
  		return badblocks_store(disk->bb, page, len, 0);
  
  	return -ENXIO;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
935
936
  /**
   * get_gendisk - get partitioning information for a given device
710027a48   Randy Dunlap   Add some block/ s...
937
   * @devt: device to get partitioning information for
496aa8a98   Randy Dunlap   block: fix curren...
938
   * @partno: returned partition index
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
939
940
   *
   * This function gets the structure containing partitioning
710027a48   Randy Dunlap   Add some block/ s...
941
   * information for the given device @devt.
763b58923   Luis Chamberlain   block: clarify co...
942
943
   *
   * Context: can sleep
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
944
   */
cf771cb5a   Tejun Heo   block: make varia...
945
  struct gendisk *get_gendisk(dev_t devt, int *partno)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
946
  {
bcce3de1b   Tejun Heo   block: implement ...
947
  	struct gendisk *disk = NULL;
763b58923   Luis Chamberlain   block: clarify co...
948
  	might_sleep();
bcce3de1b   Tejun Heo   block: implement ...
949
950
951
952
953
954
955
956
  	if (MAJOR(devt) != BLOCK_EXT_MAJOR) {
  		struct kobject *kobj;
  
  		kobj = kobj_lookup(bdev_map, devt, partno);
  		if (kobj)
  			disk = dev_to_disk(kobj_to_dev(kobj));
  	} else {
  		struct hd_struct *part;
4d66e5e9b   Dan Williams   block: fix ext_de...
957
  		spin_lock_bh(&ext_devt_lock);
870d66561   Tejun Heo   block: implement ...
958
  		part = idr_find(&ext_devt_idr, blk_mangle_minor(MINOR(devt)));
3079c22ea   Jan Kara   genhd: Rename get...
959
  		if (part && get_disk_and_module(part_to_disk(part))) {
bcce3de1b   Tejun Heo   block: implement ...
960
961
962
  			*partno = part->partno;
  			disk = part_to_disk(part);
  		}
4d66e5e9b   Dan Williams   block: fix ext_de...
963
  		spin_unlock_bh(&ext_devt_lock);
bcce3de1b   Tejun Heo   block: implement ...
964
  	}
edfaa7c36   Kay Sievers   Driver core: conv...
965

56c0908c8   Jan Kara   genhd: Fix BUG in...
966
967
968
969
970
971
972
973
974
975
976
  	if (!disk)
  		return NULL;
  
  	/*
  	 * Synchronize with del_gendisk() to not return disk that is being
  	 * destroyed.
  	 */
  	down_read(&disk->lookup_sem);
  	if (unlikely((disk->flags & GENHD_FL_HIDDEN) ||
  		     !(disk->flags & GENHD_FL_UP))) {
  		up_read(&disk->lookup_sem);
9df6c2991   Jan Kara   genhd: Add helper...
977
  		put_disk_and_module(disk);
8ddcd6532   Christoph Hellwig   block: introduce ...
978
  		disk = NULL;
56c0908c8   Jan Kara   genhd: Fix BUG in...
979
980
  	} else {
  		up_read(&disk->lookup_sem);
8ddcd6532   Christoph Hellwig   block: introduce ...
981
  	}
bcce3de1b   Tejun Heo   block: implement ...
982
  	return disk;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
983
  }
f331c0296   Tejun Heo   block: don't depe...
984
985
986
987
988
989
990
991
992
993
994
995
996
  /**
   * bdget_disk - do bdget() by gendisk and partition number
   * @disk: gendisk of interest
   * @partno: partition number
   *
   * Find partition @partno from @disk, do bdget() on it.
   *
   * CONTEXT:
   * Don't care.
   *
   * RETURNS:
   * Resulting block_device on success, NULL on failure.
   */
aeb3d3a81   Harvey Harrison   block: kmalloc ar...
997
  struct block_device *bdget_disk(struct gendisk *disk, int partno)
f331c0296   Tejun Heo   block: don't depe...
998
  {
548b10eb2   Tejun Heo   block: move __dev...
999
1000
  	struct hd_struct *part;
  	struct block_device *bdev = NULL;
f331c0296   Tejun Heo   block: don't depe...
1001

548b10eb2   Tejun Heo   block: move __dev...
1002
  	part = disk_get_part(disk, partno);
2bbedcb4c   Tejun Heo   block: don't test...
1003
  	if (part)
10ed16662   Christoph Hellwig   block: add a bdge...
1004
  		bdev = bdget_part(part);
548b10eb2   Tejun Heo   block: move __dev...
1005
  	disk_put_part(part);
f331c0296   Tejun Heo   block: don't depe...
1006

548b10eb2   Tejun Heo   block: move __dev...
1007
  	return bdev;
f331c0296   Tejun Heo   block: don't depe...
1008
1009
  }
  EXPORT_SYMBOL(bdget_disk);
dd2a345f8   Dave Gilbert   Display all possi...
1010
  /*
   * print a full list of all partitions - intended for places where the root
   * filesystem can't be mounted and thus to give the victim some idea of what
   * went wrong
   *
   * Walks every disk_type device of block_class.  For each disk that has a
   * non-zero capacity and is not flagged GENHD_FL_SUPPRESS_PARTITION_INFO it
   * prints one line for the whole disk (part0) followed by one indented line
   * per partition.  The part0 line is terminated with the name of the parent
   * device's driver, or " (driver?)" when there is none.
   */
  void __init printk_all_partitions(void)
  {
  	struct class_dev_iter iter;
  	struct device *dev;
  
  	class_dev_iter_init(&iter, &block_class, NULL, &disk_type);
  	while ((dev = class_dev_iter_next(&iter))) {
  		struct gendisk *disk = dev_to_disk(dev);
  		struct disk_part_iter piter;
  		struct hd_struct *part;
  		char name_buf[BDEVNAME_SIZE];
  		char devt_buf[BDEVT_SIZE];
  
  		/*
  		 * Don't show empty devices or things that have been
  		 * suppressed
  		 */
  		if (get_capacity(disk) == 0 ||
  		    (disk->flags & GENHD_FL_SUPPRESS_PARTITION_INFO))
  			continue;
  
  		/*
  		 * Note, unlike /proc/partitions, I am showing the
  		 * numbers in hex - the same format as the root=
  		 * option takes.
  		 */
  		disk_part_iter_init(&piter, disk, DISK_PITER_INCL_PART0);
  		while ((part = disk_part_iter_next(&piter))) {
  			bool is_part0 = part == &disk->part0;
  
  			/* Size is the sector count halved (>> 1). */
  			printk("%s%s %10llu %s %s", is_part0 ? "" : "  ",
  			       bdevt_str(part_devt(part), devt_buf),
  			       (unsigned long long)part_nr_sects_read(part) >> 1
  			       , disk_name(disk, part->partno, name_buf),
  			       part->info ? part->info->uuid : "");
  			if (is_part0) {
  				if (dev->parent && dev->parent->driver)
  					printk(" driver: %s\n",
  					      dev->parent->driver->name);
  				else
  					printk(" (driver?)\n");
  			} else
  				printk("\n");
  		}
  		disk_part_iter_exit(&piter);
  	}
  	class_dev_iter_exit(&iter);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1066
1067
  #ifdef CONFIG_PROC_FS
  /* iterator */
def4e38dd   Tejun Heo   block: use class_...
1068
  /*
   * seq_file start: allocate a class device iterator over the disk_type
   * devices of block_class, store it in seqf->private and advance it to the
   * entry at offset *pos.
   *
   * Returns the gendisk at that position, NULL when the list is exhausted
   * first, or ERR_PTR(-ENOMEM) when the iterator cannot be allocated.  The
   * iterator is left in seqf->private in every case but the allocation
   * failure; disk_seqf_stop() releases it.
   */
  static void *disk_seqf_start(struct seq_file *seqf, loff_t *pos)
  {
  	struct class_dev_iter *iter;
  	struct device *dev;
  	loff_t remaining = *pos;
  
  	iter = kmalloc(sizeof(*iter), GFP_KERNEL);
  	if (!iter)
  		return ERR_PTR(-ENOMEM);
  
  	seqf->private = iter;
  	class_dev_iter_init(iter, &block_class, NULL, &disk_type);
  
  	/* Fetch *pos + 1 devices; the last one fetched is the result. */
  	for (;;) {
  		dev = class_dev_iter_next(iter);
  		if (!dev)
  			return NULL;
  		if (!remaining--)
  			break;
  	}
  
  	return dev_to_disk(dev);
  }
def4e38dd   Tejun Heo   block: use class_...
1088
  /*
   * seq_file next: bump *pos and return the gendisk for the next device of
   * the iterator kept in seqf->private, or NULL when there is none.
   */
  static void *disk_seqf_next(struct seq_file *seqf, void *v, loff_t *pos)
  {
  	struct device *dev;
  
  	(*pos)++;
  	dev = class_dev_iter_next(seqf->private);
  
  	return dev ? dev_to_disk(dev) : NULL;
  }
def4e38dd   Tejun Heo   block: use class_...
1099
  static void disk_seqf_stop(struct seq_file *seqf, void *v)
27f302519   Greg Kroah-Hartman   block: make /proc...
1100
  {
def4e38dd   Tejun Heo   block: use class_...
1101
  	struct class_dev_iter *iter = seqf->private;
27f302519   Greg Kroah-Hartman   block: make /proc...
1102

def4e38dd   Tejun Heo   block: use class_...
1103
1104
1105
1106
  	/* stop is called even after start failed :-( */
  	if (iter) {
  		class_dev_iter_exit(iter);
  		kfree(iter);
77da16053   Vegard Nossum   block: fix use-af...
1107
  		seqf->private = NULL;
5c0ef6d02   Kay Sievers   block: drop refer...
1108
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1109
  }
def4e38dd   Tejun Heo   block: use class_...
1110
  /*
   * seq_file start for the partitions listing: same as disk_seqf_start(), and
   * additionally emits the column header when iteration begins at offset 0
   * and a valid (non-NULL, non-error) entry was found.
   */
  static void *show_partition_start(struct seq_file *seqf, loff_t *pos)
  {
  	void *p;
  
  	p = disk_seqf_start(seqf, pos);
  	if (!IS_ERR_OR_NULL(p) && !*pos)
  		seq_puts(seqf, "major minor  #blocks  name\n\n");
  	return p;
  }
cf771cb5a   Tejun Heo   block: make varia...
1121
  static int show_partition(struct seq_file *seqf, void *v)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1122
1123
  {
  	struct gendisk *sgp = v;
e71bf0d0e   Tejun Heo   block: fix disk->...
1124
1125
  	struct disk_part_iter piter;
  	struct hd_struct *part;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1126
  	char buf[BDEVNAME_SIZE];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1127
  	/* Don't show non-partitionable removeable devices or empty devices */
d27769ec3   Tejun Heo   block: add GENHD_...
1128
  	if (!get_capacity(sgp) || (!disk_max_parts(sgp) &&
f331c0296   Tejun Heo   block: don't depe...
1129
  				   (sgp->flags & GENHD_FL_REMOVABLE)))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1130
1131
1132
1133
1134
  		return 0;
  	if (sgp->flags & GENHD_FL_SUPPRESS_PARTITION_INFO)
  		return 0;
  
  	/* show the full disk and all non-0 size partitions of it */
074a7aca7   Tejun Heo   block: move stats...
1135
  	disk_part_iter_init(&piter, sgp, DISK_PITER_INCL_PART0);
e71bf0d0e   Tejun Heo   block: fix disk->...
1136
  	while ((part = disk_part_iter_next(&piter)))
1f0142905   Tejun Heo   block: adjust for...
1137
1138
  		seq_printf(seqf, "%4d  %7d %10llu %s
  ",
f331c0296   Tejun Heo   block: don't depe...
1139
  			   MAJOR(part_devt(part)), MINOR(part_devt(part)),
c83f6bf98   Vivek Goyal   block: add partit...
1140
  			   (unsigned long long)part_nr_sects_read(part) >> 1,
f331c0296   Tejun Heo   block: don't depe...
1141
  			   disk_name(sgp, part->partno, buf));
e71bf0d0e   Tejun Heo   block: fix disk->...
1142
  	disk_part_iter_exit(&piter);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1143
1144
1145
  
  	return 0;
  }
f500975a3   Alexey Dobriyan   proc: move rest o...
1146
  static const struct seq_operations partitions_op = {
def4e38dd   Tejun Heo   block: use class_...
1147
1148
1149
  	.start	= show_partition_start,
  	.next	= disk_seqf_next,
  	.stop	= disk_seqf_stop,
edfaa7c36   Kay Sievers   Driver core: conv...
1150
  	.show	= show_partition
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1151
1152
  };
  #endif
cf771cb5a   Tejun Heo   block: make varia...
1153
  /*
   * Probe callback given to kobj_map_init(): asks for the module alias
   * "block-major-<major>-<minor>" and, when that request returns a positive
   * value, for the shorter "block-major-<major>" alias as well.
   *
   * Always returns NULL; @partno and @data are not used.
   */
  static struct kobject *base_probe(dev_t devt, int *partno, void *data)
  {
  	int rc = request_module("block-major-%d-%d", MAJOR(devt), MINOR(devt));
  
  	/* Make old-style 2.4 aliases work */
  	if (rc > 0)
  		request_module("block-major-%d", MAJOR(devt));
  
  	return NULL;
  }
  
  /*
   * Subsystem init: register block_class, set up bdev_map, run
   * blk_dev_init(), register the BLOCK_EXT_MAJOR major as "blkext" and,
   * unless sysfs_deprecated is set, create the top-level "block" kobject.
   *
   * Returns the class_register() error if that fails, 0 otherwise.
   */
  static int __init genhd_device_init(void)
  {
  	int ret;
  
  	block_class.dev_kobj = sysfs_dev_block_kobj;
  
  	ret = class_register(&block_class);
  	if (unlikely(ret))
  		return ret;
  
  	bdev_map = kobj_map_init(base_probe, &block_class_lock);
  	blk_dev_init();
  
  	register_blkdev(BLOCK_EXT_MAJOR, "blkext");
  
  	/* create top-level block dir */
  	if (!sysfs_deprecated)
  		block_depr = kobject_create_and_add("block", NULL);
  
  	return 0;
  }
  
  subsys_initcall(genhd_device_init);
edfaa7c36   Kay Sievers   Driver core: conv...
1180
1181
  static ssize_t disk_range_show(struct device *dev,
  			       struct device_attribute *attr, char *buf)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1182
  {
edfaa7c36   Kay Sievers   Driver core: conv...
1183
  	struct gendisk *disk = dev_to_disk(dev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1184

edfaa7c36   Kay Sievers   Driver core: conv...
1185
1186
  	return sprintf(buf, "%d
  ", disk->minors);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1187
  }
1f0142905   Tejun Heo   block: adjust for...
1188
1189
1190
1191
  /* sysfs show: prints disk_max_parts() of the disk and a newline. */
  static ssize_t disk_ext_range_show(struct device *dev,
  				   struct device_attribute *attr, char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	return sprintf(buf, "%d\n", disk_max_parts(disk));
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1195
1196
  static ssize_t disk_removable_show(struct device *dev,
  				   struct device_attribute *attr, char *buf)
a7fd67062   Kay Sievers   [PATCH] add sysfs...
1197
  {
edfaa7c36   Kay Sievers   Driver core: conv...
1198
  	struct gendisk *disk = dev_to_disk(dev);
a7fd67062   Kay Sievers   [PATCH] add sysfs...
1199

edfaa7c36   Kay Sievers   Driver core: conv...
1200
1201
1202
  	return sprintf(buf, "%d
  ",
  		       (disk->flags & GENHD_FL_REMOVABLE ? 1 : 0));
a7fd67062   Kay Sievers   [PATCH] add sysfs...
1203
  }
8ddcd6532   Christoph Hellwig   block: introduce ...
1204
1205
1206
1207
1208
1209
1210
1211
1212
  /* sysfs show: prints 1 when GENHD_FL_HIDDEN is set in disk->flags, else 0. */
  static ssize_t disk_hidden_show(struct device *dev,
  				   struct device_attribute *attr, char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	return sprintf(buf, "%d\n",
  		       (disk->flags & GENHD_FL_HIDDEN ? 1 : 0));
  }
1c9ce5276   Kay Sievers   block: export "ro...
1213
1214
1215
1216
  /* sysfs show: prints 1 when get_disk_ro() is non-zero for the disk, else 0. */
  static ssize_t disk_ro_show(struct device *dev,
  				   struct device_attribute *attr, char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	return sprintf(buf, "%d\n", get_disk_ro(disk) ? 1 : 0);
  }
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
  /* sysfs show: prints the partition's sector count (part_nr_sects_read()). */
  ssize_t part_size_show(struct device *dev,
  		       struct device_attribute *attr, char *buf)
  {
  	struct hd_struct *p = dev_to_part(dev);
  
  	return sprintf(buf, "%llu\n",
  		(unsigned long long)part_nr_sects_read(p));
  }
  
  ssize_t part_stat_show(struct device *dev,
  		       struct device_attribute *attr, char *buf)
  {
  	struct hd_struct *p = dev_to_part(dev);
  	struct request_queue *q = part_to_disk(p)->queue;
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1235
  	struct disk_stats stat;
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1236
  	unsigned int inflight;
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1237
  	part_stat_read_all(p, &stat);
b2f609e19   Christoph Hellwig   block: move the b...
1238
1239
1240
  	if (queue_is_mq(q))
  		inflight = blk_mq_in_flight(q, p);
  	else
1f06959bd   Christoph Hellwig   block: remove the...
1241
  		inflight = part_in_flight(p);
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1242

3ad5cee5c   Christoph Hellwig   block: move sysfs...
1243
1244
1245
1246
1247
1248
1249
1250
  	return sprintf(buf,
  		"%8lu %8lu %8llu %8u "
  		"%8lu %8lu %8llu %8u "
  		"%8u %8u %8u "
  		"%8lu %8lu %8llu %8u "
  		"%8lu %8u"
  		"
  ",
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1251
1252
1253
1254
1255
1256
1257
1258
  		stat.ios[STAT_READ],
  		stat.merges[STAT_READ],
  		(unsigned long long)stat.sectors[STAT_READ],
  		(unsigned int)div_u64(stat.nsecs[STAT_READ], NSEC_PER_MSEC),
  		stat.ios[STAT_WRITE],
  		stat.merges[STAT_WRITE],
  		(unsigned long long)stat.sectors[STAT_WRITE],
  		(unsigned int)div_u64(stat.nsecs[STAT_WRITE], NSEC_PER_MSEC),
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1259
  		inflight,
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1260
  		jiffies_to_msecs(stat.io_ticks),
8cd5b8fc0   Konstantin Khlebnikov   block/diskstats: ...
1261
1262
1263
1264
1265
  		(unsigned int)div_u64(stat.nsecs[STAT_READ] +
  				      stat.nsecs[STAT_WRITE] +
  				      stat.nsecs[STAT_DISCARD] +
  				      stat.nsecs[STAT_FLUSH],
  						NSEC_PER_MSEC),
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1266
1267
1268
1269
1270
1271
  		stat.ios[STAT_DISCARD],
  		stat.merges[STAT_DISCARD],
  		(unsigned long long)stat.sectors[STAT_DISCARD],
  		(unsigned int)div_u64(stat.nsecs[STAT_DISCARD], NSEC_PER_MSEC),
  		stat.ios[STAT_FLUSH],
  		(unsigned int)div_u64(stat.nsecs[STAT_FLUSH], NSEC_PER_MSEC));
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1272
1273
1274
1275
1276
1277
1278
1279
  }
  
  /*
   * sysfs show: prints the two in-flight counters of a partition, filled in
   * by blk_mq_in_flight_rw() for mq queues and by part_in_flight_rw()
   * otherwise.
   */
  ssize_t part_inflight_show(struct device *dev, struct device_attribute *attr,
  			   char *buf)
  {
  	struct hd_struct *p = dev_to_part(dev);
  	struct request_queue *q = part_to_disk(p)->queue;
  	unsigned int inflight[2];
  
  	if (queue_is_mq(q))
  		blk_mq_in_flight_rw(q, p, inflight);
  	else
  		part_in_flight_rw(p, inflight);
  
  	return sprintf(buf, "%8u %8u\n", inflight[0], inflight[1]);
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1288
1289
  static ssize_t disk_capability_show(struct device *dev,
  				    struct device_attribute *attr, char *buf)
86ce18d7b   Kristen Carlson Accardi   genhd: expose AN ...
1290
  {
edfaa7c36   Kay Sievers   Driver core: conv...
1291
1292
1293
1294
  	struct gendisk *disk = dev_to_disk(dev);
  
  	return sprintf(buf, "%x
  ", disk->flags);
86ce18d7b   Kristen Carlson Accardi   genhd: expose AN ...
1295
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1296

c72758f33   Martin K. Petersen   block: Export I/O...
1297
1298
1299
1300
1301
1302
1303
1304
1305
  static ssize_t disk_alignment_offset_show(struct device *dev,
  					  struct device_attribute *attr,
  					  char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  
  	return sprintf(buf, "%d
  ", queue_alignment_offset(disk->queue));
  }
86b372814   Martin K. Petersen   block: Expose dis...
1306
1307
1308
1309
1310
  static ssize_t disk_discard_alignment_show(struct device *dev,
  					   struct device_attribute *attr,
  					   char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
dd3d145d4   Martin K. Petersen   block: Fix discar...
1311
1312
  	return sprintf(buf, "%d
  ", queue_discard_alignment(disk->queue));
86b372814   Martin K. Petersen   block: Expose dis...
1313
  }
5657a819a   Joe Perches   block drivers/blo...
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
  /*
   * sysfs attributes of a disk device.  Every attribute is read-only
   * (mode 0444, no store handler) except "badblocks", which is 0644 and
   * is paired with disk_badblocks_store().
   */
  static DEVICE_ATTR(range, 0444, disk_range_show, NULL);
  static DEVICE_ATTR(ext_range, 0444, disk_ext_range_show, NULL);
  static DEVICE_ATTR(removable, 0444, disk_removable_show, NULL);
  static DEVICE_ATTR(hidden, 0444, disk_hidden_show, NULL);
  static DEVICE_ATTR(ro, 0444, disk_ro_show, NULL);
  static DEVICE_ATTR(size, 0444, part_size_show, NULL);
  static DEVICE_ATTR(alignment_offset, 0444, disk_alignment_offset_show, NULL);
  static DEVICE_ATTR(discard_alignment, 0444, disk_discard_alignment_show, NULL);
  static DEVICE_ATTR(capability, 0444, disk_capability_show, NULL);
  static DEVICE_ATTR(stat, 0444, part_stat_show, NULL);
  static DEVICE_ATTR(inflight, 0444, part_inflight_show, NULL);
  static DEVICE_ATTR(badblocks, 0644, disk_badblocks_show, disk_badblocks_store);
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1326

c17bb4951   Akinobu Mita   [PATCH] fault-inj...
1327
  #ifdef CONFIG_FAIL_MAKE_REQUEST
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
  ssize_t part_fail_show(struct device *dev,
  		       struct device_attribute *attr, char *buf)
  {
  	struct hd_struct *p = dev_to_part(dev);
  
  	return sprintf(buf, "%d
  ", p->make_it_fail);
  }
  
  /*
   * sysfs "make-it-fail" store handler.
   *
   * Parses a decimal integer from @buf and records whether it is non-zero
   * in the partition's make_it_fail flag.  Input that is empty or does not
   * parse leaves the flag untouched.
   *
   * Always returns @count, i.e. the whole write is reported as consumed.
   */
  ssize_t part_fail_store(struct device *dev,
  			struct device_attribute *attr,
  			const char *buf, size_t count)
  {
  	struct hd_struct *p = dev_to_part(dev);
  	int val;
  
  	if (count == 0)
  		return count;
  
  	/* normalise any non-zero value to 1 */
  	if (sscanf(buf, "%d", &val) > 0)
  		p->make_it_fail = (val != 0);
  
  	return count;
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1349
  static struct device_attribute dev_attr_fail =
5657a819a   Joe Perches   block drivers/blo...
1350
  	__ATTR(make-it-fail, 0644, part_fail_show, part_fail_store);
3ad5cee5c   Christoph Hellwig   block: move sysfs...
1351
  #endif /* CONFIG_FAIL_MAKE_REQUEST */
581d4e28d   Jens Axboe   block: add fault ...
1352
1353
  #ifdef CONFIG_FAIL_IO_TIMEOUT
  static struct device_attribute dev_attr_fail_timeout =
5657a819a   Joe Perches   block drivers/blo...
1354
  	__ATTR(io-timeout-fail, 0644, part_timeout_show, part_timeout_store);
581d4e28d   Jens Axboe   block: add fault ...
1355
  #endif
edfaa7c36   Kay Sievers   Driver core: conv...
1356
1357
1358
  
  static struct attribute *disk_attrs[] = {
  	&dev_attr_range.attr,
1f0142905   Tejun Heo   block: adjust for...
1359
  	&dev_attr_ext_range.attr,
edfaa7c36   Kay Sievers   Driver core: conv...
1360
  	&dev_attr_removable.attr,
8ddcd6532   Christoph Hellwig   block: introduce ...
1361
  	&dev_attr_hidden.attr,
1c9ce5276   Kay Sievers   block: export "ro...
1362
  	&dev_attr_ro.attr,
edfaa7c36   Kay Sievers   Driver core: conv...
1363
  	&dev_attr_size.attr,
c72758f33   Martin K. Petersen   block: Export I/O...
1364
  	&dev_attr_alignment_offset.attr,
86b372814   Martin K. Petersen   block: Expose dis...
1365
  	&dev_attr_discard_alignment.attr,
edfaa7c36   Kay Sievers   Driver core: conv...
1366
1367
  	&dev_attr_capability.attr,
  	&dev_attr_stat.attr,
316d315bf   Nikanth Karthikesan   block: Seperate r...
1368
  	&dev_attr_inflight.attr,
99e6608c9   Vishal Verma   block: Add badblo...
1369
  	&dev_attr_badblocks.attr,
edfaa7c36   Kay Sievers   Driver core: conv...
1370
1371
1372
  #ifdef CONFIG_FAIL_MAKE_REQUEST
  	&dev_attr_fail.attr,
  #endif
581d4e28d   Jens Axboe   block: add fault ...
1373
1374
1375
  #ifdef CONFIG_FAIL_IO_TIMEOUT
  	&dev_attr_fail_timeout.attr,
  #endif
edfaa7c36   Kay Sievers   Driver core: conv...
1376
1377
  	NULL
  };
9438b3e08   Dan Williams   block: hide badbl...
1378
1379
1380
1381
1382
1383
1384
1385
1386
  static umode_t disk_visible(struct kobject *kobj, struct attribute *a, int n)
  {
  	struct device *dev = container_of(kobj, typeof(*dev), kobj);
  	struct gendisk *disk = dev_to_disk(dev);
  
  	if (a == &dev_attr_badblocks.attr && !disk->bb)
  		return 0;
  	return a->mode;
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1387
1388
  static struct attribute_group disk_attr_group = {
  	.attrs = disk_attrs,
9438b3e08   Dan Williams   block: hide badbl...
1389
  	.is_visible = disk_visible,
edfaa7c36   Kay Sievers   Driver core: conv...
1390
  };
a4dbd6740   David Brownell   driver model: con...
1391
  static const struct attribute_group *disk_attr_groups[] = {
edfaa7c36   Kay Sievers   Driver core: conv...
1392
1393
  	&disk_attr_group,
  	NULL
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1394
  };
540eed563   Tejun Heo   block: make parti...
1395
1396
1397
1398
1399
1400
1401
1402
1403
  /**
   * disk_replace_part_tbl - replace disk->part_tbl in RCU-safe way
   * @disk: disk to replace part_tbl for
   * @new_ptbl: new part_tbl to install
   *
   * Replace disk->part_tbl with @new_ptbl in RCU-safe way.  The
   * original ptbl is freed using RCU callback.
   *
   * LOCKING:
6d2cf6f2b   Bart Van Assche   genhd: Annotate a...
1404
   * Matching bd_mutex locked or the caller is the only user of @disk.
540eed563   Tejun Heo   block: make parti...
1405
1406
1407
1408
   */
  static void disk_replace_part_tbl(struct gendisk *disk,
  				  struct disk_part_tbl *new_ptbl)
  {
6d2cf6f2b   Bart Van Assche   genhd: Annotate a...
1409
1410
  	struct disk_part_tbl *old_ptbl =
  		rcu_dereference_protected(disk->part_tbl, 1);
540eed563   Tejun Heo   block: make parti...
1411
1412
  
  	rcu_assign_pointer(disk->part_tbl, new_ptbl);
a6f23657d   Jens Axboe   block: add one-hi...
1413
1414
1415
  
  	if (old_ptbl) {
  		rcu_assign_pointer(old_ptbl->last_lookup, NULL);
57bdfbf9e   Lai Jiangshan   block,rcu: Conver...
1416
  		kfree_rcu(old_ptbl, rcu_head);
a6f23657d   Jens Axboe   block: add one-hi...
1417
  	}
540eed563   Tejun Heo   block: make parti...
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
1428
  }
  
  /**
   * disk_expand_part_tbl - expand disk->part_tbl
   * @disk: disk to expand part_tbl for
   * @partno: expand such that this partno can fit in
   *
   * Expand disk->part_tbl such that @partno can fit in.  disk->part_tbl
   * uses RCU to allow unlocked dereferencing for stats and other stuff.
   *
   * LOCKING:
6d2cf6f2b   Bart Van Assche   genhd: Annotate a...
1429
1430
   * Matching bd_mutex locked or the caller is the only user of @disk.
   * Might sleep.
540eed563   Tejun Heo   block: make parti...
1431
1432
1433
1434
1435
1436
   *
   * RETURNS:
   * 0 on success, -errno on failure.
   */
  int disk_expand_part_tbl(struct gendisk *disk, int partno)
  {
6d2cf6f2b   Bart Van Assche   genhd: Annotate a...
1437
1438
  	struct disk_part_tbl *old_ptbl =
  		rcu_dereference_protected(disk->part_tbl, 1);
540eed563   Tejun Heo   block: make parti...
1439
1440
  	struct disk_part_tbl *new_ptbl;
  	int len = old_ptbl ? old_ptbl->len : 0;
5fabcb4c3   Jens Axboe   genhd: check for ...
1441
  	int i, target;
5fabcb4c3   Jens Axboe   genhd: check for ...
1442
1443
1444
1445
1446
1447
1448
1449
  
  	/*
  	 * check for int overflow, since we can get here from blkpg_ioctl()
  	 * with a user passed 'partno'.
  	 */
  	target = partno + 1;
  	if (target < 0)
  		return -EINVAL;
540eed563   Tejun Heo   block: make parti...
1450
1451
1452
1453
1454
1455
1456
  
  	/* disk_max_parts() is zero during initialization, ignore if so */
  	if (disk_max_parts(disk) && target > disk_max_parts(disk))
  		return -EINVAL;
  
  	if (target <= len)
  		return 0;
78b90a2ce   Gustavo A. R. Silva   block: genhd: Use...
1457
1458
  	new_ptbl = kzalloc_node(struct_size(new_ptbl, part, target), GFP_KERNEL,
  				disk->node_id);
540eed563   Tejun Heo   block: make parti...
1459
1460
  	if (!new_ptbl)
  		return -ENOMEM;
540eed563   Tejun Heo   block: make parti...
1461
1462
1463
1464
1465
1466
1467
1468
  	new_ptbl->len = target;
  
  	for (i = 0; i < len; i++)
  		rcu_assign_pointer(new_ptbl->part[i], old_ptbl->part[i]);
  
  	disk_replace_part_tbl(disk, new_ptbl);
  	return 0;
  }
b5bd357cf   Luis Chamberlain   block: add docs f...
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
1484
  /**
   * disk_release - releases all allocated resources of the gendisk
   * @dev: the device representing this disk
   *
   * This function releases all allocated resources of the gendisk.
   *
   * The struct gendisk refcount is incremented with get_gendisk() or
   * get_disk_and_module(), and its refcount is decremented with
   * put_disk_and_module() or put_disk(). Once the refcount reaches 0 this
   * function is called.
   *
   * Drivers which used __device_add_disk() have a gendisk with a request_queue
   * assigned. Since the request_queue sits on top of the gendisk for these
   * drivers we also call blk_put_queue() for them, and we expect the
   * request_queue refcount to reach 0 at this point, and so the request_queue
   * will also be freed prior to the disk.
e8c7d14ac   Luis Chamberlain   block: revert bac...
1485
1486
   *
   * Context: can sleep
b5bd357cf   Luis Chamberlain   block: add docs f...
1487
   */
edfaa7c36   Kay Sievers   Driver core: conv...
1488
  static void disk_release(struct device *dev)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1489
  {
edfaa7c36   Kay Sievers   Driver core: conv...
1490
  	struct gendisk *disk = dev_to_disk(dev);
e8c7d14ac   Luis Chamberlain   block: revert bac...
1491
  	might_sleep();
2da78092d   Keith Busch   block: Fix dev_t ...
1492
  	blk_free_devt(dev->devt);
77ea887e4   Tejun Heo   implement in-kern...
1493
  	disk_release_events(disk);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1494
  	kfree(disk->random);
540eed563   Tejun Heo   block: make parti...
1495
  	disk_replace_part_tbl(disk, NULL);
b54e5ed8f   Ming Lei   block: partition:...
1496
  	hd_free_part(&disk->part0);
523e1d399   Tejun Heo   block: make gendi...
1497
1498
  	if (disk->queue)
  		blk_put_queue(disk->queue);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1499
1500
  	kfree(disk);
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1501
1502
  /* device class named "block"; assigned to each disk in __alloc_disk_node() */
  struct class block_class = {
  	.name = "block",
  };
3c2670e65   Kay Sievers   driver core: add ...
1504
  static char *block_devnode(struct device *dev, umode_t *mode,
4e4098a3e   Greg Kroah-Hartman   driver core: hand...
1505
  			   kuid_t *uid, kgid_t *gid)
b03f38b68   Kay Sievers   Driver Core: bloc...
1506
1507
  {
  	struct gendisk *disk = dev_to_disk(dev);
348e114bb   Christoph Hellwig   block: move the -...
1508
1509
  	if (disk->fops->devnode)
  		return disk->fops->devnode(disk, mode);
b03f38b68   Kay Sievers   Driver Core: bloc...
1510
1511
  	return NULL;
  }
ef45fe470   Boris Burkov   blk-cgroup: show ...
1512
  const struct device_type disk_type = {
edfaa7c36   Kay Sievers   Driver core: conv...
1513
1514
1515
  	.name		= "disk",
  	.groups		= disk_attr_groups,
  	.release	= disk_release,
e454cea20   Kay Sievers   Driver-Core: exte...
1516
  	.devnode	= block_devnode,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1517
  };
a6e2ba887   Randy Dunlap   block: make /proc...
1518
  #ifdef CONFIG_PROC_FS
cf771cb5a   Tejun Heo   block: make varia...
1519
1520
1521
1522
1523
1524
1525
1526
  /*
   * aggregate disk stat collector.  Uses the same stats that the sysfs
   * entries do, above, but makes them available through one seq_file.
   *
   * The output looks suspiciously like /proc/partitions with a bunch of
   * extra fields.
   */
  static int diskstats_show(struct seq_file *seqf, void *v)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1527
1528
  {
  	struct gendisk *gp = v;
e71bf0d0e   Tejun Heo   block: fix disk->...
1529
1530
  	struct disk_part_iter piter;
  	struct hd_struct *hd;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1531
  	char buf[BDEVNAME_SIZE];
e016b7820   Mikulas Patocka   block: return jus...
1532
  	unsigned int inflight;
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1533
  	struct disk_stats stat;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1534
1535
  
  	/*
ed9e19823   Tejun Heo   block: implement ...
1536
  	if (&disk_to_dev(gp)->kobj.entry == block_class.devices.next)
cf771cb5a   Tejun Heo   block: make varia...
1537
  		seq_puts(seqf,	"major minor name"
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1538
1539
1540
1541
1542
1543
  				"     rio rmerge rsect ruse wio wmerge "
  				"wsect wuse running use aveq"
  				"
  
  ");
  	*/
9f5e48655   Wanlong Gao   block:remove some...
1544

71982a409   Tejun Heo   block: include em...
1545
  	disk_part_iter_init(&piter, gp, DISK_PITER_INCL_EMPTY_PART0);
e71bf0d0e   Tejun Heo   block: fix disk->...
1546
  	while ((hd = disk_part_iter_next(&piter))) {
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1547
  		part_stat_read_all(hd, &stat);
b2f609e19   Christoph Hellwig   block: move the b...
1548
1549
1550
  		if (queue_is_mq(gp->queue))
  			inflight = blk_mq_in_flight(gp->queue, hd);
  		else
1f06959bd   Christoph Hellwig   block: remove the...
1551
  			inflight = part_in_flight(hd);
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1552

bdca3c87f   Michael Callahan   block: Track DISC...
1553
1554
1555
1556
  		seq_printf(seqf, "%4d %7d %s "
  			   "%lu %lu %lu %u "
  			   "%lu %lu %lu %u "
  			   "%u %u %u "
b68663186   Konstantin Khlebnikov   block: add iostat...
1557
1558
1559
1560
  			   "%lu %lu %lu %u "
  			   "%lu %u"
  			   "
  ",
f331c0296   Tejun Heo   block: don't depe...
1561
1562
  			   MAJOR(part_devt(hd)), MINOR(part_devt(hd)),
  			   disk_name(gp, hd->partno, buf),
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1563
1564
1565
1566
1567
1568
1569
1570
1571
1572
  			   stat.ios[STAT_READ],
  			   stat.merges[STAT_READ],
  			   stat.sectors[STAT_READ],
  			   (unsigned int)div_u64(stat.nsecs[STAT_READ],
  							NSEC_PER_MSEC),
  			   stat.ios[STAT_WRITE],
  			   stat.merges[STAT_WRITE],
  			   stat.sectors[STAT_WRITE],
  			   (unsigned int)div_u64(stat.nsecs[STAT_WRITE],
  							NSEC_PER_MSEC),
e016b7820   Mikulas Patocka   block: return jus...
1573
  			   inflight,
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1574
  			   jiffies_to_msecs(stat.io_ticks),
8cd5b8fc0   Konstantin Khlebnikov   block/diskstats: ...
1575
1576
1577
1578
1579
  			   (unsigned int)div_u64(stat.nsecs[STAT_READ] +
  						 stat.nsecs[STAT_WRITE] +
  						 stat.nsecs[STAT_DISCARD] +
  						 stat.nsecs[STAT_FLUSH],
  							NSEC_PER_MSEC),
ea18e0f0a   Konstantin Khlebnikov   block/diskstats: ...
1580
1581
1582
1583
1584
1585
1586
1587
  			   stat.ios[STAT_DISCARD],
  			   stat.merges[STAT_DISCARD],
  			   stat.sectors[STAT_DISCARD],
  			   (unsigned int)div_u64(stat.nsecs[STAT_DISCARD],
  						 NSEC_PER_MSEC),
  			   stat.ios[STAT_FLUSH],
  			   (unsigned int)div_u64(stat.nsecs[STAT_FLUSH],
  						 NSEC_PER_MSEC)
28f39d553   Jerome Marchand   Enhanced partitio...
1588
  			);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1589
  	}
e71bf0d0e   Tejun Heo   block: fix disk->...
1590
  	disk_part_iter_exit(&piter);
9f5e48655   Wanlong Gao   block:remove some...
1591

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1592
1593
  	return 0;
  }
31d85ab28   Alexey Dobriyan   proc: move /proc/...
1594
  static const struct seq_operations diskstats_op = {
def4e38dd   Tejun Heo   block: use class_...
1595
1596
1597
  	.start	= disk_seqf_start,
  	.next	= disk_seqf_next,
  	.stop	= disk_seqf_stop,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1598
1599
  	.show	= diskstats_show
  };
f500975a3   Alexey Dobriyan   proc: move rest o...
1600
1601
1602
  
  /*
   * Create the "diskstats" and "partitions" proc entries.  The results of
   * proc_create_seq() are not checked; the function always returns 0.
   */
  static int __init proc_genhd_init(void)
  {
  	proc_create_seq("diskstats", 0, NULL, &diskstats_op);
  	proc_create_seq("partitions", 0, NULL, &partitions_op);
  
  	return 0;
  }
  module_init(proc_genhd_init);
a6e2ba887   Randy Dunlap   block: make /proc...
1608
  #endif /* CONFIG_PROC_FS */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1609

cf771cb5a   Tejun Heo   block: make varia...
1610
  dev_t blk_lookup_devt(const char *name, int partno)
a142be856   Greg Kroah-Hartman   block: make blk_l...
1611
  {
def4e38dd   Tejun Heo   block: use class_...
1612
1613
1614
  	dev_t devt = MKDEV(0, 0);
  	struct class_dev_iter iter;
  	struct device *dev;
a142be856   Greg Kroah-Hartman   block: make blk_l...
1615

def4e38dd   Tejun Heo   block: use class_...
1616
1617
  	class_dev_iter_init(&iter, &block_class, NULL, &disk_type);
  	while ((dev = class_dev_iter_next(&iter))) {
a142be856   Greg Kroah-Hartman   block: make blk_l...
1618
  		struct gendisk *disk = dev_to_disk(dev);
548b10eb2   Tejun Heo   block: move __dev...
1619
  		struct hd_struct *part;
a142be856   Greg Kroah-Hartman   block: make blk_l...
1620

3ada8b7e9   Kay Sievers   block: struct dev...
1621
  		if (strcmp(dev_name(dev), name))
f331c0296   Tejun Heo   block: don't depe...
1622
  			continue;
f331c0296   Tejun Heo   block: don't depe...
1623

41b8c853a   Neil Brown   block: fix bootin...
1624
1625
1626
1627
1628
1629
1630
1631
  		if (partno < disk->minors) {
  			/* We need to return the right devno, even
  			 * if the partition doesn't exist yet.
  			 */
  			devt = MKDEV(MAJOR(dev->devt),
  				     MINOR(dev->devt) + partno);
  			break;
  		}
548b10eb2   Tejun Heo   block: move __dev...
1632
  		part = disk_get_part(disk, partno);
2bbedcb4c   Tejun Heo   block: don't test...
1633
  		if (part) {
f331c0296   Tejun Heo   block: don't depe...
1634
  			devt = part_devt(part);
e71bf0d0e   Tejun Heo   block: fix disk->...
1635
  			disk_put_part(part);
548b10eb2   Tejun Heo   block: move __dev...
1636
  			break;
def4e38dd   Tejun Heo   block: use class_...
1637
  		}
548b10eb2   Tejun Heo   block: move __dev...
1638
  		disk_put_part(part);
5c0ef6d02   Kay Sievers   block: drop refer...
1639
  	}
def4e38dd   Tejun Heo   block: use class_...
1640
  	class_dev_iter_exit(&iter);
edfaa7c36   Kay Sievers   Driver core: conv...
1641
1642
  	return devt;
  }
edfaa7c36   Kay Sievers   Driver core: conv...
1643

e319e1fbd   Byungchul Park   block, locking/lo...
1644
  struct gendisk *__alloc_disk_node(int minors, int node_id)
1946089a1   Christoph Lameter   [PATCH] NUMA awar...
1645
1646
  {
  	struct gendisk *disk;
6d2cf6f2b   Bart Van Assche   genhd: Annotate a...
1647
  	struct disk_part_tbl *ptbl;
1946089a1   Christoph Lameter   [PATCH] NUMA awar...
1648

de65b0123   Christoph Hellwig   block: reject att...
1649
1650
  	if (minors > DISK_MAX_PARTS) {
  		printk(KERN_ERR
7fb526212   Randy Dunlap   block: genhd.c: f...
1651
1652
  			"block: can't allocate more than %d partitions
  ",
de65b0123   Christoph Hellwig   block: reject att...
1653
1654
1655
  			DISK_MAX_PARTS);
  		minors = DISK_MAX_PARTS;
  	}
1946089a1   Christoph Lameter   [PATCH] NUMA awar...
1656

c1b511eb2   Joe Perches   block: Convert km...
1657
  	disk = kzalloc_node(sizeof(struct gendisk), GFP_KERNEL, node_id);
f93af2a49   Christoph Hellwig   block: cleanup __...
1658
1659
  	if (!disk)
  		return NULL;
6c23a9681   Jens Axboe   block: add intern...
1660

f93af2a49   Christoph Hellwig   block: cleanup __...
1661
1662
1663
  	disk->part0.dkstats = alloc_percpu(struct disk_stats);
  	if (!disk->part0.dkstats)
  		goto out_free_disk;
b5d0b9df0   Tejun Heo   block: introduce ...
1664

f93af2a49   Christoph Hellwig   block: cleanup __...
1665
1666
1667
1668
1669
  	init_rwsem(&disk->lookup_sem);
  	disk->node_id = node_id;
  	if (disk_expand_part_tbl(disk, 0)) {
  		free_percpu(disk->part0.dkstats);
  		goto out_free_disk;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1670
  	}
f93af2a49   Christoph Hellwig   block: cleanup __...
1671
1672
1673
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
1684
1685
1686
1687
1688
1689
1690
1691
1692
  
  	ptbl = rcu_dereference_protected(disk->part_tbl, 1);
  	rcu_assign_pointer(ptbl->part[0], &disk->part0);
  
  	/*
  	 * set_capacity() and get_capacity() currently don't use
  	 * seqcounter to read/update the part0->nr_sects. Still init
  	 * the counter as we can read the sectors in IO submission
  	 * patch using seqence counters.
  	 *
  	 * TODO: Ideally set_capacity() and get_capacity() should be
  	 * converted to make use of bd_mutex and sequence counters.
  	 */
  	hd_sects_seq_init(&disk->part0);
  	if (hd_ref_init(&disk->part0))
  		goto out_free_part0;
  
  	disk->minors = minors;
  	rand_initialize_disk(disk);
  	disk_to_dev(disk)->class = &block_class;
  	disk_to_dev(disk)->type = &disk_type;
  	device_initialize(disk_to_dev(disk));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1693
  	return disk;
f93af2a49   Christoph Hellwig   block: cleanup __...
1694
1695
1696
1697
1698
1699
  
  out_free_part0:
  	hd_free_part(&disk->part0);
  out_free_disk:
  	kfree(disk);
  	return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1700
  }
e319e1fbd   Byungchul Park   block, locking/lo...
1701
  EXPORT_SYMBOL(__alloc_disk_node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1702

b5bd357cf   Luis Chamberlain   block: add docs f...
1703
1704
  /**
   * get_disk_and_module - increments the gendisk and gendisk fops module refcount
0d20dcc27   Randy Dunlap   block: genhd: del...
1705
   * @disk: the struct gendisk to increment the refcount for
b5bd357cf   Luis Chamberlain   block: add docs f...
1706
1707
1708
   *
   * This increments the refcount for the struct gendisk, and the gendisk's
   * fops module owner.
763b58923   Luis Chamberlain   block: clarify co...
1709
1710
   *
   * Context: Any context.
b5bd357cf   Luis Chamberlain   block: add docs f...
1711
   */
3079c22ea   Jan Kara   genhd: Rename get...
1712
  struct kobject *get_disk_and_module(struct gendisk *disk)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1713
1714
1715
1716
1717
1718
1719
1720
1721
  {
  	struct module *owner;
  	struct kobject *kobj;
  
  	if (!disk->fops)
  		return NULL;
  	owner = disk->fops->owner;
  	if (owner && !try_module_get(owner))
  		return NULL;
d01b2dcb4   Jan Kara   block: Fix oops s...
1722
  	kobj = kobject_get_unless_zero(&disk_to_dev(disk)->kobj);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1723
1724
1725
1726
1727
1728
1729
  	if (kobj == NULL) {
  		module_put(owner);
  		return NULL;
  	}
  	return kobj;
  
  }
3079c22ea   Jan Kara   genhd: Rename get...
1730
  EXPORT_SYMBOL(get_disk_and_module);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1731

b5bd357cf   Luis Chamberlain   block: add docs f...
1732
1733
  /**
   * put_disk - decrements the gendisk refcount
0d20dcc27   Randy Dunlap   block: genhd: del...
1734
   * @disk: the struct gendisk to decrement the refcount for
b5bd357cf   Luis Chamberlain   block: add docs f...
1735
1736
1737
   *
   * This decrements the refcount for the struct gendisk. When this reaches 0
   * we'll have disk_release() called.
e8c7d14ac   Luis Chamberlain   block: revert bac...
1738
1739
1740
   *
   * Context: Any context, but the last reference must not be dropped from
   *          atomic context.
b5bd357cf   Luis Chamberlain   block: add docs f...
1741
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1742
1743
1744
  void put_disk(struct gendisk *disk)
  {
  	if (disk)
ed9e19823   Tejun Heo   block: implement ...
1745
  		kobject_put(&disk_to_dev(disk)->kobj);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1746
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1747
  EXPORT_SYMBOL(put_disk);
b5bd357cf   Luis Chamberlain   block: add docs f...
1748
1749
  /**
   * put_disk_and_module - decrements the module and gendisk refcount
   * @disk: the struct gendisk to decrement the refcount for (may be NULL)
   *
   * This is a counterpart of get_disk_and_module() and thus also of
   * get_gendisk().
   *
   * Context: Any context, but the last reference must not be dropped from
   *          atomic context.
   */
  void put_disk_and_module(struct gendisk *disk)
  {
  	struct module *owner;
  
  	if (!disk)
  		return;
  
  	/* read the owner first: @disk is not touched after put_disk() */
  	owner = disk->fops->owner;
  	put_disk(disk);
  	module_put(owner);
  }
  EXPORT_SYMBOL(put_disk_and_module);
e3264a4d7   Hannes Reinecke   Send uevents for ...
1768
1769
1770
1771
1772
1773
1774
1775
1776
  /*
   * Send a KOBJ_CHANGE uevent for @gd carrying "DISK_RO=1" when @ro is
   * non-zero and "DISK_RO=0" otherwise.
   */
  static void set_disk_ro_uevent(struct gendisk *gd, int ro)
  {
  	char event[] = "DISK_RO=1";
  	char *envp[] = { event, NULL };
  
  	/* index 8 is the digit after "DISK_RO=" */
  	event[8] = ro ? '1' : '0';
  
  	kobject_uevent_env(&disk_to_dev(gd)->kobj, KOBJ_CHANGE, envp);
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1777
1778
  void set_device_ro(struct block_device *bdev, int flag)
  {
b7db9956e   Tejun Heo   block: move polic...
1779
  	bdev->bd_part->policy = flag;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1780
1781
1782
1783
1784
1785
  }
  
  EXPORT_SYMBOL(set_device_ro);
  
  void set_disk_ro(struct gendisk *disk, int flag)
  {
e71bf0d0e   Tejun Heo   block: fix disk->...
1786
1787
  	struct disk_part_iter piter;
  	struct hd_struct *part;
e3264a4d7   Hannes Reinecke   Send uevents for ...
1788
1789
1790
1791
1792
1793
  	if (disk->part0.policy != flag) {
  		set_disk_ro_uevent(disk, flag);
  		disk->part0.policy = flag;
  	}
  
  	disk_part_iter_init(&piter, disk, DISK_PITER_INCL_EMPTY);
e71bf0d0e   Tejun Heo   block: fix disk->...
1794
1795
1796
  	while ((part = disk_part_iter_next(&piter)))
  		part->policy = flag;
  	disk_part_iter_exit(&piter);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1797
1798
1799
1800
1801
1802
1803
1804
  }
  
  EXPORT_SYMBOL(set_disk_ro);
  
  int bdev_read_only(struct block_device *bdev)
  {
  	if (!bdev)
  		return 0;
b7db9956e   Tejun Heo   block: move polic...
1805
  	return bdev->bd_part->policy;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1806
1807
1808
  }
  
  EXPORT_SYMBOL(bdev_read_only);
77ea887e4   Tejun Heo   implement in-kern...
1809
1810
1811
1812
1813
1814
1815
  /*
   * Disk events - monitor disk events like media change and eject request.
   */
  struct disk_events {
  	struct list_head	node;		/* all disk_event's */
  	struct gendisk		*disk;		/* the associated disk */
  	spinlock_t		lock;
fdd514e16   Tejun Heo   block: make disk_...
1816
  	struct mutex		block_mutex;	/* protects blocking */
77ea887e4   Tejun Heo   implement in-kern...
1817
1818
1819
1820
1821
1822
1823
1824
1825
1826
1827
1828
1829
1830
1831
1832
1833
1834
1835
1836
1837
1838
1839
  	int			block;		/* event blocking depth */
  	unsigned int		pending;	/* events already sent out */
  	unsigned int		clearing;	/* events being cleared */
  
  	long			poll_msecs;	/* interval, -1 for default */
  	struct delayed_work	dwork;
  };
  
  /*
   * Event names, indexed by the bit position (ilog2) of the matching
   * DISK_EVENT_* flag.
   */
  static const char *disk_events_strs[] = {
  	[ilog2(DISK_EVENT_MEDIA_CHANGE)]	= "media_change",
  	[ilog2(DISK_EVENT_EJECT_REQUEST)]	= "eject_request",
  };
  
  /*
   * "KEY=1" strings, indexed by the bit position (ilog2) of the matching
   * DISK_EVENT_* flag.  Presumably used as uevent environment entries;
   * the consumer is outside this part of the file.
   */
  static char *disk_uevents[] = {
  	[ilog2(DISK_EVENT_MEDIA_CHANGE)]	= "DISK_MEDIA_CHANGE=1",
  	[ilog2(DISK_EVENT_EJECT_REQUEST)]	= "DISK_EJECT_REQUEST=1",
  };
  
  /* global list of every struct disk_events, with its mutex */
  static DEFINE_MUTEX(disk_events_mutex);
  static LIST_HEAD(disk_events);
  
  /* default poll interval in msecs; zero-initialised, i.e. polling off */
  static unsigned long disk_events_dfl_poll_msecs;
77ea887e4   Tejun Heo   implement in-kern...
1841
1842
1843
1844
1845
1846
1847
1848
  
  static unsigned long disk_events_poll_jiffies(struct gendisk *disk)
  {
  	struct disk_events *ev = disk->ev;
  	long intv_msecs = 0;
  
  	/*
  	 * If device-specific poll interval is set, always use it.  If
673387a93   Martin Wilck   block: genhd: rem...
1849
  	 * the default is being used, poll if the POLL flag is set.
77ea887e4   Tejun Heo   implement in-kern...
1850
1851
1852
  	 */
  	if (ev->poll_msecs >= 0)
  		intv_msecs = ev->poll_msecs;
c92e2f04b   Martin Wilck   block: disk_event...
1853
  	else if (disk->event_flags & DISK_EVENT_FLAG_POLL)
77ea887e4   Tejun Heo   implement in-kern...
1854
1855
1856
1857
  		intv_msecs = disk_events_dfl_poll_msecs;
  
  	return msecs_to_jiffies(intv_msecs);
  }
c3af54afb   Tejun Heo   block: remove non...
1858
1859
1860
1861
1862
1863
1864
1865
1866
1867
1868
1869
1870
1871
1872
1873
  /**
   * disk_block_events - block and flush disk event checking
   * @disk: disk to block events for
   *
   * On return from this function, it is guaranteed that event checking
   * isn't in progress and won't happen until unblocked by
   * disk_unblock_events().  Events blocking is counted and the actual
   * unblocking happens after the matching number of unblocks are done.
   *
   * Note that this intentionally does not block event checking from
   * disk_clear_events().
   *
   * CONTEXT:
   * Might sleep.
   */
  void disk_block_events(struct gendisk *disk)
77ea887e4   Tejun Heo   implement in-kern...
1874
1875
1876
1877
  {
  	struct disk_events *ev = disk->ev;
  	unsigned long flags;
  	bool cancel;
c3af54afb   Tejun Heo   block: remove non...
1878
1879
  	if (!ev)
  		return;
fdd514e16   Tejun Heo   block: make disk_...
1880
1881
1882
1883
1884
  	/*
  	 * Outer mutex ensures that the first blocker completes canceling
  	 * the event work before further blockers are allowed to finish.
  	 */
  	mutex_lock(&ev->block_mutex);
77ea887e4   Tejun Heo   implement in-kern...
1885
1886
1887
  	spin_lock_irqsave(&ev->lock, flags);
  	cancel = !ev->block++;
  	spin_unlock_irqrestore(&ev->lock, flags);
c3af54afb   Tejun Heo   block: remove non...
1888
1889
  	if (cancel)
  		cancel_delayed_work_sync(&disk->ev->dwork);
fdd514e16   Tejun Heo   block: make disk_...
1890
1891
  
  	mutex_unlock(&ev->block_mutex);
77ea887e4   Tejun Heo   implement in-kern...
1892
1893
1894
1895
1896
1897
1898
1899
1900
1901
1902
1903
1904
1905
1906
  }
  
  /*
   * Drop one level of event blocking on @disk.
   *
   * When the block count reaches zero the event work is queued on
   * system_freezable_power_efficient_wq: immediately if @check_now is
   * set, otherwise after the poll interval if that interval is non-zero.
   * An unbalanced call (count already <= 0) triggers a one-time warning
   * and changes nothing.
   */
  static void __disk_unblock_events(struct gendisk *disk, bool check_now)
  {
  	struct disk_events *ev = disk->ev;
  	unsigned long intv;
  	unsigned long flags;
  
  	spin_lock_irqsave(&ev->lock, flags);
  
  	if (!WARN_ON_ONCE(ev->block <= 0) && --ev->block == 0) {
  		intv = disk_events_poll_jiffies(disk);
  		if (check_now)
  			queue_delayed_work(system_freezable_power_efficient_wq,
  					   &ev->dwork, 0);
  		else if (intv)
  			queue_delayed_work(system_freezable_power_efficient_wq,
  					   &ev->dwork, intv);
  	}
  
  	spin_unlock_irqrestore(&ev->lock, flags);
  }
  
  /**
   * disk_unblock_events - unblock disk event checking
   * @disk: disk to unblock events for
   *
   * Counterpart of disk_block_events().  Once the block count drops to
   * zero, event polling is started if it is configured.
   *
   * CONTEXT:
   * Don't care.  Safe to call from irq context.
   */
  void disk_unblock_events(struct gendisk *disk)
  {
  	/* Disks without events state were never blocked. */
  	if (!disk->ev)
  		return;

  	__disk_unblock_events(disk, false);
  }
  
  /**
85ef06d1d   Tejun Heo   block: flush MEDI...
1935
1936
1937
   * disk_flush_events - schedule immediate event checking and flushing
   * @disk: disk to check and flush events for
   * @mask: events to flush
77ea887e4   Tejun Heo   implement in-kern...
1938
   *
85ef06d1d   Tejun Heo   block: flush MEDI...
1939
1940
1941
   * Schedule immediate event checking on @disk if not blocked.  Events in
   * @mask are scheduled to be cleared from the driver.  Note that this
   * doesn't clear the events from @disk->ev.
77ea887e4   Tejun Heo   implement in-kern...
1942
1943
   *
   * CONTEXT:
85ef06d1d   Tejun Heo   block: flush MEDI...
1944
   * If @mask is non-zero must be called with bdev->bd_mutex held.
77ea887e4   Tejun Heo   implement in-kern...
1945
   */
85ef06d1d   Tejun Heo   block: flush MEDI...
1946
  void disk_flush_events(struct gendisk *disk, unsigned int mask)
77ea887e4   Tejun Heo   implement in-kern...
1947
  {
a9dce2a3b   Tejun Heo   block: don't use ...
1948
  	struct disk_events *ev = disk->ev;
a9dce2a3b   Tejun Heo   block: don't use ...
1949
1950
1951
  
  	if (!ev)
  		return;
85ef06d1d   Tejun Heo   block: flush MEDI...
1952
1953
  	spin_lock_irq(&ev->lock);
  	ev->clearing |= mask;
41f63c535   Tejun Heo   workqueue: use mo...
1954
  	if (!ev->block)
695588f94   Viresh Kumar   block: queue work...
1955
1956
  		mod_delayed_work(system_freezable_power_efficient_wq,
  				&ev->dwork, 0);
85ef06d1d   Tejun Heo   block: flush MEDI...
1957
  	spin_unlock_irq(&ev->lock);
77ea887e4   Tejun Heo   implement in-kern...
1958
  }
77ea887e4   Tejun Heo   implement in-kern...
1959
1960
1961
1962
  
  /**
   * disk_clear_events - synchronously check, clear and return pending events
   * @disk: disk to fetch and clear events from
da3dae54e   Masanari Iida   Documentation: Do...
1963
   * @mask: mask of events to be fetched and cleared
77ea887e4   Tejun Heo   implement in-kern...
1964
1965
1966
1967
1968
1969
1970
   *
   * Disk events are synchronously checked and pending events in @mask
   * are cleared and returned.  This ignores the block count.
   *
   * CONTEXT:
   * Might sleep.
   */
95f6f3a46   Christoph Hellwig   block: add a bdev...
1971
  static unsigned int disk_clear_events(struct gendisk *disk, unsigned int mask)
77ea887e4   Tejun Heo   implement in-kern...
1972
  {
77ea887e4   Tejun Heo   implement in-kern...
1973
1974
  	struct disk_events *ev = disk->ev;
  	unsigned int pending;
12c2bdb23   Derek Basehore   block: prevent ra...
1975
  	unsigned int clearing = mask;
77ea887e4   Tejun Heo   implement in-kern...
1976

a564e23f0   Christoph Hellwig   md: switch to ->c...
1977
  	if (!ev)
77ea887e4   Tejun Heo   implement in-kern...
1978
  		return 0;
77ea887e4   Tejun Heo   implement in-kern...
1979

12c2bdb23   Derek Basehore   block: prevent ra...
1980
1981
1982
1983
1984
1985
1986
  	disk_block_events(disk);
  
  	/*
  	 * store the union of mask and ev->clearing on the stack so that the
  	 * race with disk_flush_events does not cause ambiguity (ev->clearing
  	 * can still be modified even if events are blocked).
  	 */
77ea887e4   Tejun Heo   implement in-kern...
1987
  	spin_lock_irq(&ev->lock);
12c2bdb23   Derek Basehore   block: prevent ra...
1988
1989
  	clearing |= ev->clearing;
  	ev->clearing = 0;
77ea887e4   Tejun Heo   implement in-kern...
1990
  	spin_unlock_irq(&ev->lock);
12c2bdb23   Derek Basehore   block: prevent ra...
1991
  	disk_check_events(ev, &clearing);
aea24a8bb   Derek Basehore   block: remove dea...
1992
  	/*
12c2bdb23   Derek Basehore   block: prevent ra...
1993
1994
  	 * if ev->clearing is not 0, the disk_flush_events got called in the
  	 * middle of this function, so we want to run the workfn without delay.
aea24a8bb   Derek Basehore   block: remove dea...
1995
  	 */
12c2bdb23   Derek Basehore   block: prevent ra...
1996
  	__disk_unblock_events(disk, ev->clearing ? true : false);
77ea887e4   Tejun Heo   implement in-kern...
1997
1998
1999
  
  	/* then, fetch and clear pending events */
  	spin_lock_irq(&ev->lock);
77ea887e4   Tejun Heo   implement in-kern...
2000
2001
2002
  	pending = ev->pending & mask;
  	ev->pending &= ~mask;
  	spin_unlock_irq(&ev->lock);
12c2bdb23   Derek Basehore   block: prevent ra...
2003
  	WARN_ON_ONCE(clearing & mask);
77ea887e4   Tejun Heo   implement in-kern...
2004
2005
2006
  
  	return pending;
  }
95f6f3a46   Christoph Hellwig   block: add a bdev...
2007
2008
2009
2010
2011
2012
2013
2014
2015
2016
2017
2018
2019
2020
2021
2022
2023
2024
2025
2026
2027
2028
2029
  /**
   * bdev_check_media_change - check if a removable media has been changed
   * @bdev: block device to check
   *
   * Check whether a removable media has been changed, and attempt to free all
   * dentries and inodes and invalidates all block device page cache entries in
   * that case.
   *
   * Returns %true if the block device changed, or %false if not.
   */
  bool bdev_check_media_change(struct block_device *bdev)
  {
  	unsigned int events;
  
  	events = disk_clear_events(bdev->bd_disk, DISK_EVENT_MEDIA_CHANGE |
  				   DISK_EVENT_EJECT_REQUEST);
  	if (!(events & DISK_EVENT_MEDIA_CHANGE))
  		return false;
  
  	if (__invalidate_device(bdev, true))
  		pr_warn("VFS: busy inodes on changed media %s
  ",
  			bdev->bd_disk->disk_name);
38430f087   Christoph Hellwig   block: move the N...
2030
  	set_bit(GD_NEED_PART_SCAN, &bdev->bd_disk->state);
95f6f3a46   Christoph Hellwig   block: add a bdev...
2031
2032
2033
  	return true;
  }
  EXPORT_SYMBOL(bdev_check_media_change);
12c2bdb23   Derek Basehore   block: prevent ra...
2034
2035
2036
2037
  /*
   * Separate this part out so that a different pointer for clearing_ptr can be
   * passed in for disk_clear_events.
   */
77ea887e4   Tejun Heo   implement in-kern...
2038
2039
2040
2041
  static void disk_events_workfn(struct work_struct *work)
  {
  	struct delayed_work *dwork = to_delayed_work(work);
  	struct disk_events *ev = container_of(dwork, struct disk_events, dwork);
12c2bdb23   Derek Basehore   block: prevent ra...
2042
2043
2044
2045
2046
2047
2048
  
  	disk_check_events(ev, &ev->clearing);
  }
  
  static void disk_check_events(struct disk_events *ev,
  			      unsigned int *clearing_ptr)
  {
77ea887e4   Tejun Heo   implement in-kern...
2049
2050
  	struct gendisk *disk = ev->disk;
  	char *envp[ARRAY_SIZE(disk_uevents) + 1] = { };
12c2bdb23   Derek Basehore   block: prevent ra...
2051
  	unsigned int clearing = *clearing_ptr;
77ea887e4   Tejun Heo   implement in-kern...
2052
2053
2054
2055
2056
2057
2058
2059
2060
2061
2062
2063
  	unsigned int events;
  	unsigned long intv;
  	int nr_events = 0, i;
  
  	/* check events */
  	events = disk->fops->check_events(disk, clearing);
  
  	/* accumulate pending events and schedule next poll if necessary */
  	spin_lock_irq(&ev->lock);
  
  	events &= ~ev->pending;
  	ev->pending |= events;
12c2bdb23   Derek Basehore   block: prevent ra...
2064
  	*clearing_ptr &= ~clearing;
77ea887e4   Tejun Heo   implement in-kern...
2065
2066
2067
  
  	intv = disk_events_poll_jiffies(disk);
  	if (!ev->block && intv)
695588f94   Viresh Kumar   block: queue work...
2068
2069
  		queue_delayed_work(system_freezable_power_efficient_wq,
  				&ev->dwork, intv);
77ea887e4   Tejun Heo   implement in-kern...
2070
2071
  
  	spin_unlock_irq(&ev->lock);
7c88a168d   Tejun Heo   block: don't prop...
2072
2073
  	/*
  	 * Tell userland about new events.  Only the events listed in
c92e2f04b   Martin Wilck   block: disk_event...
2074
2075
2076
  	 * @disk->events are reported, and only if DISK_EVENT_FLAG_UEVENT
  	 * is set. Otherwise, events are processed internally but never
  	 * get reported to userland.
7c88a168d   Tejun Heo   block: don't prop...
2077
  	 */
77ea887e4   Tejun Heo   implement in-kern...
2078
  	for (i = 0; i < ARRAY_SIZE(disk_uevents); i++)
c92e2f04b   Martin Wilck   block: disk_event...
2079
2080
  		if ((events & disk->events & (1 << i)) &&
  		    (disk->event_flags & DISK_EVENT_FLAG_UEVENT))
77ea887e4   Tejun Heo   implement in-kern...
2081
2082
2083
2084
2085
2086
2087
2088
2089
2090
2091
2092
  			envp[nr_events++] = disk_uevents[i];
  
  	if (nr_events)
  		kobject_uevent_env(&disk_to_dev(disk)->kobj, KOBJ_CHANGE, envp);
  }
  
  /*
   * A disk events enabled device has the following sysfs nodes under
   * its /sys/block/X/ directory.
   *
   * events		: list of all supported events
   * events_async		: list of events which can be detected w/o polling
673387a93   Martin Wilck   block: genhd: rem...
2093
   *			  (always empty, only for backwards compatibility)
77ea887e4   Tejun Heo   implement in-kern...
2094
2095
2096
2097
2098
2099
2100
2101
2102
2103
2104
2105
2106
2107
2108
2109
2110
2111
2112
2113
2114
2115
2116
2117
   * events_poll_msecs	: polling interval, 0: disable, -1: system default
   */
  /*
   * Format the names of the events set in @events into @buf, separated by
   * single spaces and terminated by a newline.  Nothing is written when no
   * known event bit is set.  Returns the number of bytes written.
   */
  static ssize_t __disk_events_show(unsigned int events, char *buf)
  {
  	const char *delim = "";
  	ssize_t pos = 0;
  	int i;

  	for (i = 0; i < ARRAY_SIZE(disk_events_strs); i++) {
  		if (!(events & (1 << i)))
  			continue;

  		pos += sprintf(buf + pos, "%s%s", delim, disk_events_strs[i]);
  		/* Every name after the first is preceded by a space. */
  		delim = " ";
  	}

  	/* Terminate the list only if at least one name was emitted. */
  	if (pos)
  		pos += sprintf(buf + pos, "\n");
  	return pos;
  }
  
  static ssize_t disk_events_show(struct device *dev,
  				struct device_attribute *attr, char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
c92e2f04b   Martin Wilck   block: disk_event...
2118
2119
  	if (!(disk->event_flags & DISK_EVENT_FLAG_UEVENT))
  		return 0;
77ea887e4   Tejun Heo   implement in-kern...
2120
2121
2122
2123
2124
2125
  	return __disk_events_show(disk->events, buf);
  }
  
  /*
   * sysfs show handler for "events_async".  The attribute is always empty
   * and exists only for backwards compatibility.
   */
  static ssize_t disk_events_async_show(struct device *dev,
  				      struct device_attribute *attr,
  				      char *buf)
  {
  	return 0;
  }
  
  static ssize_t disk_events_poll_msecs_show(struct device *dev,
  					   struct device_attribute *attr,
  					   char *buf)
  {
  	struct gendisk *disk = dev_to_disk(dev);
cdf3e3deb   Martin Wilck   block: check_even...
2134
2135
2136
  	if (!disk->ev)
  		return sprintf(buf, "-1
  ");
77ea887e4   Tejun Heo   implement in-kern...
2137
2138
2139
2140
2141
2142
2143
2144
2145
2146
2147
2148
2149
2150
2151
2152
  	return sprintf(buf, "%ld
  ", disk->ev->poll_msecs);
  }
  
  static ssize_t disk_events_poll_msecs_store(struct device *dev,
  					    struct device_attribute *attr,
  					    const char *buf, size_t count)
  {
  	struct gendisk *disk = dev_to_disk(dev);
  	long intv;
  
  	if (!count || !sscanf(buf, "%ld", &intv))
  		return -EINVAL;
  
  	if (intv < 0 && intv != -1)
  		return -EINVAL;
cdf3e3deb   Martin Wilck   block: check_even...
2153
2154
  	if (!disk->ev)
  		return -ENODEV;
c3af54afb   Tejun Heo   block: remove non...
2155
  	disk_block_events(disk);
77ea887e4   Tejun Heo   implement in-kern...
2156
2157
2158
2159
2160
  	disk->ev->poll_msecs = intv;
  	__disk_unblock_events(disk, true);
  
  	return count;
  }
5657a819a   Joe Perches   block drivers/blo...
2161
2162
2163
  /*
   * Device attributes for disk events: "events" and "events_async" are
   * read-only (0444, no store handler); "events_poll_msecs" is 0644 and
   * has both show and store handlers.
   */
  static const DEVICE_ATTR(events, 0444,
  			 disk_events_show, NULL);
  static const DEVICE_ATTR(events_async, 0444,
  			 disk_events_async_show, NULL);
  static const DEVICE_ATTR(events_poll_msecs, 0644,
  			 disk_events_poll_msecs_show,
  			 disk_events_poll_msecs_store);

  /* NULL-terminated list of the attributes declared above. */
  static const struct attribute *disk_events_attrs[] = {
  	&dev_attr_events.attr,
  	&dev_attr_events_async.attr,
  	&dev_attr_events_poll_msecs.attr,
  	NULL,
  };
  
  /*
   * The default polling interval can be specified by the kernel
   * parameter block.events_dfl_poll_msecs which defaults to 0
   * (disable).  This can also be modified runtime by writing to
1624b0b20   Akinobu Mita   block: fix sysfs ...
2178
   * /sys/module/block/parameters/events_dfl_poll_msecs.
77ea887e4   Tejun Heo   implement in-kern...
2179
2180
2181
2182
2183
2184
2185
2186
2187
2188
2189
2190
2191
2192
   */
  static int disk_events_set_dfl_poll_msecs(const char *val,
  					  const struct kernel_param *kp)
  {
  	struct disk_events *ev;
  	int ret;
  
  	ret = param_set_ulong(val, kp);
  	if (ret < 0)
  		return ret;
  
  	mutex_lock(&disk_events_mutex);
  
  	list_for_each_entry(ev, &disk_events, node)
85ef06d1d   Tejun Heo   block: flush MEDI...
2193
  		disk_flush_events(ev->disk, 0);
77ea887e4   Tejun Heo   implement in-kern...
2194
2195
2196
2197
2198
2199
2200
2201
2202
2203
2204
2205
2206
2207
2208
2209
2210
2211
  
  	mutex_unlock(&disk_events_mutex);
  
  	return 0;
  }
  
  /*
   * Parameter operations for events_dfl_poll_msecs: writes go through
   * disk_events_set_dfl_poll_msecs(), reads use the stock unsigned long
   * getter.
   */
  static const struct kernel_param_ops disk_events_dfl_poll_msecs_param_ops = {
  	.set	= disk_events_set_dfl_poll_msecs,
  	.get	= param_get_ulong,
  };
  
  /* Use the "block." prefix for the parameter registered below. */
  #undef MODULE_PARAM_PREFIX
  #define MODULE_PARAM_PREFIX	"block."
  
  /* Register events_dfl_poll_msecs with mode 0644. */
  module_param_cb(events_dfl_poll_msecs, &disk_events_dfl_poll_msecs_param_ops,
  		&disk_events_dfl_poll_msecs, 0644);
  
  /*
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
2212
   * disk_{alloc|add|del|release}_events - initialize and destroy disk_events.
77ea887e4   Tejun Heo   implement in-kern...
2213
   */
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
2214
  static void disk_alloc_events(struct gendisk *disk)
77ea887e4   Tejun Heo   implement in-kern...
2215
2216
  {
  	struct disk_events *ev;
cdf3e3deb   Martin Wilck   block: check_even...
2217
  	if (!disk->fops->check_events || !disk->events)
77ea887e4   Tejun Heo   implement in-kern...
2218
2219
2220
2221
2222
2223
2224
2225
  		return;
  
  	ev = kzalloc(sizeof(*ev), GFP_KERNEL);
  	if (!ev) {
  		pr_warn("%s: failed to initialize events
  ", disk->disk_name);
  		return;
  	}
77ea887e4   Tejun Heo   implement in-kern...
2226
2227
2228
  	INIT_LIST_HEAD(&ev->node);
  	ev->disk = disk;
  	spin_lock_init(&ev->lock);
fdd514e16   Tejun Heo   block: make disk_...
2229
  	mutex_init(&ev->block_mutex);
77ea887e4   Tejun Heo   implement in-kern...
2230
2231
2232
  	ev->block = 1;
  	ev->poll_msecs = -1;
  	INIT_DELAYED_WORK(&ev->dwork, disk_events_workfn);
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
2233
2234
2235
2236
2237
  	disk->ev = ev;
  }
  
  static void disk_add_events(struct gendisk *disk)
  {
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
2238
2239
2240
2241
2242
  	/* FIXME: error handling */
  	if (sysfs_create_files(&disk_to_dev(disk)->kobj, disk_events_attrs) < 0)
  		pr_warn("%s: failed to create sysfs files for events
  ",
  			disk->disk_name);
cdf3e3deb   Martin Wilck   block: check_even...
2243
2244
  	if (!disk->ev)
  		return;
77ea887e4   Tejun Heo   implement in-kern...
2245
  	mutex_lock(&disk_events_mutex);
9f53d2fe8   Stanislaw Gruszka   block: fix __blkd...
2246
  	list_add_tail(&disk->ev->node, &disk_events);
77ea887e4   Tejun Heo   implement in-kern...
2247
2248
2249
2250
2251
2252
2253
2254
2255
2256
2257
  	mutex_unlock(&disk_events_mutex);
  
  	/*
  	 * Block count is initialized to 1 and the following initial
  	 * unblock kicks it into action.
  	 */
  	__disk_unblock_events(disk, true);
  }
  
  static void disk_del_events(struct gendisk *disk)
  {
cdf3e3deb   Martin Wilck   block: check_even...
2258
2259
  	if (disk->ev) {
  		disk_block_events(disk);
77ea887e4   Tejun Heo   implement in-kern...
2260

cdf3e3deb   Martin Wilck   block: check_even...
2261
2262
2263
2264
  		mutex_lock(&disk_events_mutex);
  		list_del_init(&disk->ev->node);
  		mutex_unlock(&disk_events_mutex);
  	}
77ea887e4   Tejun Heo   implement in-kern...
2265
2266
2267
2268
2269
2270
2271
2272
2273
2274
  
  	sysfs_remove_files(&disk_to_dev(disk)->kobj, disk_events_attrs);
  }
  
  static void disk_release_events(struct gendisk *disk)
  {
  	/* the block count should be 1 from disk_del_events() */
  	WARN_ON_ONCE(disk->ev && disk->ev->block != 1);
  	kfree(disk->ev);
  }