Blame view

block/blk-cgroup.c 38.4 KB
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1
2
3
4
5
6
7
8
9
10
11
12
13
  /*
   * Common Block IO controller cgroup interface
   *
   * Based on ideas and code from CFQ, CFS and BFQ:
   * Copyright (C) 2003 Jens Axboe <axboe@kernel.dk>
   *
   * Copyright (C) 2008 Fabio Checconi <fabio@gandalf.sssup.it>
   *		      Paolo Valente <paolo.valente@unimore.it>
   *
   * Copyright (C) 2009 Vivek Goyal <vgoyal@redhat.com>
   * 	              Nauman Rafique <nauman@google.com>
   */
  #include <linux/ioprio.h>
220841906   Vivek Goyal   blkio: Export dis...
14
15
  #include <linux/seq_file.h>
  #include <linux/kdev_t.h>
9d6a986c0   Vivek Goyal   blkio: Export som...
16
  #include <linux/module.h>
accee7854   Stephen Rothwell   block: include li...
17
  #include <linux/err.h>
9195291e5   Divyesh Shah   blkio: Increment ...
18
  #include <linux/blkdev.h>
5a0e3ad6a   Tejun Heo   include cleanup: ...
19
  #include <linux/slab.h>
31e4c28d9   Vivek Goyal   blkio: Introduce ...
20
  #include "blk-cgroup.h"
34d0f179d   Gui Jianfeng   io-controller: Ad...
21
  #include <linux/genhd.h>
3e2520668   Vivek Goyal   blkio: Implement ...
22

84c124da9   Divyesh Shah   blkio: Changes to...
23
  /* Size, in bytes, of the on-stack buffer used to build stat key strings */
  #define MAX_KEY_LEN 100
3e2520668   Vivek Goyal   blkio: Implement ...
24
25
  /*
   * blkio_list links the struct blkio_policy_type entries (through ->list)
   * that the blkio_update_group_*() helpers in this file walk.
   * NOTE(review): blkio_list_lock presumably serialises changes to blkio_list;
   * its users are outside this excerpt -- confirm.
   */
  static DEFINE_SPINLOCK(blkio_list_lock);
  static LIST_HEAD(blkio_list);
b1c357696   Vivek Goyal   blkio: Take care ...
26

31e4c28d9   Vivek Goyal   blkio: Introduce ...
27
  /* Root blkio cgroup; its weight starts at twice BLKIO_WEIGHT_DEFAULT */
  struct blkio_cgroup blkio_root_cgroup = { .weight = 2*BLKIO_WEIGHT_DEFAULT };
9d6a986c0   Vivek Goyal   blkio: Export som...
28
  EXPORT_SYMBOL_GPL(blkio_root_cgroup);
67523c48a   Ben Blum   cgroups: blkio su...
29
30
31
32
33
34
35
36
  /*
   * Forward declarations of the cgroup subsystem callbacks that are wired
   * into blkio_subsys below.
   */
  static struct cgroup_subsys_state *blkiocg_create(struct cgroup_subsys *,
  						  struct cgroup *);
  static int blkiocg_can_attach(struct cgroup_subsys *, struct cgroup *,
  			      struct task_struct *, bool);
  static void blkiocg_attach(struct cgroup_subsys *, struct cgroup *,
  			   struct cgroup *, struct task_struct *, bool);
  static void blkiocg_destroy(struct cgroup_subsys *, struct cgroup *);
  static int blkiocg_populate(struct cgroup_subsys *, struct cgroup *);
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
37
38
39
40
41
  /*
   * Encoding of the cft->private value of a cgroup file: @x (the owning
   * policy) goes into the bits above bit 15, @val (the per-policy file
   * attribute) is OR-ed into the low bits.
   */
  #define BLKIOFILE_PRIVATE(x, val)	(((x) << 16) | (val))
  /* What policy owns the file, proportional or throttle (bits 16..31) */
  #define BLKIOFILE_POLICY(val)		(((val) >> 16) & 0xffff)
  /* Which attribute of that policy the file represents (bits 0..15) */
  #define BLKIOFILE_ATTR(val)		((val) & 0xffff)
67523c48a   Ben Blum   cgroups: blkio su...
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
  /*
   * cgroup subsystem descriptor for "blkio": hooks the create/can_attach/
   * attach/destroy/populate callbacks declared above into the cgroup core.
   */
  struct cgroup_subsys blkio_subsys = {
  	.name = "blkio",
  	.create = blkiocg_create,
  	.can_attach = blkiocg_can_attach,
  	.attach = blkiocg_attach,
  	.destroy = blkiocg_destroy,
  	.populate = blkiocg_populate,
  #ifdef CONFIG_BLK_CGROUP
  	/* note: blkio_subsys_id is otherwise defined in blk-cgroup.h */
  	.subsys_id = blkio_subsys_id,
  #endif
  	.use_id = 1,
  	.module = THIS_MODULE,
  };
  EXPORT_SYMBOL_GPL(blkio_subsys);
34d0f179d   Gui Jianfeng   io-controller: Ad...
57
58
59
60
61
  /*
   * Add policy node @pn at the head of @blkcg's policy_list.
   * NOTE(review): the sibling delete/search helpers require blkcg->lock;
   * presumably the same holds here -- confirm against the callers.
   */
  static inline void blkio_policy_insert_node(struct blkio_cgroup *blkcg,
  					    struct blkio_policy_node *pn)
  {
  	list_add(&pn->node, &blkcg->policy_list);
  }
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
  static inline bool cftype_blkg_same_policy(struct cftype *cft,
  			struct blkio_group *blkg)
  {
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  
  	if (blkg->plid == plid)
  		return 1;
  
  	return 0;
  }
  
  /* Determines if policy node matches cgroup file being accessed */
  static inline bool pn_matches_cftype(struct cftype *cft,
  			struct blkio_policy_node *pn)
  {
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int fileid = BLKIOFILE_ATTR(cft->private);
  
  	return (plid == pn->plid && fileid == pn->fileid);
  }
34d0f179d   Gui Jianfeng   io-controller: Ad...
82
83
84
85
86
87
88
89
  /*
   * Unlink policy node @pn from the policy list it is on. The node itself is
   * not freed here.
   * Must be called with blkcg->lock held.
   */
  static inline void blkio_policy_delete_node(struct blkio_policy_node *pn)
  {
  	list_del(&pn->node);
  }
  
  /* Must be called with blkcg->lock held */
  static struct blkio_policy_node *
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
90
91
  blkio_policy_search_node(const struct blkio_cgroup *blkcg, dev_t dev,
  		enum blkio_policy_id plid, int fileid)
34d0f179d   Gui Jianfeng   io-controller: Ad...
92
93
94
95
  {
  	struct blkio_policy_node *pn;
  
  	list_for_each_entry(pn, &blkcg->policy_list, node) {
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
96
  		if (pn->dev == dev && pn->plid == plid && pn->fileid == fileid)
34d0f179d   Gui Jianfeng   io-controller: Ad...
97
98
99
100
101
  			return pn;
  	}
  
  	return NULL;
  }
31e4c28d9   Vivek Goyal   blkio: Introduce ...
102
103
104
105
106
  /*
   * Map @cgroup to its blkio_cgroup: fetch the cgroup's subsystem state for
   * blkio_subsys_id and return the blkio_cgroup that embeds it as ->css.
   */
  struct blkio_cgroup *cgroup_to_blkio_cgroup(struct cgroup *cgroup)
  {
  	return container_of(cgroup_subsys_state(cgroup, blkio_subsys_id),
  			    struct blkio_cgroup, css);
  }
9d6a986c0   Vivek Goyal   blkio: Export som...
107
  EXPORT_SYMBOL_GPL(cgroup_to_blkio_cgroup);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
108

062a644d6   Vivek Goyal   blk-cgroup: Prepa...
109
110
111
112
113
114
115
116
117
118
  /*
   * Push a new @weight for @blkg to every policy on blkio_list that owns the
   * group (same plid) and provides a weight-update callback.
   */
  static inline void
  blkio_update_group_weight(struct blkio_group *blkg, unsigned int weight)
  {
  	struct blkio_policy_type *pol;
  
  	list_for_each_entry(pol, &blkio_list, list) {
  		/* Only the owning policy is told about the change */
  		if (pol->plid == blkg->plid &&
  		    pol->ops.blkio_update_group_weight_fn)
  			pol->ops.blkio_update_group_weight_fn(blkg->key,
  							blkg, weight);
  	}
  }
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
123
124
125
126
127
128
129
130
131
132
133
134
135
  /*
   * Push a new bytes-per-second limit for @blkg to the owning policy.
   * @fileid selects the direction: BLKIO_THROTL_read_bps_device calls the
   * read callback, BLKIO_THROTL_write_bps_device the write callback; any
   * other value results in no call.
   */
  static inline void blkio_update_group_bps(struct blkio_group *blkg, u64 bps,
  				int fileid)
  {
  	struct blkio_policy_type *pol;
  	bool for_read = (fileid == BLKIO_THROTL_read_bps_device);
  	bool for_write = (fileid == BLKIO_THROTL_write_bps_device);
  
  	list_for_each_entry(pol, &blkio_list, list) {
  		/* Policies that do not own the blkg get no updates */
  		if (pol->plid != blkg->plid)
  			continue;
  
  		if (for_read && pol->ops.blkio_update_group_read_bps_fn)
  			pol->ops.blkio_update_group_read_bps_fn(blkg->key,
  								blkg, bps);
  
  		if (for_write && pol->ops.blkio_update_group_write_bps_fn)
  			pol->ops.blkio_update_group_write_bps_fn(blkg->key,
  								blkg, bps);
  	}
  }
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
145
146
147
148
149
150
151
152
153
154
155
156
157
  static inline void blkio_update_group_iops(struct blkio_group *blkg,
  			unsigned int iops, int fileid)
  {
  	struct blkio_policy_type *blkiop;
  
  	list_for_each_entry(blkiop, &blkio_list, list) {
  
  		/* If this policy does not own the blkg, do not send updates */
  		if (blkiop->plid != blkg->plid)
  			continue;
  
  		if (fileid == BLKIO_THROTL_read_iops_device
  		    && blkiop->ops.blkio_update_group_read_iops_fn)
fe0714377   Vivek Goyal   blkio: Recalculat...
158
159
  			blkiop->ops.blkio_update_group_read_iops_fn(blkg->key,
  								blkg, iops);
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
160
161
162
  
  		if (fileid == BLKIO_THROTL_write_iops_device
  		    && blkiop->ops.blkio_update_group_write_iops_fn)
fe0714377   Vivek Goyal   blkio: Recalculat...
163
164
  			blkiop->ops.blkio_update_group_write_iops_fn(blkg->key,
  								blkg,iops);
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
165
166
  	}
  }
9195291e5   Divyesh Shah   blkio: Increment ...
167
168
169
170
  /*
   * Add to the appropriate stat variable depending on the request type.
   * This should be called with the blkg->stats_lock held.
   */
84c124da9   Divyesh Shah   blkio: Changes to...
171
172
  static void blkio_add_stat(uint64_t *stat, uint64_t add, bool direction,
  				bool sync)
9195291e5   Divyesh Shah   blkio: Increment ...
173
  {
84c124da9   Divyesh Shah   blkio: Changes to...
174
175
  	if (direction)
  		stat[BLKIO_STAT_WRITE] += add;
9195291e5   Divyesh Shah   blkio: Increment ...
176
  	else
84c124da9   Divyesh Shah   blkio: Changes to...
177
178
179
  		stat[BLKIO_STAT_READ] += add;
  	if (sync)
  		stat[BLKIO_STAT_SYNC] += add;
9195291e5   Divyesh Shah   blkio: Increment ...
180
  	else
84c124da9   Divyesh Shah   blkio: Changes to...
181
  		stat[BLKIO_STAT_ASYNC] += add;
9195291e5   Divyesh Shah   blkio: Increment ...
182
  }
cdc1184cf   Divyesh Shah   blkio: Add io_que...
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
  /*
   * Drop one request from the per-request-type counters of @stat: the
   * WRITE or READ slot (chosen by @direction) and the SYNC or ASYNC slot
   * (chosen by @sync). A slot that is already zero triggers BUG_ON().
   * This should be called with the blkg->stats_lock held.
   */
  static void blkio_check_and_dec_stat(uint64_t *stat, bool direction, bool sync)
  {
  	int rw_slot = direction ? BLKIO_STAT_WRITE : BLKIO_STAT_READ;
  	int sync_slot = sync ? BLKIO_STAT_SYNC : BLKIO_STAT_ASYNC;
  
  	BUG_ON(stat[rw_slot] == 0);
  	stat[rw_slot]--;
  
  	BUG_ON(stat[sync_slot] == 0);
  	stat[sync_slot]--;
  }
  
  #ifdef CONFIG_DEBUG_BLK_CGROUP
812df48d1   Divyesh Shah   blkio: Add more d...
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
  /* This should be called with the blkg->stats_lock held. */
  static void blkio_set_start_group_wait_time(struct blkio_group *blkg,
  						struct blkio_group *curr_blkg)
  {
  	if (blkio_blkg_waiting(&blkg->stats))
  		return;
  	if (blkg == curr_blkg)
  		return;
  	blkg->stats.start_group_wait_time = sched_clock();
  	blkio_mark_blkg_waiting(&blkg->stats);
  }
  
  /*
   * If the group is marked waiting, add the time elapsed since
   * start_group_wait_time to group_wait_time and clear the waiting mark.
   * This should be called with the blkg->stats_lock held.
   */
  static void blkio_update_group_wait_time(struct blkio_group_stats *stats)
  {
  	unsigned long long now;
  
  	if (blkio_blkg_waiting(stats)) {
  		now = sched_clock();
  		/* Only account when the clock actually moved forward */
  		if (time_after64(now, stats->start_group_wait_time))
  			stats->group_wait_time +=
  				now - stats->start_group_wait_time;
  		blkio_clear_blkg_waiting(stats);
  	}
  }
  
  /*
   * If the group is marked empty, add the time elapsed since
   * start_empty_time to empty_time and clear the empty mark.
   * This should be called with the blkg->stats_lock held.
   */
  static void blkio_end_empty_time(struct blkio_group_stats *stats)
  {
  	unsigned long long now;
  
  	if (blkio_blkg_empty(stats)) {
  		now = sched_clock();
  		/* Only account when the clock actually moved forward */
  		if (time_after64(now, stats->start_empty_time))
  			stats->empty_time += now - stats->start_empty_time;
  		blkio_clear_blkg_empty(stats);
  	}
  }
  
  void blkiocg_update_set_idle_time_stats(struct blkio_group *blkg)
  {
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	BUG_ON(blkio_blkg_idling(&blkg->stats));
  	blkg->stats.start_idle_time = sched_clock();
  	blkio_mark_blkg_idling(&blkg->stats);
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
  EXPORT_SYMBOL_GPL(blkiocg_update_set_idle_time_stats);
  
  /*
   * If @blkg is marked idling, add the time elapsed since start_idle_time to
   * idle_time and clear the idling mark. Takes blkg->stats_lock.
   */
  void blkiocg_update_idle_time_stats(struct blkio_group *blkg)
  {
  	struct blkio_group_stats *stats = &blkg->stats;
  	unsigned long long now;
  	unsigned long irq_flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, irq_flags);
  	if (!blkio_blkg_idling(stats))
  		goto unlock;
  
  	now = sched_clock();
  	/* Only account when the clock actually moved forward */
  	if (time_after64(now, stats->start_idle_time))
  		stats->idle_time += now - stats->start_idle_time;
  	blkio_clear_blkg_idling(stats);
  unlock:
  	spin_unlock_irqrestore(&blkg->stats_lock, irq_flags);
  }
  EXPORT_SYMBOL_GPL(blkiocg_update_idle_time_stats);
a11cdaa7a   Divyesh Shah   block: Update to ...
276
  void blkiocg_update_avg_queue_size_stats(struct blkio_group *blkg)
cdc1184cf   Divyesh Shah   blkio: Add io_que...
277
278
279
280
281
282
283
284
285
286
  {
  	unsigned long flags;
  	struct blkio_group_stats *stats;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	stats = &blkg->stats;
  	stats->avg_queue_size_sum +=
  			stats->stat_arr[BLKIO_STAT_QUEUED][BLKIO_STAT_READ] +
  			stats->stat_arr[BLKIO_STAT_QUEUED][BLKIO_STAT_WRITE];
  	stats->avg_queue_size_samples++;
812df48d1   Divyesh Shah   blkio: Add more d...
287
  	blkio_update_group_wait_time(stats);
cdc1184cf   Divyesh Shah   blkio: Add io_que...
288
289
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
a11cdaa7a   Divyesh Shah   block: Update to ...
290
  EXPORT_SYMBOL_GPL(blkiocg_update_avg_queue_size_stats);
e5ff082e8   Vivek Goyal   blkio: Fix anothe...
291
  void blkiocg_set_start_empty_time(struct blkio_group *blkg)
28baf4429   Divyesh Shah   blkio: Fix compil...
292
293
294
295
296
297
298
299
300
301
302
303
304
305
  {
  	unsigned long flags;
  	struct blkio_group_stats *stats;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	stats = &blkg->stats;
  
  	if (stats->stat_arr[BLKIO_STAT_QUEUED][BLKIO_STAT_READ] ||
  			stats->stat_arr[BLKIO_STAT_QUEUED][BLKIO_STAT_WRITE]) {
  		spin_unlock_irqrestore(&blkg->stats_lock, flags);
  		return;
  	}
  
  	/*
e5ff082e8   Vivek Goyal   blkio: Fix anothe...
306
307
308
  	 * group is already marked empty. This can happen if cfqq got new
  	 * request in parent group and moved to this group while being added
  	 * to service tree. Just ignore the event and move on.
28baf4429   Divyesh Shah   blkio: Fix compil...
309
  	 */
e5ff082e8   Vivek Goyal   blkio: Fix anothe...
310
311
312
313
  	if(blkio_blkg_empty(stats)) {
  		spin_unlock_irqrestore(&blkg->stats_lock, flags);
  		return;
  	}
28baf4429   Divyesh Shah   blkio: Fix compil...
314
315
316
317
318
  	stats->start_empty_time = sched_clock();
  	blkio_mark_blkg_empty(stats);
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
  EXPORT_SYMBOL_GPL(blkiocg_set_start_empty_time);
a11cdaa7a   Divyesh Shah   block: Update to ...
319
320
321
322
323
324
  /*
   * Add @dequeue to the dequeue counter of @blkg.
   * NOTE(review): unlike the other stat updaters in this file this one does
   * not take blkg->stats_lock; presumably callers provide the serialisation
   * -- confirm.
   */
  void blkiocg_update_dequeue_stats(struct blkio_group *blkg,
  			unsigned long dequeue)
  {
  	blkg->stats.dequeue += dequeue;
  }
  EXPORT_SYMBOL_GPL(blkiocg_update_dequeue_stats);
812df48d1   Divyesh Shah   blkio: Add more d...
325
326
327
328
  #else
  /*
   * Without CONFIG_DEBUG_BLK_CGROUP the group-wait and empty-time accounting
   * is compiled out; these empty stubs keep the callers below unconditional.
   */
  static inline void blkio_set_start_group_wait_time(struct blkio_group *blkg,
  					struct blkio_group *curr_blkg) {}
  static inline void blkio_end_empty_time(struct blkio_group_stats *stats) {}
cdc1184cf   Divyesh Shah   blkio: Add io_que...
329
  #endif
a11cdaa7a   Divyesh Shah   block: Update to ...
330
  void blkiocg_update_io_add_stats(struct blkio_group *blkg,
cdc1184cf   Divyesh Shah   blkio: Add io_que...
331
332
333
334
335
336
337
338
  			struct blkio_group *curr_blkg, bool direction,
  			bool sync)
  {
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	blkio_add_stat(blkg->stats.stat_arr[BLKIO_STAT_QUEUED], 1, direction,
  			sync);
812df48d1   Divyesh Shah   blkio: Add more d...
339
340
  	blkio_end_empty_time(&blkg->stats);
  	blkio_set_start_group_wait_time(blkg, curr_blkg);
cdc1184cf   Divyesh Shah   blkio: Add io_que...
341
342
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
a11cdaa7a   Divyesh Shah   block: Update to ...
343
  EXPORT_SYMBOL_GPL(blkiocg_update_io_add_stats);
cdc1184cf   Divyesh Shah   blkio: Add io_que...
344

a11cdaa7a   Divyesh Shah   block: Update to ...
345
  void blkiocg_update_io_remove_stats(struct blkio_group *blkg,
cdc1184cf   Divyesh Shah   blkio: Add io_que...
346
347
348
349
350
351
352
353
354
  						bool direction, bool sync)
  {
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	blkio_check_and_dec_stat(blkg->stats.stat_arr[BLKIO_STAT_QUEUED],
  					direction, sync);
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
a11cdaa7a   Divyesh Shah   block: Update to ...
355
  EXPORT_SYMBOL_GPL(blkiocg_update_io_remove_stats);
cdc1184cf   Divyesh Shah   blkio: Add io_que...
356

303a3acb2   Divyesh Shah   blkio: Add io con...
357
  void blkiocg_update_timeslice_used(struct blkio_group *blkg, unsigned long time)
220841906   Vivek Goyal   blkio: Export dis...
358
  {
303a3acb2   Divyesh Shah   blkio: Add io con...
359
360
361
362
363
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	blkg->stats.time += time;
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
220841906   Vivek Goyal   blkio: Export dis...
364
  }
303a3acb2   Divyesh Shah   blkio: Add io con...
365
  EXPORT_SYMBOL_GPL(blkiocg_update_timeslice_used);
220841906   Vivek Goyal   blkio: Export dis...
366

84c124da9   Divyesh Shah   blkio: Changes to...
367
368
  void blkiocg_update_dispatch_stats(struct blkio_group *blkg,
  				uint64_t bytes, bool direction, bool sync)
9195291e5   Divyesh Shah   blkio: Increment ...
369
370
371
372
373
374
  {
  	struct blkio_group_stats *stats;
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	stats = &blkg->stats;
84c124da9   Divyesh Shah   blkio: Changes to...
375
376
377
378
379
  	stats->sectors += bytes >> 9;
  	blkio_add_stat(stats->stat_arr[BLKIO_STAT_SERVICED], 1, direction,
  			sync);
  	blkio_add_stat(stats->stat_arr[BLKIO_STAT_SERVICE_BYTES], bytes,
  			direction, sync);
9195291e5   Divyesh Shah   blkio: Increment ...
380
381
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
84c124da9   Divyesh Shah   blkio: Changes to...
382
  EXPORT_SYMBOL_GPL(blkiocg_update_dispatch_stats);
9195291e5   Divyesh Shah   blkio: Increment ...
383

84c124da9   Divyesh Shah   blkio: Changes to...
384
385
  void blkiocg_update_completion_stats(struct blkio_group *blkg,
  	uint64_t start_time, uint64_t io_start_time, bool direction, bool sync)
9195291e5   Divyesh Shah   blkio: Increment ...
386
387
388
389
390
391
392
  {
  	struct blkio_group_stats *stats;
  	unsigned long flags;
  	unsigned long long now = sched_clock();
  
  	spin_lock_irqsave(&blkg->stats_lock, flags);
  	stats = &blkg->stats;
84c124da9   Divyesh Shah   blkio: Changes to...
393
394
395
396
397
398
  	if (time_after64(now, io_start_time))
  		blkio_add_stat(stats->stat_arr[BLKIO_STAT_SERVICE_TIME],
  				now - io_start_time, direction, sync);
  	if (time_after64(io_start_time, start_time))
  		blkio_add_stat(stats->stat_arr[BLKIO_STAT_WAIT_TIME],
  				io_start_time - start_time, direction, sync);
9195291e5   Divyesh Shah   blkio: Increment ...
399
400
  	spin_unlock_irqrestore(&blkg->stats_lock, flags);
  }
84c124da9   Divyesh Shah   blkio: Changes to...
401
  EXPORT_SYMBOL_GPL(blkiocg_update_completion_stats);
9195291e5   Divyesh Shah   blkio: Increment ...
402

812d40264   Divyesh Shah   blkio: Add io_mer...
403
404
405
406
407
408
409
410
411
412
413
  /*
   * Account one merged request for @blkg in the MERGED counters selected by
   * @direction and @sync. Takes blkg->stats_lock.
   */
  void blkiocg_update_io_merged_stats(struct blkio_group *blkg, bool direction,
  					bool sync)
  {
  	uint64_t *merged = blkg->stats.stat_arr[BLKIO_STAT_MERGED];
  	unsigned long irq_flags;
  
  	spin_lock_irqsave(&blkg->stats_lock, irq_flags);
  	blkio_add_stat(merged, 1, direction, sync);
  	spin_unlock_irqrestore(&blkg->stats_lock, irq_flags);
  }
  EXPORT_SYMBOL_GPL(blkiocg_update_io_merged_stats);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
414
  /*
   * Initialise @blkg and link it onto @blkcg's group list.
   *
   * Under blkcg->lock: the group's stats_lock is initialised, @key is
   * published with rcu_assign_pointer(), the css id of @blkcg is recorded,
   * the group is inserted into blkcg->blkg_list with an RCU-safe add and
   * @plid is stored. After the lock is dropped the cgroup path is copied
   * into blkg->path and @dev is recorded.
   */
  void blkiocg_add_blkio_group(struct blkio_cgroup *blkcg,
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
415
416
  		struct blkio_group *blkg, void *key, dev_t dev,
  		enum blkio_policy_id plid)
31e4c28d9   Vivek Goyal   blkio: Introduce ...
417
418
419
420
  {
  	unsigned long flags;
  
  	spin_lock_irqsave(&blkcg->lock, flags);
8d2a91f89   Divyesh Shah   blkio: Initialize...
421
  	spin_lock_init(&blkg->stats_lock);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
422
  	rcu_assign_pointer(blkg->key, key);
b1c357696   Vivek Goyal   blkio: Take care ...
423
  	blkg->blkcg_id = css_id(&blkcg->css);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
424
  	hlist_add_head_rcu(&blkg->blkcg_node, &blkcg->blkg_list);
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
425
  	blkg->plid = plid;
31e4c28d9   Vivek Goyal   blkio: Introduce ...
426
  	spin_unlock_irqrestore(&blkcg->lock, flags);
2868ef7b3   Vivek Goyal   blkio: Some debug...
427
428
  	/* Need to take css reference ? */
  	cgroup_path(blkcg->css.cgroup, blkg->path, sizeof(blkg->path));
220841906   Vivek Goyal   blkio: Export dis...
429
  	blkg->dev = dev;
31e4c28d9   Vivek Goyal   blkio: Introduce ...
430
  }
9d6a986c0   Vivek Goyal   blkio: Export som...
431
  EXPORT_SYMBOL_GPL(blkiocg_add_blkio_group);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
432

b1c357696   Vivek Goyal   blkio: Take care ...
433
434
435
436
437
438
439
440
441
442
  /*
   * Unhash @blkg from its cgroup's group list (RCU-safe, node re-initialised)
   * and clear the recorded cgroup id. The only caller in view,
   * blkiocg_del_blkio_group(), holds blkcg->lock around this.
   */
  static void __blkiocg_del_blkio_group(struct blkio_group *blkg)
  {
  	hlist_del_init_rcu(&blkg->blkcg_node);
  	blkg->blkcg_id = 0;
  }
  
  /*
   * returns 0 if blkio_group was still on cgroup list. Otherwise returns 1
   * indicating that blk_group was unhashed by the time we got to it.
   */
31e4c28d9   Vivek Goyal   blkio: Introduce ...
443
444
  int blkiocg_del_blkio_group(struct blkio_group *blkg)
  {
b1c357696   Vivek Goyal   blkio: Take care ...
445
446
447
448
449
450
451
  	struct blkio_cgroup *blkcg;
  	unsigned long flags;
  	struct cgroup_subsys_state *css;
  	int ret = 1;
  
  	rcu_read_lock();
  	css = css_lookup(&blkio_subsys, blkg->blkcg_id);
0f3942a39   Jens Axboe   block: kill some ...
452
453
454
455
456
457
458
459
  	if (css) {
  		blkcg = container_of(css, struct blkio_cgroup, css);
  		spin_lock_irqsave(&blkcg->lock, flags);
  		if (!hlist_unhashed(&blkg->blkcg_node)) {
  			__blkiocg_del_blkio_group(blkg);
  			ret = 0;
  		}
  		spin_unlock_irqrestore(&blkcg->lock, flags);
b1c357696   Vivek Goyal   blkio: Take care ...
460
  	}
0f3942a39   Jens Axboe   block: kill some ...
461

b1c357696   Vivek Goyal   blkio: Take care ...
462
463
  	rcu_read_unlock();
  	return ret;
31e4c28d9   Vivek Goyal   blkio: Introduce ...
464
  }
9d6a986c0   Vivek Goyal   blkio: Export som...
465
  EXPORT_SYMBOL_GPL(blkiocg_del_blkio_group);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
  
  /*
   * Walk @blkcg's group list and return the first group whose key equals
   * @key, or NULL if there is none.
   * Called under rcu_read_lock().
   */
  struct blkio_group *blkiocg_lookup_group(struct blkio_cgroup *blkcg, void *key)
  {
  	struct blkio_group *grp;
  	struct hlist_node *pos;
  
  	hlist_for_each_entry_rcu(grp, pos, &blkcg->blkg_list, blkcg_node) {
  		if (grp->key == key)
  			return grp;
  	}
  
  	return NULL;
  }
9d6a986c0   Vivek Goyal   blkio: Export som...
482
  EXPORT_SYMBOL_GPL(blkiocg_lookup_group);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
483

303a3acb2   Divyesh Shah   blkio: Add io con...
484
  static int
84c124da9   Divyesh Shah   blkio: Changes to...
485
  blkiocg_reset_stats(struct cgroup *cgroup, struct cftype *cftype, u64 val)
303a3acb2   Divyesh Shah   blkio: Add io con...
486
487
488
  {
  	struct blkio_cgroup *blkcg;
  	struct blkio_group *blkg;
812df48d1   Divyesh Shah   blkio: Add more d...
489
  	struct blkio_group_stats *stats;
303a3acb2   Divyesh Shah   blkio: Add io con...
490
  	struct hlist_node *n;
cdc1184cf   Divyesh Shah   blkio: Add io_que...
491
492
  	uint64_t queued[BLKIO_STAT_TOTAL];
  	int i;
812df48d1   Divyesh Shah   blkio: Add more d...
493
494
495
496
  #ifdef CONFIG_DEBUG_BLK_CGROUP
  	bool idling, waiting, empty;
  	unsigned long long now = sched_clock();
  #endif
303a3acb2   Divyesh Shah   blkio: Add io con...
497
498
499
500
501
  
  	blkcg = cgroup_to_blkio_cgroup(cgroup);
  	spin_lock_irq(&blkcg->lock);
  	hlist_for_each_entry(blkg, n, &blkcg->blkg_list, blkcg_node) {
  		spin_lock(&blkg->stats_lock);
812df48d1   Divyesh Shah   blkio: Add more d...
502
503
504
505
506
507
  		stats = &blkg->stats;
  #ifdef CONFIG_DEBUG_BLK_CGROUP
  		idling = blkio_blkg_idling(stats);
  		waiting = blkio_blkg_waiting(stats);
  		empty = blkio_blkg_empty(stats);
  #endif
cdc1184cf   Divyesh Shah   blkio: Add io_que...
508
  		for (i = 0; i < BLKIO_STAT_TOTAL; i++)
812df48d1   Divyesh Shah   blkio: Add more d...
509
510
  			queued[i] = stats->stat_arr[BLKIO_STAT_QUEUED][i];
  		memset(stats, 0, sizeof(struct blkio_group_stats));
cdc1184cf   Divyesh Shah   blkio: Add io_que...
511
  		for (i = 0; i < BLKIO_STAT_TOTAL; i++)
812df48d1   Divyesh Shah   blkio: Add more d...
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
  			stats->stat_arr[BLKIO_STAT_QUEUED][i] = queued[i];
  #ifdef CONFIG_DEBUG_BLK_CGROUP
  		if (idling) {
  			blkio_mark_blkg_idling(stats);
  			stats->start_idle_time = now;
  		}
  		if (waiting) {
  			blkio_mark_blkg_waiting(stats);
  			stats->start_group_wait_time = now;
  		}
  		if (empty) {
  			blkio_mark_blkg_empty(stats);
  			stats->start_empty_time = now;
  		}
  #endif
303a3acb2   Divyesh Shah   blkio: Add io con...
527
528
529
530
531
  		spin_unlock(&blkg->stats_lock);
  	}
  	spin_unlock_irq(&blkcg->lock);
  	return 0;
  }
84c124da9   Divyesh Shah   blkio: Changes to...
532
533
  /*
   * Build the key under which a statistic is reported.
   *
   * @type:          sub-type whose name is appended after the device
   *                 (ignored when @diskname_only is set)
   * @dev:           device the statistic belongs to
   * @str:           destination buffer
   * @chars_left:    size of @str in bytes
   * @diskname_only: emit only "<major>:<minor>" without a sub-type suffix
   *
   * The result is "<major>:<minor>" optionally followed by one of " Read",
   * " Write", " Sync", " Async", " Total" or " Invalid". If the device part
   * does not fit, a warning is logged and nothing is appended.
   */
  static void blkio_get_key_name(enum stat_sub_type type, dev_t dev, char *str,
  				int chars_left, bool diskname_only)
  {
  	const char *suffix;
  	int len;
  
  	if (chars_left <= 0)
  		goto bad_format;
  
  	/*
  	 * snprintf() returns the length the complete string needs, so a
  	 * result >= the buffer size is the truncation signal. strlen() of
  	 * the already-truncated output can never reach the buffer size.
  	 */
  	len = snprintf(str, chars_left, "%u:%u", MAJOR(dev), MINOR(dev));
  	if (len >= chars_left)
  		goto bad_format;
  
  	if (diskname_only)
  		return;
  
  	switch (type) {
  	case BLKIO_STAT_READ:
  		suffix = " Read";
  		break;
  	case BLKIO_STAT_WRITE:
  		suffix = " Write";
  		break;
  	case BLKIO_STAT_SYNC:
  		suffix = " Sync";
  		break;
  	case BLKIO_STAT_ASYNC:
  		suffix = " Async";
  		break;
  	case BLKIO_STAT_TOTAL:
  		suffix = " Total";
  		break;
  	default:
  		suffix = " Invalid";
  		break;
  	}
  
  	/* strlcat() wants the total size of @str, not the space still free */
  	strlcat(str, suffix, chars_left);
  	return;
  
  bad_format:
  	printk(KERN_WARNING
  		"Possibly incorrect cgroup stat display format\n");
  }
84c124da9   Divyesh Shah   blkio: Changes to...
564
565
566
567
568
569
570
  /*
   * Report a single per-device value: format the "major:minor" key of @dev
   * into @str (at most @chars_left bytes, no sub-type suffix), hand the key
   * and @val to cb->fill() and return @val.
   */
  static uint64_t blkio_fill_stat(char *str, int chars_left, uint64_t val,
  				struct cgroup_map_cb *cb, dev_t dev)
  {
  	blkio_get_key_name(0, dev, str, chars_left, true);
  	cb->fill(cb, str, val);
  	return val;
  }
303a3acb2   Divyesh Shah   blkio: Add io con...
571

84c124da9   Divyesh Shah   blkio: Changes to...
572
573
574
  /*
   * Report statistic @type of @blkg for device @dev through @cb.
   *
   * Scalar statistics (time, sectors and, with CONFIG_DEBUG_BLK_CGROUP, the
   * average queue size, group wait, idle, empty and dequeue values) are
   * reported as one "major:minor" entry and that value is returned.
   * Every other @type is treated as an index into stats.stat_arr: one entry
   * per sub-type is reported, followed by a "Total" entry holding
   * READ + WRITE, which is also the return value.
   *
   * This should be called with blkg->stats_lock held.
   */
  static uint64_t blkio_get_stat(struct blkio_group *blkg,
  		struct cgroup_map_cb *cb, dev_t dev, enum stat_type type)
  {
  	struct blkio_group_stats *stats = &blkg->stats;
  	char key_str[MAX_KEY_LEN];
  	enum stat_sub_type sub;
  	uint64_t total;
  
  	switch (type) {
  	case BLKIO_STAT_TIME:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->time, cb, dev);
  	case BLKIO_STAT_SECTORS:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->sectors, cb, dev);
  #ifdef CONFIG_DEBUG_BLK_CGROUP
  	case BLKIO_STAT_AVG_QUEUE_SIZE: {
  		uint64_t avg = stats->avg_queue_size_sum;
  		uint64_t samples = stats->avg_queue_size_samples;
  
  		/*
  		 * No samples yet means an average of zero.
  		 * NOTE(review): do_div() presumably takes a 32-bit divisor;
  		 * confirm samples cannot exceed that range.
  		 */
  		if (samples)
  			do_div(avg, samples);
  		else
  			avg = 0;
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1, avg, cb, dev);
  	}
  	case BLKIO_STAT_GROUP_WAIT_TIME:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->group_wait_time, cb, dev);
  	case BLKIO_STAT_IDLE_TIME:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->idle_time, cb, dev);
  	case BLKIO_STAT_EMPTY_TIME:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->empty_time, cb, dev);
  	case BLKIO_STAT_DEQUEUE:
  		return blkio_fill_stat(key_str, MAX_KEY_LEN - 1,
  					stats->dequeue, cb, dev);
  #endif
  	default:
  		break;
  	}
  
  	/* Per-sub-type statistic: one line per sub-type, then the total */
  	for (sub = BLKIO_STAT_READ; sub < BLKIO_STAT_TOTAL; sub++) {
  		blkio_get_key_name(sub, dev, key_str, MAX_KEY_LEN, false);
  		cb->fill(cb, key_str, stats->stat_arr[type][sub]);
  	}
  
  	total = stats->stat_arr[type][BLKIO_STAT_READ] +
  			stats->stat_arr[type][BLKIO_STAT_WRITE];
  	blkio_get_key_name(BLKIO_STAT_TOTAL, dev, key_str, MAX_KEY_LEN, false);
  	cb->fill(cb, key_str, total);
  
  	return total;
  }
34d0f179d   Gui Jianfeng   io-controller: Ad...
621
622
623
624
625
626
627
628
629
630
631
632
633
  /*
   * Check that @dev names a whole disk known to the block layer.
   *
   * Returns 0 when get_gendisk() finds a disk for @dev and @dev is not a
   * partition of it, -ENODEV otherwise.
   */
  static int blkio_check_dev_num(dev_t dev)
  {
  	int part = 0;
  	struct gendisk *disk;
  	struct module *owner;
  
  	disk = get_gendisk(dev, &part);
  	if (!disk)
  		return -ENODEV;
  
  	/*
  	 * get_gendisk() hands back a referenced disk. Only the outcome of
  	 * the lookup is needed here, so the reference must be dropped again
  	 * or every rule written by the user leaks one.
  	 * NOTE(review): the lookup also pins disk->fops->owner in kernels of
  	 * this vintage, hence the module_put(); confirm for the target tree.
  	 */
  	owner = disk->fops->owner;
  	put_disk(disk);
  	module_put(owner);
  
  	if (part)
  		return -ENODEV;
  
  	return 0;
  }
  
  static int blkio_policy_parse_and_set(char *buf,
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
634
  	struct blkio_policy_node *newpn, enum blkio_policy_id plid, int fileid)
34d0f179d   Gui Jianfeng   io-controller: Ad...
635
636
637
638
639
640
  {
  	char *s[4], *p, *major_s = NULL, *minor_s = NULL;
  	int ret;
  	unsigned long major, minor, temp;
  	int i = 0;
  	dev_t dev;
9355aede5   Vivek Goyal   blkio-throttle: l...
641
  	u64 bps, iops;
34d0f179d   Gui Jianfeng   io-controller: Ad...
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
  
  	memset(s, 0, sizeof(s));
  
  	while ((p = strsep(&buf, " ")) != NULL) {
  		if (!*p)
  			continue;
  
  		s[i++] = p;
  
  		/* Prevent from inputing too many things */
  		if (i == 3)
  			break;
  	}
  
  	if (i != 2)
  		return -EINVAL;
  
  	p = strsep(&s[0], ":");
  	if (p != NULL)
  		major_s = p;
  	else
  		return -EINVAL;
  
  	minor_s = s[0];
  	if (!minor_s)
  		return -EINVAL;
  
  	ret = strict_strtoul(major_s, 10, &major);
  	if (ret)
  		return -EINVAL;
  
  	ret = strict_strtoul(minor_s, 10, &minor);
  	if (ret)
  		return -EINVAL;
  
  	dev = MKDEV(major, minor);
  
  	ret = blkio_check_dev_num(dev);
  	if (ret)
  		return ret;
  
  	newpn->dev = dev;
  
  	if (s[1] == NULL)
  		return -EINVAL;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
687
688
689
690
691
692
  	switch (plid) {
  	case BLKIO_POLICY_PROP:
  		ret = strict_strtoul(s[1], 10, &temp);
  		if (ret || (temp < BLKIO_WEIGHT_MIN && temp > 0) ||
  			temp > BLKIO_WEIGHT_MAX)
  			return -EINVAL;
34d0f179d   Gui Jianfeng   io-controller: Ad...
693

062a644d6   Vivek Goyal   blk-cgroup: Prepa...
694
695
  		newpn->plid = plid;
  		newpn->fileid = fileid;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
696
697
698
  		newpn->val.weight = temp;
  		break;
  	case BLKIO_POLICY_THROTL:
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
699
700
701
702
703
704
  		switch(fileid) {
  		case BLKIO_THROTL_read_bps_device:
  		case BLKIO_THROTL_write_bps_device:
  			ret = strict_strtoull(s[1], 10, &bps);
  			if (ret)
  				return -EINVAL;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
705

7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
706
707
708
709
710
711
  			newpn->plid = plid;
  			newpn->fileid = fileid;
  			newpn->val.bps = bps;
  			break;
  		case BLKIO_THROTL_read_iops_device:
  		case BLKIO_THROTL_write_iops_device:
9355aede5   Vivek Goyal   blkio-throttle: l...
712
  			ret = strict_strtoull(s[1], 10, &iops);
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
713
714
  			if (ret)
  				return -EINVAL;
9355aede5   Vivek Goyal   blkio-throttle: l...
715
716
  			if (iops > THROTL_IOPS_MAX)
  				return -EINVAL;
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
717
718
  			newpn->plid = plid;
  			newpn->fileid = fileid;
9355aede5   Vivek Goyal   blkio-throttle: l...
719
  			newpn->val.iops = (unsigned int)iops;
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
720
721
  			break;
  		}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
722
723
724
725
  		break;
  	default:
  		BUG();
  	}
34d0f179d   Gui Jianfeng   io-controller: Ad...
726
727
728
729
730
731
732
733
  
  	return 0;
  }
  
  /*
   * Return the weight to use for @dev in @blkcg: the value of the matching
   * weight_device rule if one exists, otherwise the cgroup-wide weight.
   */
  unsigned int blkcg_get_weight(struct blkio_cgroup *blkcg,
  			      dev_t dev)
  {
  	struct blkio_policy_node *rule;
  
  	rule = blkio_policy_search_node(blkcg, dev, BLKIO_POLICY_PROP,
  					BLKIO_PROP_weight_device);
  	if (!rule)
  		return blkcg->weight;
  
  	return rule->val.weight;
  }
  EXPORT_SYMBOL_GPL(blkcg_get_weight);
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
  /*
   * Return the read bytes-per-second value of the throttle rule for @dev in
   * @blkcg, or -1 (all bits set) when no such rule exists.
   */
  uint64_t blkcg_get_read_bps(struct blkio_cgroup *blkcg, dev_t dev)
  {
  	struct blkio_policy_node *rule;
  
  	rule = blkio_policy_search_node(blkcg, dev, BLKIO_POLICY_THROTL,
  					BLKIO_THROTL_read_bps_device);
  	if (!rule)
  		return -1;
  
  	return rule->val.bps;
  }
  
  /*
   * Return the write bytes-per-second value of the throttle rule for @dev in
   * @blkcg, or -1 (all bits set) when no such rule exists.
   */
  uint64_t blkcg_get_write_bps(struct blkio_cgroup *blkcg, dev_t dev)
  {
  	struct blkio_policy_node *rule;
  
  	rule = blkio_policy_search_node(blkcg, dev, BLKIO_POLICY_THROTL,
  					BLKIO_THROTL_write_bps_device);
  	if (!rule)
  		return -1;
  
  	return rule->val.bps;
  }
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
  /*
   * Return the read IOPS value of the throttle rule for @dev in @blkcg, or
   * -1 (all bits set) when no such rule exists.
   */
  unsigned int blkcg_get_read_iops(struct blkio_cgroup *blkcg, dev_t dev)
  {
  	struct blkio_policy_node *rule;
  
  	rule = blkio_policy_search_node(blkcg, dev, BLKIO_POLICY_THROTL,
  					BLKIO_THROTL_read_iops_device);
  	if (!rule)
  		return -1;
  
  	return rule->val.iops;
  }
  
  /*
   * Return the write IOPS value of the throttle rule for @dev in @blkcg, or
   * -1 (all bits set) when no such rule exists.
   */
  unsigned int blkcg_get_write_iops(struct blkio_cgroup *blkcg, dev_t dev)
  {
  	struct blkio_policy_node *rule;
  
  	rule = blkio_policy_search_node(blkcg, dev, BLKIO_POLICY_THROTL,
  					BLKIO_THROTL_write_iops_device);
  	if (!rule)
  		return -1;
  
  	return rule->val.iops;
  }
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
786
787
788
789
790
  /* Checks whether user asked for deleting a policy rule */
  static bool blkio_delete_rule_command(struct blkio_policy_node *pn)
  {
  	switch(pn->plid) {
  	case BLKIO_POLICY_PROP:
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
791
792
793
794
  		if (pn->val.weight == 0)
  			return 1;
  		break;
  	case BLKIO_POLICY_THROTL:
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
795
796
797
798
799
800
801
802
803
804
805
  		switch(pn->fileid) {
  		case BLKIO_THROTL_read_bps_device:
  		case BLKIO_THROTL_write_bps_device:
  			if (pn->val.bps == 0)
  				return 1;
  			break;
  		case BLKIO_THROTL_read_iops_device:
  		case BLKIO_THROTL_write_iops_device:
  			if (pn->val.iops == 0)
  				return 1;
  		}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
806
807
808
809
810
811
812
813
814
815
816
817
818
  		break;
  	default:
  		BUG();
  	}
  
  	return 0;
  }
  
  static void blkio_update_policy_rule(struct blkio_policy_node *oldpn,
  					struct blkio_policy_node *newpn)
  {
  	switch(oldpn->plid) {
  	case BLKIO_POLICY_PROP:
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
819
820
821
  		oldpn->val.weight = newpn->val.weight;
  		break;
  	case BLKIO_POLICY_THROTL:
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
822
823
824
825
826
827
828
829
830
  		switch(newpn->fileid) {
  		case BLKIO_THROTL_read_bps_device:
  		case BLKIO_THROTL_write_bps_device:
  			oldpn->val.bps = newpn->val.bps;
  			break;
  		case BLKIO_THROTL_read_iops_device:
  		case BLKIO_THROTL_write_iops_device:
  			oldpn->val.iops = newpn->val.iops;
  		}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
831
832
833
834
835
836
837
838
839
840
841
842
843
  		break;
  	default:
  		BUG();
  	}
  }
  
  /*
   * Some rules/values in blkg have changed. Propogate those to respective
   * policies.
   */
  static void blkio_update_blkg_policy(struct blkio_cgroup *blkcg,
  		struct blkio_group *blkg, struct blkio_policy_node *pn)
  {
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
844
  	unsigned int weight, iops;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
845
  	u64 bps;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
846
847
848
  
  	switch(pn->plid) {
  	case BLKIO_POLICY_PROP:
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
849
  		weight = pn->val.weight ? pn->val.weight :
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
850
851
852
  				blkcg->weight;
  		blkio_update_group_weight(blkg, weight);
  		break;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
853
854
855
856
857
858
859
  	case BLKIO_POLICY_THROTL:
  		switch(pn->fileid) {
  		case BLKIO_THROTL_read_bps_device:
  		case BLKIO_THROTL_write_bps_device:
  			bps = pn->val.bps ? pn->val.bps : (-1);
  			blkio_update_group_bps(blkg, bps, pn->fileid);
  			break;
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
860
861
862
863
864
  		case BLKIO_THROTL_read_iops_device:
  		case BLKIO_THROTL_write_iops_device:
  			iops = pn->val.iops ? pn->val.iops : (-1);
  			blkio_update_group_iops(blkg, iops, pn->fileid);
  			break;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
865
866
  		}
  		break;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
  	default:
  		BUG();
  	}
  }
  
  /*
   * A policy node rule has been updated. Propogate this update to all the
   * block groups which might be affected by this update.
   */
  static void blkio_update_policy_node_blkg(struct blkio_cgroup *blkcg,
  				struct blkio_policy_node *pn)
  {
  	struct blkio_group *blkg;
  	struct hlist_node *n;
  
  	spin_lock(&blkio_list_lock);
  	spin_lock_irq(&blkcg->lock);
34d0f179d   Gui Jianfeng   io-controller: Ad...
884

062a644d6   Vivek Goyal   blk-cgroup: Prepa...
885
886
887
888
889
890
891
892
893
  	hlist_for_each_entry(blkg, n, &blkcg->blkg_list, blkcg_node) {
  		if (pn->dev != blkg->dev || pn->plid != blkg->plid)
  			continue;
  		blkio_update_blkg_policy(blkcg, blkg, pn);
  	}
  
  	spin_unlock_irq(&blkcg->lock);
  	spin_unlock(&blkio_list_lock);
  }
34d0f179d   Gui Jianfeng   io-controller: Ad...
894

062a644d6   Vivek Goyal   blk-cgroup: Prepa...
895
896
  static int blkiocg_file_write(struct cgroup *cgrp, struct cftype *cft,
   				       const char *buffer)
34d0f179d   Gui Jianfeng   io-controller: Ad...
897
898
899
900
901
  {
  	int ret = 0;
  	char *buf;
  	struct blkio_policy_node *newpn, *pn;
  	struct blkio_cgroup *blkcg;
34d0f179d   Gui Jianfeng   io-controller: Ad...
902
  	int keep_newpn = 0;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
903
904
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int fileid = BLKIOFILE_ATTR(cft->private);
34d0f179d   Gui Jianfeng   io-controller: Ad...
905
906
907
908
909
910
911
912
913
914
  
  	buf = kstrdup(buffer, GFP_KERNEL);
  	if (!buf)
  		return -ENOMEM;
  
  	newpn = kzalloc(sizeof(*newpn), GFP_KERNEL);
  	if (!newpn) {
  		ret = -ENOMEM;
  		goto free_buf;
  	}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
915
  	ret = blkio_policy_parse_and_set(buf, newpn, plid, fileid);
34d0f179d   Gui Jianfeng   io-controller: Ad...
916
917
918
919
920
921
  	if (ret)
  		goto free_newpn;
  
  	blkcg = cgroup_to_blkio_cgroup(cgrp);
  
  	spin_lock_irq(&blkcg->lock);
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
922
  	pn = blkio_policy_search_node(blkcg, newpn->dev, plid, fileid);
34d0f179d   Gui Jianfeng   io-controller: Ad...
923
  	if (!pn) {
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
924
  		if (!blkio_delete_rule_command(newpn)) {
34d0f179d   Gui Jianfeng   io-controller: Ad...
925
926
927
928
929
930
  			blkio_policy_insert_node(blkcg, newpn);
  			keep_newpn = 1;
  		}
  		spin_unlock_irq(&blkcg->lock);
  		goto update_io_group;
  	}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
931
  	if (blkio_delete_rule_command(newpn)) {
34d0f179d   Gui Jianfeng   io-controller: Ad...
932
933
934
935
936
  		blkio_policy_delete_node(pn);
  		spin_unlock_irq(&blkcg->lock);
  		goto update_io_group;
  	}
  	spin_unlock_irq(&blkcg->lock);
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
937
  	blkio_update_policy_rule(pn, newpn);
34d0f179d   Gui Jianfeng   io-controller: Ad...
938
939
  
  update_io_group:
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
940
  	blkio_update_policy_node_blkg(blkcg, newpn);
34d0f179d   Gui Jianfeng   io-controller: Ad...
941
942
943
944
945
946
947
948
  
  free_newpn:
  	if (!keep_newpn)
  		kfree(newpn);
  free_buf:
  	kfree(buf);
  	return ret;
  }
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
949
950
  static void
  blkio_print_policy_node(struct seq_file *m, struct blkio_policy_node *pn)
34d0f179d   Gui Jianfeng   io-controller: Ad...
951
  {
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
952
953
954
955
956
  	switch(pn->plid) {
  		case BLKIO_POLICY_PROP:
  			if (pn->fileid == BLKIO_PROP_weight_device)
  				seq_printf(m, "%u:%u\t%u
  ", MAJOR(pn->dev),
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
957
958
959
  					MINOR(pn->dev), pn->val.weight);
  			break;
  		case BLKIO_POLICY_THROTL:
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
960
961
962
  			switch(pn->fileid) {
  			case BLKIO_THROTL_read_bps_device:
  			case BLKIO_THROTL_write_bps_device:
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
963
964
965
  				seq_printf(m, "%u:%u\t%llu
  ", MAJOR(pn->dev),
  					MINOR(pn->dev), pn->val.bps);
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
966
967
968
969
970
971
972
973
  				break;
  			case BLKIO_THROTL_read_iops_device:
  			case BLKIO_THROTL_write_iops_device:
  				seq_printf(m, "%u:%u\t%u
  ", MAJOR(pn->dev),
  					MINOR(pn->dev), pn->val.iops);
  				break;
  			}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
974
975
976
977
978
  			break;
  		default:
  			BUG();
  	}
  }
34d0f179d   Gui Jianfeng   io-controller: Ad...
979

062a644d6   Vivek Goyal   blk-cgroup: Prepa...
980
981
982
  /* cgroup files which read their data from policy nodes end up here */
  static void blkio_read_policy_node_files(struct cftype *cft,
  			struct blkio_cgroup *blkcg, struct seq_file *m)
34d0f179d   Gui Jianfeng   io-controller: Ad...
983
  {
34d0f179d   Gui Jianfeng   io-controller: Ad...
984
  	struct blkio_policy_node *pn;
34d0f179d   Gui Jianfeng   io-controller: Ad...
985

0f3942a39   Jens Axboe   block: kill some ...
986
987
988
  	if (!list_empty(&blkcg->policy_list)) {
  		spin_lock_irq(&blkcg->lock);
  		list_for_each_entry(pn, &blkcg->policy_list, node) {
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
989
990
991
  			if (!pn_matches_cftype(cft, pn))
  				continue;
  			blkio_print_policy_node(m, pn);
0f3942a39   Jens Axboe   block: kill some ...
992
993
  		}
  		spin_unlock_irq(&blkcg->lock);
34d0f179d   Gui Jianfeng   io-controller: Ad...
994
  	}
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
  }
  
  static int blkiocg_file_read(struct cgroup *cgrp, struct cftype *cft,
  				struct seq_file *m)
  {
  	struct blkio_cgroup *blkcg;
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int name = BLKIOFILE_ATTR(cft->private);
  
  	blkcg = cgroup_to_blkio_cgroup(cgrp);
  
  	switch(plid) {
  	case BLKIO_POLICY_PROP:
  		switch(name) {
  		case BLKIO_PROP_weight_device:
  			blkio_read_policy_node_files(cft, blkcg, m);
  			return 0;
  		default:
  			BUG();
  		}
  		break;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
1016
1017
1018
1019
  	case BLKIO_POLICY_THROTL:
  		switch(name){
  		case BLKIO_THROTL_read_bps_device:
  		case BLKIO_THROTL_write_bps_device:
7702e8f45   Vivek Goyal   blk-cgroup: cgrou...
1020
1021
  		case BLKIO_THROTL_read_iops_device:
  		case BLKIO_THROTL_write_iops_device:
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
1022
1023
1024
1025
1026
1027
  			blkio_read_policy_node_files(cft, blkcg, m);
  			return 0;
  		default:
  			BUG();
  		}
  		break;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
  	default:
  		BUG();
  	}
  
  	return 0;
  }
  
  /*
   * Report statistic @type for every block group of @blkcg that has a device
   * number set and belongs to the same policy as @cft. When @show_total is
   * set, the sum of the values returned by blkio_get_stat() is additionally
   * reported under the key "Total". Always returns 0.
   */
  static int blkio_read_blkg_stats(struct blkio_cgroup *blkcg,
  		struct cftype *cft, struct cgroup_map_cb *cb, enum stat_type type,
  		bool show_total)
  {
  	struct blkio_group *grp;
  	struct hlist_node *pos;
  	uint64_t sum = 0;
  
  	rcu_read_lock();
  	hlist_for_each_entry_rcu(grp, pos, &blkcg->blkg_list, blkcg_node) {
  		if (!grp->dev || !cftype_blkg_same_policy(cft, grp))
  			continue;
  
  		spin_lock_irq(&grp->stats_lock);
  		sum += blkio_get_stat(grp, cb, grp->dev, type);
  		spin_unlock_irq(&grp->stats_lock);
  	}
  	if (show_total)
  		cb->fill(cb, "Total", sum);
  	rcu_read_unlock();
  
  	return 0;
  }
  
  /* All map kind of cgroup file get serviced by this function */
  static int blkiocg_file_read_map(struct cgroup *cgrp, struct cftype *cft,
  				struct cgroup_map_cb *cb)
  {
  	struct blkio_cgroup *blkcg;
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int name = BLKIOFILE_ATTR(cft->private);
  
  	blkcg = cgroup_to_blkio_cgroup(cgrp);
  
  	switch(plid) {
  	case BLKIO_POLICY_PROP:
  		switch(name) {
  		case BLKIO_PROP_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_TIME, 0);
  		case BLKIO_PROP_sectors:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SECTORS, 0);
  		case BLKIO_PROP_io_service_bytes:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SERVICE_BYTES, 1);
  		case BLKIO_PROP_io_serviced:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SERVICED, 1);
  		case BLKIO_PROP_io_service_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SERVICE_TIME, 1);
  		case BLKIO_PROP_io_wait_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_WAIT_TIME, 1);
  		case BLKIO_PROP_io_merged:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_MERGED, 1);
  		case BLKIO_PROP_io_queued:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_QUEUED, 1);
  #ifdef CONFIG_DEBUG_BLK_CGROUP
  		case BLKIO_PROP_dequeue:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_DEQUEUE, 0);
  		case BLKIO_PROP_avg_queue_size:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_AVG_QUEUE_SIZE, 0);
  		case BLKIO_PROP_group_wait_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_GROUP_WAIT_TIME, 0);
  		case BLKIO_PROP_idle_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_IDLE_TIME, 0);
  		case BLKIO_PROP_empty_time:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_EMPTY_TIME, 0);
  #endif
  		default:
  			BUG();
  		}
  		break;
4c9eefa16   Vivek Goyal   blk-cgroup: Intro...
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
  	case BLKIO_POLICY_THROTL:
  		switch(name){
  		case BLKIO_THROTL_io_service_bytes:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SERVICE_BYTES, 1);
  		case BLKIO_THROTL_io_serviced:
  			return blkio_read_blkg_stats(blkcg, cft, cb,
  						BLKIO_STAT_SERVICED, 1);
  		default:
  			BUG();
  		}
  		break;
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
  	default:
  		BUG();
  	}
  
  	return 0;
  }
  
  /*
   * Set the cgroup-wide weight of @blkcg to @val and push it to every block
   * group that has no weight_device rule of its own.
   *
   * Returns 0 on success, or -EINVAL when @val is outside
   * [BLKIO_WEIGHT_MIN, BLKIO_WEIGHT_MAX].
   */
  static int blkio_weight_write(struct blkio_cgroup *blkcg, u64 val)
  {
  	struct blkio_group *grp;
  	struct hlist_node *pos;
  
  	if (val < BLKIO_WEIGHT_MIN || val > BLKIO_WEIGHT_MAX)
  		return -EINVAL;
  
  	spin_lock(&blkio_list_lock);
  	spin_lock_irq(&blkcg->lock);
  	blkcg->weight = (unsigned int)val;
  
  	hlist_for_each_entry(grp, pos, &blkcg->blkg_list, blkcg_node) {
  		/* Groups with a per-device rule are left untouched. */
  		if (!blkio_policy_search_node(blkcg, grp->dev,
  				BLKIO_POLICY_PROP, BLKIO_PROP_weight_device))
  			blkio_update_group_weight(grp, blkcg->weight);
  	}
  	spin_unlock_irq(&blkcg->lock);
  	spin_unlock(&blkio_list_lock);
  
  	return 0;
  }
  
  /*
   * read_u64 handler. Returns the cgroup weight for the proportional-policy
   * "weight" file and 0 for any other proportional-policy file; any other
   * policy hits BUG().
   */
  static u64 blkiocg_file_read_u64 (struct cgroup *cgrp, struct cftype *cft) {
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int attr = BLKIOFILE_ATTR(cft->private);
  	struct blkio_cgroup *blkcg = cgroup_to_blkio_cgroup(cgrp);
  
  	if (plid != BLKIO_POLICY_PROP) {
  		BUG();
  		return 0;
  	}
  
  	if (attr == BLKIO_PROP_weight)
  		return (u64)blkcg->weight;
  
  	return 0;
  }
  
  /*
   * write_u64 handler. For the proportional-policy "weight" file the value is
   * handed to blkio_weight_write() and its result returned; any other
   * proportional-policy file is ignored and 0 returned; any other policy hits
   * BUG().
   */
  static int
  blkiocg_file_write_u64(struct cgroup *cgrp, struct cftype *cft, u64 val)
  {
  	enum blkio_policy_id plid = BLKIOFILE_POLICY(cft->private);
  	int attr = BLKIOFILE_ATTR(cft->private);
  	struct blkio_cgroup *blkcg = cgroup_to_blkio_cgroup(cgrp);
  
  	if (plid != BLKIO_POLICY_PROP) {
  		BUG();
  		return 0;
  	}
  
  	if (attr == BLKIO_PROP_weight)
  		return blkio_weight_write(blkcg, val);
  
  	return 0;
  }
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1205
1206
  struct cftype blkio_files[] = {
  	{
34d0f179d   Gui Jianfeng   io-controller: Ad...
1207
  		.name = "weight_device",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1208
1209
1210
1211
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_weight_device),
  		.read_seq_string = blkiocg_file_read,
  		.write_string = blkiocg_file_write,
34d0f179d   Gui Jianfeng   io-controller: Ad...
1212
1213
1214
  		.max_write_len = 256,
  	},
  	{
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1215
  		.name = "weight",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1216
1217
1218
1219
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_weight),
  		.read_u64 = blkiocg_file_read_u64,
  		.write_u64 = blkiocg_file_write_u64,
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1220
  	},
220841906   Vivek Goyal   blkio: Export dis...
1221
1222
  	{
  		.name = "time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1223
1224
1225
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_time),
  		.read_map = blkiocg_file_read_map,
220841906   Vivek Goyal   blkio: Export dis...
1226
1227
1228
  	},
  	{
  		.name = "sectors",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1229
1230
1231
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_sectors),
  		.read_map = blkiocg_file_read_map,
303a3acb2   Divyesh Shah   blkio: Add io con...
1232
1233
1234
  	},
  	{
  		.name = "io_service_bytes",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1235
1236
1237
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_service_bytes),
  		.read_map = blkiocg_file_read_map,
303a3acb2   Divyesh Shah   blkio: Add io con...
1238
1239
1240
  	},
  	{
  		.name = "io_serviced",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1241
1242
1243
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_serviced),
  		.read_map = blkiocg_file_read_map,
303a3acb2   Divyesh Shah   blkio: Add io con...
1244
1245
1246
  	},
  	{
  		.name = "io_service_time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1247
1248
1249
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_service_time),
  		.read_map = blkiocg_file_read_map,
303a3acb2   Divyesh Shah   blkio: Add io con...
1250
1251
1252
  	},
  	{
  		.name = "io_wait_time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1253
1254
1255
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_wait_time),
  		.read_map = blkiocg_file_read_map,
84c124da9   Divyesh Shah   blkio: Changes to...
1256
1257
  	},
  	{
812d40264   Divyesh Shah   blkio: Add io_mer...
1258
  		.name = "io_merged",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1259
1260
1261
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_merged),
  		.read_map = blkiocg_file_read_map,
812d40264   Divyesh Shah   blkio: Add io_mer...
1262
1263
  	},
  	{
cdc1184cf   Divyesh Shah   blkio: Add io_que...
1264
  		.name = "io_queued",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1265
1266
1267
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_io_queued),
  		.read_map = blkiocg_file_read_map,
cdc1184cf   Divyesh Shah   blkio: Add io_que...
1268
1269
  	},
  	{
84c124da9   Divyesh Shah   blkio: Changes to...
1270
1271
  		.name = "reset_stats",
  		.write_u64 = blkiocg_reset_stats,
220841906   Vivek Goyal   blkio: Export dis...
1272
  	},
13f98250f   Vivek Goyal   blkio: Do not exp...
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
  #ifdef CONFIG_BLK_DEV_THROTTLING
  	{
  		.name = "throttle.read_bps_device",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_read_bps_device),
  		.read_seq_string = blkiocg_file_read,
  		.write_string = blkiocg_file_write,
  		.max_write_len = 256,
  	},
  
  	{
  		.name = "throttle.write_bps_device",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_write_bps_device),
  		.read_seq_string = blkiocg_file_read,
  		.write_string = blkiocg_file_write,
  		.max_write_len = 256,
  	},
  
  	{
  		.name = "throttle.read_iops_device",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_read_iops_device),
  		.read_seq_string = blkiocg_file_read,
  		.write_string = blkiocg_file_write,
  		.max_write_len = 256,
  	},
  
  	{
  		.name = "throttle.write_iops_device",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_write_iops_device),
  		.read_seq_string = blkiocg_file_read,
  		.write_string = blkiocg_file_write,
  		.max_write_len = 256,
  	},
  	{
  		.name = "throttle.io_service_bytes",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_io_service_bytes),
  		.read_map = blkiocg_file_read_map,
  	},
  	{
  		.name = "throttle.io_serviced",
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_THROTL,
  				BLKIO_THROTL_io_serviced),
  		.read_map = blkiocg_file_read_map,
  	},
  #endif /* CONFIG_BLK_DEV_THROTTLING */
220841906   Vivek Goyal   blkio: Export dis...
1322
  #ifdef CONFIG_DEBUG_BLK_CGROUP
cdc1184cf   Divyesh Shah   blkio: Add io_que...
1323
1324
  	{
  		.name = "avg_queue_size",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1325
1326
1327
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_avg_queue_size),
  		.read_map = blkiocg_file_read_map,
cdc1184cf   Divyesh Shah   blkio: Add io_que...
1328
1329
  	},
  	{
812df48d1   Divyesh Shah   blkio: Add more d...
1330
  		.name = "group_wait_time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1331
1332
1333
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_group_wait_time),
  		.read_map = blkiocg_file_read_map,
812df48d1   Divyesh Shah   blkio: Add more d...
1334
1335
1336
  	},
  	{
  		.name = "idle_time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1337
1338
1339
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_idle_time),
  		.read_map = blkiocg_file_read_map,
812df48d1   Divyesh Shah   blkio: Add more d...
1340
1341
1342
  	},
  	{
  		.name = "empty_time",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1343
1344
1345
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_empty_time),
  		.read_map = blkiocg_file_read_map,
812df48d1   Divyesh Shah   blkio: Add more d...
1346
1347
  	},
  	{
220841906   Vivek Goyal   blkio: Export dis...
1348
  		.name = "dequeue",
062a644d6   Vivek Goyal   blk-cgroup: Prepa...
1349
1350
1351
  		.private = BLKIOFILE_PRIVATE(BLKIO_POLICY_PROP,
  				BLKIO_PROP_dequeue),
  		.read_map = blkiocg_file_read_map,
cdc1184cf   Divyesh Shah   blkio: Add io_que...
1352
  	},
220841906   Vivek Goyal   blkio: Export dis...
1353
  #endif
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
  };
  
  /*
   * Add every entry of blkio_files[] to @cgroup via cgroup_add_files() and
   * return its result.
   */
  static int blkiocg_populate(struct cgroup_subsys *subsys, struct cgroup *cgroup)
  {
  	return cgroup_add_files(cgroup, subsys, blkio_files,
  				ARRAY_SIZE(blkio_files));
  }
  
  static void blkiocg_destroy(struct cgroup_subsys *subsys, struct cgroup *cgroup)
  {
  	struct blkio_cgroup *blkcg = cgroup_to_blkio_cgroup(cgroup);
b1c357696   Vivek Goyal   blkio: Take care ...
1365
1366
1367
  	unsigned long flags;
  	struct blkio_group *blkg;
  	void *key;
3e2520668   Vivek Goyal   blkio: Implement ...
1368
  	struct blkio_policy_type *blkiop;
34d0f179d   Gui Jianfeng   io-controller: Ad...
1369
  	struct blkio_policy_node *pn, *pntmp;
b1c357696   Vivek Goyal   blkio: Take care ...
1370
1371
  
  	rcu_read_lock();
0f3942a39   Jens Axboe   block: kill some ...
1372
1373
  	do {
  		spin_lock_irqsave(&blkcg->lock, flags);
b1c357696   Vivek Goyal   blkio: Take care ...
1374

0f3942a39   Jens Axboe   block: kill some ...
1375
1376
1377
1378
  		if (hlist_empty(&blkcg->blkg_list)) {
  			spin_unlock_irqrestore(&blkcg->lock, flags);
  			break;
  		}
b1c357696   Vivek Goyal   blkio: Take care ...
1379

0f3942a39   Jens Axboe   block: kill some ...
1380
1381
1382
1383
  		blkg = hlist_entry(blkcg->blkg_list.first, struct blkio_group,
  					blkcg_node);
  		key = rcu_dereference(blkg->key);
  		__blkiocg_del_blkio_group(blkg);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1384

0f3942a39   Jens Axboe   block: kill some ...
1385
  		spin_unlock_irqrestore(&blkcg->lock, flags);
b1c357696   Vivek Goyal   blkio: Take care ...
1386

0f3942a39   Jens Axboe   block: kill some ...
1387
1388
1389
  		/*
  		 * This blkio_group is being unlinked as associated cgroup is
  		 * going away. Let all the IO controlling policies know about
61014e96e   Vivek Goyal   blkio: deletion o...
1390
  		 * this event.
0f3942a39   Jens Axboe   block: kill some ...
1391
1392
  		 */
  		spin_lock(&blkio_list_lock);
61014e96e   Vivek Goyal   blkio: deletion o...
1393
1394
1395
  		list_for_each_entry(blkiop, &blkio_list, list) {
  			if (blkiop->plid != blkg->plid)
  				continue;
0f3942a39   Jens Axboe   block: kill some ...
1396
  			blkiop->ops.blkio_unlink_group_fn(key, blkg);
61014e96e   Vivek Goyal   blkio: deletion o...
1397
  		}
0f3942a39   Jens Axboe   block: kill some ...
1398
1399
  		spin_unlock(&blkio_list_lock);
  	} while (1);
34d0f179d   Gui Jianfeng   io-controller: Ad...
1400

34d0f179d   Gui Jianfeng   io-controller: Ad...
1401
1402
1403
1404
  	list_for_each_entry_safe(pn, pntmp, &blkcg->policy_list, node) {
  		blkio_policy_delete_node(pn);
  		kfree(pn);
  	}
0f3942a39   Jens Axboe   block: kill some ...
1405

31e4c28d9   Vivek Goyal   blkio: Introduce ...
1406
  	free_css_id(&blkio_subsys, &blkcg->css);
b1c357696   Vivek Goyal   blkio: Take care ...
1407
  	rcu_read_unlock();
67523c48a   Ben Blum   cgroups: blkio su...
1408
1409
  	if (blkcg != &blkio_root_cgroup)
  		kfree(blkcg);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1410
1411
1412
1413
1414
  }
  
  static struct cgroup_subsys_state *
  blkiocg_create(struct cgroup_subsys *subsys, struct cgroup *cgroup)
  {
0341509fd   Li Zefan   blk-cgroup: Fix a...
1415
1416
  	struct blkio_cgroup *blkcg;
  	struct cgroup *parent = cgroup->parent;
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1417

0341509fd   Li Zefan   blk-cgroup: Fix a...
1418
  	if (!parent) {
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1419
1420
1421
  		blkcg = &blkio_root_cgroup;
  		goto done;
  	}
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1422
1423
1424
1425
1426
1427
1428
1429
  	blkcg = kzalloc(sizeof(*blkcg), GFP_KERNEL);
  	if (!blkcg)
  		return ERR_PTR(-ENOMEM);
  
  	blkcg->weight = BLKIO_WEIGHT_DEFAULT;
  done:
  	spin_lock_init(&blkcg->lock);
  	INIT_HLIST_HEAD(&blkcg->blkg_list);
34d0f179d   Gui Jianfeng   io-controller: Ad...
1430
  	INIT_LIST_HEAD(&blkcg->policy_list);
31e4c28d9   Vivek Goyal   blkio: Introduce ...
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
  	return &blkcg->css;
  }
  
  /*
   * We cannot support shared io contexts, as we have no means to support
   * two tasks with the same ioc in two different groups without major rework
   * of the main cic data structures.  For now we allow a task to change
   * its cgroup only if it's the only owner of its ioc.
   *
   * Returns 0 if @tsk may be attached, -EINVAL if its io_context is shared by
   * more than one task.
   */
  static int blkiocg_can_attach(struct cgroup_subsys *subsys,
  				struct cgroup *cgroup, struct task_struct *tsk,
  				bool threadgroup)
  {
  	struct io_context *ioc;
  	bool shared;
  
  	/* task_lock() is needed to avoid races with exit_io_context() */
  	task_lock(tsk);
  	ioc = tsk->io_context;
  	shared = ioc && atomic_read(&ioc->nr_tasks) > 1;
  	task_unlock(tsk);
  
  	if (shared)
  		return -EINVAL;
  
  	return 0;
  }
  
  /*
   * Attach callback: if @tsk has an io_context, flag it with cgroup_changed
   * while holding the task lock.
   */
  static void blkiocg_attach(struct cgroup_subsys *subsys, struct cgroup *cgroup,
  				struct cgroup *prev, struct task_struct *tsk,
  				bool threadgroup)
  {
  	task_lock(tsk);
  	if (tsk->io_context)
  		tsk->io_context->cgroup_changed = 1;
  	task_unlock(tsk);
  }
3e2520668   Vivek Goyal   blkio: Implement ...
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
  /*
   * Append @blkiop to the global list of registered IO control policies
   * (blkio_list), under blkio_list_lock.
   */
  void blkio_policy_register(struct blkio_policy_type *blkiop)
  {
  	spin_lock(&blkio_list_lock);
  	list_add_tail(&blkiop->list, &blkio_list);
  	spin_unlock(&blkio_list_lock);
  }
  EXPORT_SYMBOL_GPL(blkio_policy_register);
  
  /*
   * Remove @blkiop from the global policy list (blkio_list), under
   * blkio_list_lock, and reinitialise its list node.
   */
  void blkio_policy_unregister(struct blkio_policy_type *blkiop)
  {
  	spin_lock(&blkio_list_lock);
  	list_del_init(&blkiop->list);
  	spin_unlock(&blkio_list_lock);
  }
  EXPORT_SYMBOL_GPL(blkio_policy_unregister);
67523c48a   Ben Blum   cgroups: blkio su...
1484
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
1497
  
  /* Module init: load the blkio cgroup subsystem and return the result. */
  static int __init init_cgroup_blkio(void)
  {
  	return cgroup_load_subsys(&blkio_subsys);
  }
  
  /* Module exit: unload the blkio cgroup subsystem. */
  static void __exit exit_cgroup_blkio(void)
  {
  	cgroup_unload_subsys(&blkio_subsys);
  }
  
  module_init(init_cgroup_blkio);
  module_exit(exit_cgroup_blkio);
  MODULE_LICENSE("GPL");