Blame view

block/as-iosched.c 38.7 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
2
3
   *  Anticipatory & deadline i/o scheduler.
   *
0fe234795   Jens Axboe   [PATCH] Update ax...
4
   *  Copyright (C) 2002 Jens Axboe <axboe@kernel.dk>
f5b3db001   Nick Piggin   [PATCH] as: coope...
5
   *                     Nick Piggin <nickpiggin@yahoo.com.au>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
6
7
8
9
10
11
12
   *
   */
  #include <linux/kernel.h>
  #include <linux/fs.h>
  #include <linux/blkdev.h>
  #include <linux/elevator.h>
  #include <linux/bio.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
13
14
15
16
  #include <linux/module.h>
  #include <linux/slab.h>
  #include <linux/init.h>
  #include <linux/compiler.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
17
18
  #include <linux/rbtree.h>
  #include <linux/interrupt.h>
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
  /*
   * See Documentation/block/as-iosched.txt
   */
  
  /*
   * max time before a read is submitted.
   */
  #define default_read_expire (HZ / 8)
  
  /*
   * ditto for writes, these limits are not hard, even
   * if the disk is capable of satisfying them.
   */
  #define default_write_expire (HZ / 4)
  
  /*
   * read_batch_expire describes how long we will allow a stream of reads to
   * persist before looking to see whether it is time to switch over to writes.
   */
  #define default_read_batch_expire (HZ / 2)
  
  /*
   * write_batch_expire describes how long we want a stream of writes to run for.
   * This is not a hard limit, but a target we set for the auto-tuning thingy.
   * See, the problem is: we can send a lot of writes to disk cache / TCQ in
   * a short amount of time...
   */
  #define default_write_batch_expire (HZ / 8)
  
  /*
   * max time we may wait to anticipate a read (default around 6ms)
   */
  #define default_antic_expire ((HZ / 150) ? HZ / 150 : 1)
  
  /*
   * Keep track of up to 20ms thinktimes. We can go as big as we like here,
   * however huge values tend to interfere and not decay fast enough. A program
   * might be in a non-io phase of operation. Waiting on user input for example,
   * or doing a lengthy computation. A small penalty can be justified there, and
   * will still catch out those processes that constantly have large thinktimes.
   */
  #define MAX_THINKTIME (HZ/50UL)
  
  /*
   * Bit positions within as_io_context.state. These are bit numbers, not
   * masks: this file applies them with test_bit()/set_bit()/clear_bit().
   */
  enum as_io_states {
  	AS_TASK_RUNNING = 0,	/* Process has not exited */
  	AS_TASK_IOSTARTED,	/* Process has started some IO */
  	AS_TASK_IORUNNING,	/* Process has completed some IO */
  };
  
  /*
   * Phases of the anticipation state machine, kept in as_data.antic_status.
   */
  enum anticipation_status {
  	/* Not anticipating (normal operation) */
  	ANTIC_OFF	= 0,
  	/* The last read has not yet completed */
  	ANTIC_WAIT_REQ	= 1,
  	/* Currently anticipating a request vs last read (which has completed) */
  	ANTIC_WAIT_NEXT	= 2,
  	/* Anticipating but have found a candidate or timed out */
  	ANTIC_FINISHED	= 3,
  };
  
  struct as_data {
  	/*
  	 * run time data
  	 */
  
  	struct request_queue *q;	/* the "owner" queue */
  
  	/*
  	 * requests (as_rq s) are present on both sort_list and fifo_list
  	 */
  	struct rb_root sort_list[2];
  	struct list_head fifo_list[2];
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
90
  	struct request *next_rq[2];	/* next in sort order */
1d6bfbdf3   Jens Axboe   as-iosched: get r...
91
  	sector_t last_sector[2];	/* last SYNC & ASYNC sectors */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
92
93
94
  
  	unsigned long exit_prob;	/* probability a task will exit while
  					   being waited on */
f5b3db001   Nick Piggin   [PATCH] as: coope...
95
96
97
  	unsigned long exit_no_coop;	/* probablility an exited task will
  					   not be part of a later cooperating
  					   request */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
98
99
100
101
102
103
104
105
106
  	unsigned long new_ttime_total; 	/* mean thinktime on new proc */
  	unsigned long new_ttime_mean;
  	u64 new_seek_total;		/* mean seek on new proc */
  	sector_t new_seek_mean;
  
  	unsigned long current_batch_expires;
  	unsigned long last_check_fifo[2];
  	int changed_batch;		/* 1: waiting for old batch to end */
  	int new_batch;			/* 1: waiting on first read complete */
1d6bfbdf3   Jens Axboe   as-iosched: get r...
107
  	int batch_data_dir;		/* current batch SYNC / ASYNC */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
108
109
110
  	int write_batch_count;		/* max # of reqs in a write batch */
  	int current_write_count;	/* how many requests left this batch */
  	int write_batch_idled;		/* has the write batch gone idle? */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
  
  	enum anticipation_status antic_status;
  	unsigned long antic_start;	/* jiffies: when it started */
  	struct timer_list antic_timer;	/* anticipatory scheduling timer */
  	struct work_struct antic_work;	/* Deferred unplugging */
  	struct io_context *io_context;	/* Identify the expected process */
  	int ioc_finished; /* IO associated with io_context is finished */
  	int nr_dispatched;
  
  	/*
  	 * settings that change how the i/o scheduler behaves
  	 */
  	unsigned long fifo_expire[2];
  	unsigned long batch_expire[2];
  	unsigned long antic_expire;
  };
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
127
128
129
130
131
132
133
134
135
136
137
138
139
140
  /*
   * per-request data.
   */
  /*
   * Lifecycle state of a request as tracked by this scheduler; stored in
   * rq->elevator_private2 through RQ_STATE()/RQ_SET_STATE().
   */
  enum arq_state {
  	/* New - not referenced and not on any lists */
  	AS_RQ_NEW		= 0,
  	/* In the request queue. It belongs to the scheduler */
  	AS_RQ_QUEUED		= 1,
  	/* On the dispatch list. It belongs to the driver now */
  	AS_RQ_DISPATCHED	= 2,
  	/*
  	 * The remaining values are debug poisoning, for catching requests
  	 * that are being used when they shouldn't be.
  	 */
  	AS_RQ_PRESCHED		= 3,
  	AS_RQ_REMOVED		= 4,
  	AS_RQ_MERGED		= 5,
  	AS_RQ_POSTSCHED		= 6,
  };
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
141
142
143
  /*
   * Accessors for the two elevator-private pointers of a request:
   *  - elevator_private  holds the io_context the request was issued under,
   *  - elevator_private2 holds an enum arq_state value stored in a pointer.
   *
   * The state is converted through unsigned long so the pointer<->enum casts
   * are between same-width integers, and the macro argument is parenthesised
   * so that expressions such as "a ? b : c" can be passed safely.
   */
  #define RQ_IOC(rq)	((struct io_context *)(rq)->elevator_private)
  #define RQ_STATE(rq)	\
  	((enum arq_state)(unsigned long)(rq)->elevator_private2)
  #define RQ_SET_STATE(rq, state)	\
  	((rq)->elevator_private2 = (void *)(unsigned long)(state))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
144

e4313dd42   Jens Axboe   [PATCH] as-iosche...
145
  static DEFINE_PER_CPU(unsigned long, ioc_count);
334e94de9   Al Viro   [PATCH] deal with...
146
  static struct completion *ioc_gone;
863fddcb4   Jens Axboe   as-iosched: prope...
147
  static DEFINE_SPINLOCK(ioc_gone_lock);
334e94de9   Al Viro   [PATCH] deal with...
148

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
149
  static void as_move_to_dispatch(struct as_data *ad, struct request *rq);
ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
150
  static void as_antic_stop(struct as_data *ad);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
151
152
153
154
155
156
157
158
  /*
   * IO Context helper functions
   */
  
  /* Called to deallocate the as_io_context */
  static void free_as_io_context(struct as_io_context *aic)
  {
  	kfree(aic);
e4313dd42   Jens Axboe   [PATCH] as-iosche...
159
  	elv_ioc_count_dec(ioc_count);
863fddcb4   Jens Axboe   as-iosched: prope...
160
161
162
163
164
165
166
167
168
169
170
171
172
  	if (ioc_gone) {
  		/*
  		 * AS scheduler is exiting, grab exit lock and check
  		 * the pending io context count. If it hits zero,
  		 * complete ioc_gone and set it back to NULL.
  		 */
  		spin_lock(&ioc_gone_lock);
  		if (ioc_gone && !elv_ioc_count_read(ioc_count)) {
  			complete(ioc_gone);
  			ioc_gone = NULL;
  		}
  		spin_unlock(&ioc_gone_lock);
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
173
  }
e17a9489b   Al Viro   [PATCH] stop elv_...
174
175
  static void as_trim(struct io_context *ioc)
  {
8bdd3f8a6   Jens Axboe   as-iosched: fix i...
176
  	spin_lock_irq(&ioc->lock);
334e94de9   Al Viro   [PATCH] deal with...
177
178
  	if (ioc->aic)
  		free_as_io_context(ioc->aic);
e17a9489b   Al Viro   [PATCH] stop elv_...
179
  	ioc->aic = NULL;
8bdd3f8a6   Jens Axboe   as-iosched: fix i...
180
  	spin_unlock_irq(&ioc->lock);
e17a9489b   Al Viro   [PATCH] stop elv_...
181
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
  /*
   * Called when the task exits (installed as the ->exit hook by
   * alloc_as_io_context()).
   *
   * Clears AS_TASK_RUNNING in @aic->state; other code in this file tests that
   * bit to tell whether the process being anticipated on has exited.
   */
  static void exit_as_io_context(struct as_io_context *aic)
  {
  	/* The bit is set at allocation time, so finding it clear is unexpected. */
  	WARN_ON(!test_bit(AS_TASK_RUNNING, &aic->state));
  	clear_bit(AS_TASK_RUNNING, &aic->state);
  }
  
  static struct as_io_context *alloc_as_io_context(void)
  {
  	struct as_io_context *ret;
  
  	ret = kmalloc(sizeof(*ret), GFP_ATOMIC);
  	if (ret) {
  		ret->dtor = free_as_io_context;
  		ret->exit = exit_as_io_context;
  		ret->state = 1 << AS_TASK_RUNNING;
  		atomic_set(&ret->nr_queued, 0);
  		atomic_set(&ret->nr_dispatched, 0);
  		spin_lock_init(&ret->lock);
  		ret->ttime_total = 0;
  		ret->ttime_samples = 0;
  		ret->ttime_mean = 0;
  		ret->seek_total = 0;
  		ret->seek_samples = 0;
  		ret->seek_mean = 0;
e4313dd42   Jens Axboe   [PATCH] as-iosche...
207
  		elv_ioc_count_inc(ioc_count);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
208
209
210
211
212
213
214
215
216
  	}
  
  	return ret;
  }
  
  /*
   * If the current task has no AS IO context then create one and initialise it.
   * Then take a ref on the task's io context and return it.
   */
b5deef901   Jens Axboe   [PATCH] Make sure...
217
  static struct io_context *as_get_io_context(int node)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
218
  {
b5deef901   Jens Axboe   [PATCH] Make sure...
219
  	struct io_context *ioc = get_io_context(GFP_ATOMIC, node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
220
221
222
223
224
225
226
227
228
  	if (ioc && !ioc->aic) {
  		ioc->aic = alloc_as_io_context();
  		if (!ioc->aic) {
  			put_io_context(ioc);
  			ioc = NULL;
  		}
  	}
  	return ioc;
  }
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
229
  static void as_put_io_context(struct request *rq)
b4878f245   Jens Axboe   [PATCH] 02/05: up...
230
231
  {
  	struct as_io_context *aic;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
232
  	if (unlikely(!RQ_IOC(rq)))
b4878f245   Jens Axboe   [PATCH] 02/05: up...
233
  		return;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
234
  	aic = RQ_IOC(rq)->aic;
b4878f245   Jens Axboe   [PATCH] 02/05: up...
235

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
236
  	if (rq_is_sync(rq) && aic) {
8bdd3f8a6   Jens Axboe   as-iosched: fix i...
237
238
239
  		unsigned long flags;
  
  		spin_lock_irqsave(&aic->lock, flags);
b4878f245   Jens Axboe   [PATCH] 02/05: up...
240
241
  		set_bit(AS_TASK_IORUNNING, &aic->state);
  		aic->last_end_request = jiffies;
8bdd3f8a6   Jens Axboe   as-iosched: fix i...
242
  		spin_unlock_irqrestore(&aic->lock, flags);
b4878f245   Jens Axboe   [PATCH] 02/05: up...
243
  	}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
244
  	put_io_context(RQ_IOC(rq));
b4878f245   Jens Axboe   [PATCH] 02/05: up...
245
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
246
  /*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
247
248
   * rb tree support functions
   */
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
249
  /* Sort tree that @rq belongs on: sort_list[] is indexed by rq_is_sync(). */
  #define RQ_RB_ROOT(ad, rq)	(&(ad)->sort_list[rq_is_sync(rq)])
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
250

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
251
  static void as_add_rq_rb(struct as_data *ad, struct request *rq)
ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
252
  {
e37f346e3   Jens Axboe   [PATCH] as-iosche...
253
  	struct request *alias;
ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
254

9e2585a8a   Jens Axboe   [PATCH] as-iosche...
255
  	while ((unlikely(alias = elv_rb_add(RQ_RB_ROOT(ad, rq), rq)))) {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
256
  		as_move_to_dispatch(ad, alias);
ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
257
258
259
  		as_antic_stop(ad);
  	}
  }
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
260
  /* Remove @rq from the sort tree for its direction. */
  static inline void as_del_rq_rb(struct as_data *ad, struct request *rq)
  {
  	elv_rb_del(RQ_RB_ROOT(ad, rq), rq);
  }
  
  /*
   * IO Scheduler proper
   */
  
  /* Maximum distance the disk will go backward for a request. */
  #define MAXBACK		(1024 * 1024)

  /* Cost multiplier applied to a backward seek (see as_choose_req). */
  #define BACK_PENALTY	2
  
  /*
   * as_choose_req selects the preferred one of two requests of the same data_dir
   * ignoring time - eg. timeouts, which is the job of as_dispatch_request
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
280
281
  static struct request *
  as_choose_req(struct as_data *ad, struct request *rq1, struct request *rq2)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
282
283
284
285
286
  {
  	int data_dir;
  	sector_t last, s1, s2, d1, d2;
  	int r1_wrap=0, r2_wrap=0;	/* requests are behind the disk head */
  	const sector_t maxback = MAXBACK;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
287
288
289
290
  	if (rq1 == NULL || rq1 == rq2)
  		return rq2;
  	if (rq2 == NULL)
  		return rq1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
291

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
292
  	data_dir = rq_is_sync(rq1);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
293
294
  
  	last = ad->last_sector[data_dir];
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
295
296
  	s1 = rq1->sector;
  	s2 = rq2->sector;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
297

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
298
  	BUG_ON(data_dir != rq_is_sync(rq2));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
  
  	/*
  	 * Strict one way elevator _except_ in the case where we allow
  	 * short backward seeks which are biased as twice the cost of a
  	 * similar forward seek.
  	 */
  	if (s1 >= last)
  		d1 = s1 - last;
  	else if (s1+maxback >= last)
  		d1 = (last - s1)*BACK_PENALTY;
  	else {
  		r1_wrap = 1;
  		d1 = 0; /* shut up, gcc */
  	}
  
  	if (s2 >= last)
  		d2 = s2 - last;
  	else if (s2+maxback >= last)
  		d2 = (last - s2)*BACK_PENALTY;
  	else {
  		r2_wrap = 1;
  		d2 = 0;
  	}
  
  	/* Found required data */
  	if (!r1_wrap && r2_wrap)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
325
  		return rq1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
326
  	else if (!r2_wrap && r1_wrap)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
327
  		return rq2;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
328
329
330
  	else if (r1_wrap && r2_wrap) {
  		/* both behind the head */
  		if (s1 <= s2)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
331
  			return rq1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
332
  		else
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
333
  			return rq2;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
334
335
336
337
  	}
  
  	/* Both requests in front of the head */
  	if (d1 < d2)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
338
  		return rq1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
339
  	else if (d2 < d1)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
340
  		return rq2;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
341
342
  	else {
  		if (s1 >= s2)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
343
  			return rq1;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
344
  		else
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
345
  			return rq2;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
346
347
348
349
  	}
  }
  
  /*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
350
   * as_find_next_rq finds the next request after @prev in elevator order.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
351
352
353
   * this with as_choose_req form the basis for how the scheduler chooses
   * what request to process next. Anticipation works on top of this.
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
354
355
  static struct request *
  as_find_next_rq(struct as_data *ad, struct request *last)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
356
  {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
357
358
  	struct rb_node *rbnext = rb_next(&last->rb_node);
  	struct rb_node *rbprev = rb_prev(&last->rb_node);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
359
  	struct request *next = NULL, *prev = NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
360

e37f346e3   Jens Axboe   [PATCH] as-iosche...
361
  	BUG_ON(RB_EMPTY_NODE(&last->rb_node));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
362
363
  
  	if (rbprev)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
364
  		prev = rb_entry_rq(rbprev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
365
366
  
  	if (rbnext)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
367
  		next = rb_entry_rq(rbnext);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
368
  	else {
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
369
  		const int data_dir = rq_is_sync(last);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
370

e37f346e3   Jens Axboe   [PATCH] as-iosche...
371
372
  		rbnext = rb_first(&ad->sort_list[data_dir]);
  		if (rbnext && rbnext != &last->rb_node)
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
373
  			next = rb_entry_rq(rbnext);
e37f346e3   Jens Axboe   [PATCH] as-iosche...
374
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
375

e37f346e3   Jens Axboe   [PATCH] as-iosche...
376
  	return as_choose_req(ad, next, prev);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
  }
  
  /*
   * anticipatory scheduling functions follow
   */
  
  /*
   * as_antic_expired reports whether anticipation has run for at least
   * ad->antic_expire jiffies since ad->antic_start.
   *
   * The elapsed time is taken as an absolute difference so that jiffy wraps,
   * and disks which have been idle for 0x80000000 jiffies, are handled.
   *
   * Returns 1 if expired, 0 otherwise.
   */
  static int as_antic_expired(struct as_data *ad)
  {
  	long elapsed = jiffies - ad->antic_start;

  	if (unlikely(elapsed < 0))
  		elapsed = -elapsed;

  	return elapsed >= ad->antic_expire;
  }
  
  /*
   * as_antic_waitnext starts anticipating that a nice request will soon be
   * submitted. See also as_antic_waitreq
   */
  static void as_antic_waitnext(struct as_data *ad)
  {
  	unsigned long timeout;
  
  	BUG_ON(ad->antic_status != ANTIC_OFF
  			&& ad->antic_status != ANTIC_WAIT_REQ);
  
  	timeout = ad->antic_start + ad->antic_expire;
  
  	mod_timer(&ad->antic_timer, timeout);
  
  	ad->antic_status = ANTIC_WAIT_NEXT;
  }
  
  /*
   * as_antic_waitreq starts anticipating. The anticipation is not timed
   * until the request we are anticipating on has finished, so that the
   * timing hopefully starts when the candidate process wakes up.
   *
   * From ANTIC_OFF: if there is no io_context, or its IO has already
   * finished, go straight to as_antic_waitnext(); otherwise enter
   * ANTIC_WAIT_REQ. In any other state nothing changes.
   */
  static void as_antic_waitreq(struct as_data *ad)
  {
  	BUG_ON(ad->antic_status == ANTIC_FINISHED);

  	if (ad->antic_status != ANTIC_OFF)
  		return;

  	if (ad->io_context && !ad->ioc_finished)
  		ad->antic_status = ANTIC_WAIT_REQ;
  	else
  		as_antic_waitnext(ad);
  }
  
  /*
   * This is called directly by the functions in this file to stop anticipation.
   * We kill the timer and schedule a call to the request_fn asap.
   *
   * Only acts when the state is ANTIC_WAIT_REQ or ANTIC_WAIT_NEXT; the timer
   * is deleted only in the latter case. The state then becomes
   * ANTIC_FINISHED and antic_work is queued via kblockd.
   */
  static void as_antic_stop(struct as_data *ad)
  {
  	int status = ad->antic_status;

  	if (status != ANTIC_WAIT_REQ && status != ANTIC_WAIT_NEXT)
  		return;

  	if (status == ANTIC_WAIT_NEXT)
  		del_timer(&ad->antic_timer);
  	ad->antic_status = ANTIC_FINISHED;
  	/* see as_work_handler */
  	kblockd_schedule_work(ad->q, &ad->antic_work);
  }
  
  /*
   * as_antic_timeout is the timer function set by as_antic_waitnext.
   */
  static void as_antic_timeout(unsigned long data)
  {
  	struct request_queue *q = (struct request_queue *)data;
  	struct as_data *ad = q->elevator->elevator_data;
  	unsigned long flags;
  
  	spin_lock_irqsave(q->queue_lock, flags);
  	if (ad->antic_status == ANTIC_WAIT_REQ
  			|| ad->antic_status == ANTIC_WAIT_NEXT) {
521f3bbdb   Jens Axboe   io_context sharin...
464
465
466
  		struct as_io_context *aic;
  		spin_lock(&ad->io_context->lock);
  		aic = ad->io_context->aic;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
467
468
  
  		ad->antic_status = ANTIC_FINISHED;
18887ad91   Jens Axboe   block: make kbloc...
469
  		kblockd_schedule_work(q, &ad->antic_work);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
470
471
  
  		if (aic->ttime_samples == 0) {
f5b3db001   Nick Piggin   [PATCH] as: coope...
472
  			/* process anticipated on has exited or timed out*/
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
473
474
  			ad->exit_prob = (7*ad->exit_prob + 256)/8;
  		}
f5b3db001   Nick Piggin   [PATCH] as: coope...
475
476
477
478
  		if (!test_bit(AS_TASK_RUNNING, &aic->state)) {
  			/* process not "saved" by a cooperating request */
  			ad->exit_no_coop = (7*ad->exit_no_coop + 256)/8;
  		}
521f3bbdb   Jens Axboe   io_context sharin...
479
  		spin_unlock(&ad->io_context->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
480
481
482
  	}
  	spin_unlock_irqrestore(q->queue_lock, flags);
  }
f5b3db001   Nick Piggin   [PATCH] as: coope...
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
  /*
   * Fold a new thinktime sample @ttime into the decaying averages kept in
   * @aic. The first sample of a context (ttime_samples == 0) is also folded
   * into the queue-wide "new process" thinktime in @ad, and decays
   * ad->exit_prob.
   *
   * All averages are fixed point with 1.0 == 1<<8, and each update keeps
   * 7/8 of the old value.
   */
  static void as_update_thinktime(struct as_data *ad, struct as_io_context *aic,
  				unsigned long ttime)
  {
  	/* the sample, scaled to fixed point */
  	const unsigned long sample = 256*ttime;

  	if (!aic->ttime_samples) {
  		ad->new_ttime_total = (7*ad->new_ttime_total + sample) / 8;
  		ad->new_ttime_mean = ad->new_ttime_total / 256;

  		ad->exit_prob = (7*ad->exit_prob)/8;
  	}

  	aic->ttime_samples = (7*aic->ttime_samples + 256) / 8;
  	aic->ttime_total = (7*aic->ttime_total + sample) / 8;
  	/* +128 rounds the quotient */
  	aic->ttime_mean = (aic->ttime_total + 128) / aic->ttime_samples;
  }
  
  /*
   * Fold a new seek distance sample @sdist into the decaying averages kept
   * in @aic. The first sample of a context (seek_samples == 0) is also
   * folded, unclamped, into the queue-wide "new process" seek mean in @ad.
   *
   * Averages are fixed point with 256 as 1.0; each update keeps 7/8 of the
   * old value.
   */
  static void as_update_seekdist(struct as_data *ad, struct as_io_context *aic,
  				sector_t sdist)
  {
  	u64 rounded;
  	int slack;

  	if (!aic->seek_samples) {
  		ad->new_seek_total = (7*ad->new_seek_total + 256*(u64)sdist)/8;
  		ad->new_seek_mean = ad->new_seek_total / 256;
  	}

  	/*
  	 * Don't allow the seek distance to get too large from the
  	 * odd fragment, pagein, etc. The allowance above four times the
  	 * current mean is larger while there are few samples
  	 * (second&third seek).
  	 */
  	slack = (aic->seek_samples <= 60) ? 2*1024*1024 : 2*1024*64;
  	sdist = min(sdist, (aic->seek_mean * 4) + slack);

  	aic->seek_samples = (7*aic->seek_samples + 256) / 8;
  	aic->seek_total = (7*aic->seek_total + (u64)256*sdist) / 8;

  	/* rounded division: seek_total / seek_samples */
  	rounded = aic->seek_total + (aic->seek_samples/2);
  	do_div(rounded, aic->seek_samples);
  	aic->seek_mean = (sector_t)rounded;
  }
  
  /*
   * as_update_iohist keeps a decaying histogram of IO thinktimes, and
   * updates @aic->ttime_mean based on that. It is called when a new
   * request is queued.
   */
  static void as_update_iohist(struct as_data *ad, struct as_io_context *aic,
  				struct request *rq)
  {
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
532
  	int data_dir = rq_is_sync(rq);
f5b3db001   Nick Piggin   [PATCH] as: coope...
533
534
535
536
537
  	unsigned long thinktime = 0;
  	sector_t seek_dist;
  
  	if (aic == NULL)
  		return;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
538
  	if (data_dir == BLK_RW_SYNC) {
f5b3db001   Nick Piggin   [PATCH] as: coope...
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
  		unsigned long in_flight = atomic_read(&aic->nr_queued)
  					+ atomic_read(&aic->nr_dispatched);
  		spin_lock(&aic->lock);
  		if (test_bit(AS_TASK_IORUNNING, &aic->state) ||
  			test_bit(AS_TASK_IOSTARTED, &aic->state)) {
  			/* Calculate read -> read thinktime */
  			if (test_bit(AS_TASK_IORUNNING, &aic->state)
  							&& in_flight == 0) {
  				thinktime = jiffies - aic->last_end_request;
  				thinktime = min(thinktime, MAX_THINKTIME-1);
  			}
  			as_update_thinktime(ad, aic, thinktime);
  
  			/* Calculate read -> read seek distance */
  			if (aic->last_request_pos < rq->sector)
  				seek_dist = rq->sector - aic->last_request_pos;
  			else
  				seek_dist = aic->last_request_pos - rq->sector;
  			as_update_seekdist(ad, aic, seek_dist);
  		}
  		aic->last_request_pos = rq->sector + rq->nr_sectors;
  		set_bit(AS_TASK_IOSTARTED, &aic->state);
  		spin_unlock(&aic->lock);
  	}
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
564
565
566
567
  /*
   * as_close_req decides if one request is considered "close" to the
   * previous one issued.
   */
f5b3db001   Nick Piggin   [PATCH] as: coope...
568
  static int as_close_req(struct as_data *ad, struct as_io_context *aic,
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
569
  			struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
570
  {
c6a632a2b   Nick Piggin   as: fix antic_exp...
571
  	unsigned long delay;	/* jiffies */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
572
  	sector_t last = ad->last_sector[ad->batch_data_dir];
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
573
  	sector_t next = rq->sector;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
574
  	sector_t delta; /* acceptable close offset (in sectors) */
f5b3db001   Nick Piggin   [PATCH] as: coope...
575
  	sector_t s;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
576
577
578
579
  
  	if (ad->antic_status == ANTIC_OFF || !ad->ioc_finished)
  		delay = 0;
  	else
c6a632a2b   Nick Piggin   as: fix antic_exp...
580
  		delay = jiffies - ad->antic_start;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
581

f5b3db001   Nick Piggin   [PATCH] as: coope...
582
583
  	if (delay == 0)
  		delta = 8192;
c6a632a2b   Nick Piggin   as: fix antic_exp...
584
  	else if (delay <= (20 * HZ / 1000) && delay <= ad->antic_expire)
f5b3db001   Nick Piggin   [PATCH] as: coope...
585
  		delta = 8192 << delay;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
586
587
  	else
  		return 1;
f5b3db001   Nick Piggin   [PATCH] as: coope...
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
  	if ((last <= next + (delta>>1)) && (next <= last + delta))
  		return 1;
  
  	if (last < next)
  		s = next - last;
  	else
  		s = last - next;
  
  	if (aic->seek_samples == 0) {
  		/*
  		 * Process has just started IO. Use past statistics to
  		 * gauge success possibility
  		 */
  		if (ad->new_seek_mean > s) {
  			/* this request is better than what we're expecting */
  			return 1;
  		}
  
  	} else {
  		if (aic->seek_mean > s) {
  			/* this request is better than what we're expecting */
  			return 1;
  		}
  	}
  
  	return 0;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
614
615
616
617
618
619
620
621
622
623
624
  }
  
  /*
   * as_can_break_anticipation returns true if we have been anticipating this
   * request.
   *
   * It also returns true if the process against which we are anticipating
   * submits a write - that's presumably an fsync, O_SYNC write, etc. We want to
   * dispatch it ASAP, because we know that application will not be submitting
   * any new reads.
   *
f5b3db001   Nick Piggin   [PATCH] as: coope...
625
   * If the task which has submitted the request has exited, break anticipation.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
626
627
628
   *
   * If this task has queued some other IO, do not enter enticipation.
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
629
  static int as_can_break_anticipation(struct as_data *ad, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
630
631
632
  {
  	struct io_context *ioc;
  	struct as_io_context *aic;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
633
634
635
  
  	ioc = ad->io_context;
  	BUG_ON(!ioc);
521f3bbdb   Jens Axboe   io_context sharin...
636
  	spin_lock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
637

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
638
  	if (rq && ioc == RQ_IOC(rq)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
639
  		/* request from same process */
521f3bbdb   Jens Axboe   io_context sharin...
640
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
641
642
643
644
645
646
647
648
  		return 1;
  	}
  
  	if (ad->ioc_finished && as_antic_expired(ad)) {
  		/*
  		 * In this situation status should really be FINISHED,
  		 * however the timer hasn't had the chance to run yet.
  		 */
521f3bbdb   Jens Axboe   io_context sharin...
649
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
650
651
652
653
  		return 1;
  	}
  
  	aic = ioc->aic;
521f3bbdb   Jens Axboe   io_context sharin...
654
655
  	if (!aic) {
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
656
  		return 0;
521f3bbdb   Jens Axboe   io_context sharin...
657
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
658

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
659
660
  	if (atomic_read(&aic->nr_queued) > 0) {
  		/* process has more requests queued */
521f3bbdb   Jens Axboe   io_context sharin...
661
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
662
663
664
665
666
  		return 1;
  	}
  
  	if (atomic_read(&aic->nr_dispatched) > 0) {
  		/* process has more requests dispatched */
521f3bbdb   Jens Axboe   io_context sharin...
667
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
668
669
  		return 1;
  	}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
670
  	if (rq && rq_is_sync(rq) && as_close_req(ad, aic, rq)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
671
672
673
  		/*
  		 * Found a close request that is not one of ours.
  		 *
f5b3db001   Nick Piggin   [PATCH] as: coope...
674
675
  		 * This makes close requests from another process update
  		 * our IO history. Is generally useful when there are
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
676
677
678
  		 * two or more cooperating processes working in the same
  		 * area.
  		 */
f5b3db001   Nick Piggin   [PATCH] as: coope...
679
680
681
682
683
684
  		if (!test_bit(AS_TASK_RUNNING, &aic->state)) {
  			if (aic->ttime_samples == 0)
  				ad->exit_prob = (7*ad->exit_prob + 256)/8;
  
  			ad->exit_no_coop = (7*ad->exit_no_coop)/8;
  		}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
685
  		as_update_iohist(ad, aic, rq);
521f3bbdb   Jens Axboe   io_context sharin...
686
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
687
688
  		return 1;
  	}
f5b3db001   Nick Piggin   [PATCH] as: coope...
689
690
691
692
  	if (!test_bit(AS_TASK_RUNNING, &aic->state)) {
  		/* process anticipated on has exited */
  		if (aic->ttime_samples == 0)
  			ad->exit_prob = (7*ad->exit_prob + 256)/8;
521f3bbdb   Jens Axboe   io_context sharin...
693
694
  		if (ad->exit_no_coop > 128) {
  			spin_unlock(&ioc->lock);
f5b3db001   Nick Piggin   [PATCH] as: coope...
695
  			return 1;
521f3bbdb   Jens Axboe   io_context sharin...
696
  		}
f5b3db001   Nick Piggin   [PATCH] as: coope...
697
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
698
699
  
  	if (aic->ttime_samples == 0) {
521f3bbdb   Jens Axboe   io_context sharin...
700
701
  		if (ad->new_ttime_mean > ad->antic_expire) {
  			spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
702
  			return 1;
521f3bbdb   Jens Axboe   io_context sharin...
703
704
705
  		}
  		if (ad->exit_prob * ad->exit_no_coop > 128*256) {
  			spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
706
  			return 1;
521f3bbdb   Jens Axboe   io_context sharin...
707
  		}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
708
709
  	} else if (aic->ttime_mean > ad->antic_expire) {
  		/* the process thinks too much between requests */
521f3bbdb   Jens Axboe   io_context sharin...
710
  		spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
711
712
  		return 1;
  	}
521f3bbdb   Jens Axboe   io_context sharin...
713
  	spin_unlock(&ioc->lock);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
714
715
716
717
  	return 0;
  }
  
  /*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
718
   * as_can_anticipate indicates whether we should either run rq
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
719
720
   * or keep anticipating a better request.
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
721
  static int as_can_anticipate(struct as_data *ad, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
722
  {
f7d7b7a7a   Jens Axboe   block: as/cfq ssd...
723
  #if 0 /* disable for now, we need to check tag level as well */
a68bbddba   Jens Axboe   block: add queue ...
724
725
726
  	/*
  	 * SSD device without seek penalty, disable idling
  	 */
f7d7b7a7a   Jens Axboe   block: as/cfq ssd...
727
  	if (blk_queue_nonrot(ad->q)) axman
a68bbddba   Jens Axboe   block: add queue ...
728
  		return 0;
f7d7b7a7a   Jens Axboe   block: as/cfq ssd...
729
  #endif
a68bbddba   Jens Axboe   block: add queue ...
730

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
731
732
733
734
735
736
737
738
739
740
741
  	if (!ad->io_context)
  		/*
  		 * Last request submitted was a write
  		 */
  		return 0;
  
  	if (ad->antic_status == ANTIC_FINISHED)
  		/*
  		 * Don't restart if we have just finished. Run the next request
  		 */
  		return 0;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
742
  	if (as_can_break_anticipation(ad, rq))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
743
744
745
746
747
748
749
750
751
752
753
  		/*
  		 * This request is a good candidate. Don't keep anticipating,
  		 * run it.
  		 */
  		return 0;
  
  	/*
  	 * OK from here, we haven't finished, and don't have a decent request!
  	 * Status is either ANTIC_OFF so start waiting,
  	 * ANTIC_WAIT_REQ so continue waiting for request to finish
  	 * or ANTIC_WAIT_NEXT so continue waiting for an acceptable request.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
754
755
756
757
  	 */
  
  	return 1;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
758
  /*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
759
   * as_update_rq must be called whenever a request (rq) is added to
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
760
761
762
   * the sort_list. This function keeps caches up to date, and checks if the
   * request might be one we are "anticipating"
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
763
  static void as_update_rq(struct as_data *ad, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
764
  {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
765
  	const int data_dir = rq_is_sync(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
766

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
767
768
  	/* keep the next_rq cache up to date */
  	ad->next_rq[data_dir] = as_choose_req(ad, rq, ad->next_rq[data_dir]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
769
770
771
772
773
774
775
776
  
  	/*
  	 * have we been anticipating this request?
  	 * or does it come from the same process as the one we are anticipating
  	 * for?
  	 */
  	if (ad->antic_status == ANTIC_WAIT_REQ
  			|| ad->antic_status == ANTIC_WAIT_NEXT) {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
777
  		if (as_can_break_anticipation(ad, rq))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
778
779
780
781
782
783
784
785
786
  			as_antic_stop(ad);
  	}
  }
  
  /*
   * Gathers timings and resizes the write batch automatically
   */
  static void update_write_batch(struct as_data *ad)
  {
1d6bfbdf3   Jens Axboe   as-iosched: get r...
787
  	unsigned long batch = ad->batch_expire[BLK_RW_ASYNC];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
  	long write_time;
  
  	write_time = (jiffies - ad->current_batch_expires) + batch;
  	if (write_time < 0)
  		write_time = 0;
  
  	if (write_time > batch && !ad->write_batch_idled) {
  		if (write_time > batch * 3)
  			ad->write_batch_count /= 2;
  		else
  			ad->write_batch_count--;
  	} else if (write_time < batch && ad->current_write_count == 0) {
  		if (batch > write_time * 3)
  			ad->write_batch_count *= 2;
  		else
  			ad->write_batch_count++;
  	}
  
  	if (ad->write_batch_count < 1)
  		ad->write_batch_count = 1;
  }
  
  /*
   * as_completed_request is to be called when a request has completed and
   * returned something to the requesting process, be it an error or data.
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
814
  static void as_completed_request(struct request_queue *q, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
815
816
  {
  	struct as_data *ad = q->elevator->elevator_data;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
817
818
  
  	WARN_ON(!list_empty(&rq->queuelist));
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
819
  	if (RQ_STATE(rq) != AS_RQ_REMOVED) {
12e003681   Arjan van de Ven   Use WARN() in block/
820
821
  		WARN(1, "rq->state %d
  ", RQ_STATE(rq));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
822
823
  		goto out;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
824
  	if (ad->changed_batch && ad->nr_dispatched == 1) {
d585d0b9d   Divyesh Shah   block: Fix the st...
825
826
  		ad->current_batch_expires = jiffies +
  					ad->batch_expire[ad->batch_data_dir];
18887ad91   Jens Axboe   block: make kbloc...
827
  		kblockd_schedule_work(q, &ad->antic_work);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
828
  		ad->changed_batch = 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
829
  		if (ad->batch_data_dir == BLK_RW_SYNC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
830
831
832
833
834
835
836
837
838
839
  			ad->new_batch = 1;
  	}
  	WARN_ON(ad->nr_dispatched == 0);
  	ad->nr_dispatched--;
  
  	/*
  	 * Start counting the batch from when a request of that direction is
  	 * actually serviced. This should help devices with big TCQ windows
  	 * and writeback caches
  	 */
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
840
  	if (ad->new_batch && ad->batch_data_dir == rq_is_sync(rq)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
841
842
  		update_write_batch(ad);
  		ad->current_batch_expires = jiffies +
1d6bfbdf3   Jens Axboe   as-iosched: get r...
843
  				ad->batch_expire[BLK_RW_SYNC];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
844
845
  		ad->new_batch = 0;
  	}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
846
  	if (ad->io_context == RQ_IOC(rq) && ad->io_context) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
847
848
849
850
851
852
853
854
855
856
  		ad->antic_start = jiffies;
  		ad->ioc_finished = 1;
  		if (ad->antic_status == ANTIC_WAIT_REQ) {
  			/*
  			 * We were waiting on this request, now anticipate
  			 * the next one
  			 */
  			as_antic_waitnext(ad);
  		}
  	}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
857
  	as_put_io_context(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
858
  out:
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
859
  	RQ_SET_STATE(rq, AS_RQ_POSTSCHED);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
860
861
862
863
864
865
866
867
  }
  
  /*
   * as_remove_queued_request removes a request from the pre dispatch queue
   * without updating refcounts. It is expected the caller will drop the
   * reference unless it replaces the request at somepart of the elevator
   * (ie. the dispatch queue)
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
868
869
  static void as_remove_queued_request(struct request_queue *q,
  				     struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
870
  {
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
871
  	const int data_dir = rq_is_sync(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
872
  	struct as_data *ad = q->elevator->elevator_data;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
873
  	struct io_context *ioc;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
874

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
875
  	WARN_ON(RQ_STATE(rq) != AS_RQ_QUEUED);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
876

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
877
878
879
880
  	ioc = RQ_IOC(rq);
  	if (ioc && ioc->aic) {
  		BUG_ON(!atomic_read(&ioc->aic->nr_queued));
  		atomic_dec(&ioc->aic->nr_queued);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
881
882
883
  	}
  
  	/*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
884
  	 * Update the "next_rq" cache if we are about to remove its
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
885
886
  	 * entry
  	 */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
887
888
  	if (ad->next_rq[data_dir] == rq)
  		ad->next_rq[data_dir] = as_find_next_rq(ad, rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
889

d4f2f4629   Jens Axboe   [PATCH] as-iosche...
890
  	rq_fifo_clear(rq);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
891
  	as_del_rq_rb(ad, rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
892
893
894
  }
  
  /*
   * as_fifo_expired returns 0 if there are no expired requests on the fifo,
   * 1 otherwise.  It is ratelimited so that we only perform the check once per
   * `fifo_expire' interval.  Otherwise a large number of expired requests
   * would create a hopeless seekstorm.
   *
   * See as_antic_expired comment.
   */
  static int as_fifo_expired(struct as_data *ad, int adir)
  {
  	struct request *oldest;
  	long since_check = jiffies - ad->last_check_fifo[adir];

  	/* use the magnitude of the interval if it came out negative */
  	if (unlikely(since_check < 0))
  		since_check = -since_check;

  	/* ratelimit: checked less than one fifo_expire interval ago */
  	if (since_check < ad->fifo_expire[adir])
  		return 0;

  	ad->last_check_fifo[adir] = jiffies;

  	if (list_empty(&ad->fifo_list[adir]))
  		return 0;

  	/* only the request at the head of the fifo is examined */
  	oldest = rq_entry_fifo(ad->fifo_list[adir].next);

  	return time_after(jiffies, rq_fifo_time(oldest));
  }
  
  /*
   * as_batch_expired returns true if the current batch has expired. A batch
   * is a set of reads or a set of writes.
   */
  static inline int as_batch_expired(struct as_data *ad)
  {
  	if (ad->changed_batch || ad->new_batch)
  		return 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
930
  	if (ad->batch_data_dir == BLK_RW_SYNC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
931
932
933
934
935
936
937
938
939
940
  		/* TODO! add a check so a complete fifo gets written? */
  		return time_after(jiffies, ad->current_batch_expires);
  
  	return time_after(jiffies, ad->current_batch_expires)
  		|| ad->current_write_count == 0;
  }
  
  /*
   * move an entry to dispatch queue
   */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
941
  static void as_move_to_dispatch(struct as_data *ad, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
942
  {
9e2585a8a   Jens Axboe   [PATCH] as-iosche...
943
  	const int data_dir = rq_is_sync(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
944

e37f346e3   Jens Axboe   [PATCH] as-iosche...
945
  	BUG_ON(RB_EMPTY_NODE(&rq->rb_node));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
946
947
948
949
950
951
  
  	as_antic_stop(ad);
  	ad->antic_status = ANTIC_OFF;
  
  	/*
  	 * This has to be set in order to be correctly updated by
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
952
  	 * as_find_next_rq
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
953
954
  	 */
  	ad->last_sector[data_dir] = rq->sector + rq->nr_sectors;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
955
  	if (data_dir == BLK_RW_SYNC) {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
956
  		struct io_context *ioc = RQ_IOC(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
957
  		/* In case we have to anticipate after this */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
958
  		copy_io_context(&ad->io_context, &ioc);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
959
960
961
962
963
964
965
966
967
968
  	} else {
  		if (ad->io_context) {
  			put_io_context(ad->io_context);
  			ad->io_context = NULL;
  		}
  
  		if (ad->current_write_count != 0)
  			ad->current_write_count--;
  	}
  	ad->ioc_finished = 0;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
969
  	ad->next_rq[data_dir] = as_find_next_rq(ad, rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
970
971
972
973
  
  	/*
  	 * take it off the sort and fifo list, add to dispatch queue
  	 */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
974
  	as_remove_queued_request(ad->q, rq);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
975
  	WARN_ON(RQ_STATE(rq) != AS_RQ_QUEUED);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
976

b4878f245   Jens Axboe   [PATCH] 02/05: up...
977
  	elv_dispatch_sort(ad->q, rq);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
978
979
980
  	RQ_SET_STATE(rq, AS_RQ_DISPATCHED);
  	if (RQ_IOC(rq) && RQ_IOC(rq)->aic)
  		atomic_inc(&RQ_IOC(rq)->aic->nr_dispatched);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
981
982
983
984
985
986
987
988
  	ad->nr_dispatched++;
  }
  
  /*
   * as_dispatch_request selects the best request according to
   * read/write expire, batch expire, etc, and moves it to the dispatch
   * queue. Returns 1 if a request was found, 0 otherwise.
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
989
  static int as_dispatch_request(struct request_queue *q, int force)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
990
  {
b4878f245   Jens Axboe   [PATCH] 02/05: up...
991
  	struct as_data *ad = q->elevator->elevator_data;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
992
993
  	const int reads = !list_empty(&ad->fifo_list[BLK_RW_SYNC]);
  	const int writes = !list_empty(&ad->fifo_list[BLK_RW_ASYNC]);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
994
  	struct request *rq;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
995

b4878f245   Jens Axboe   [PATCH] 02/05: up...
996
997
998
999
  	if (unlikely(force)) {
  		/*
  		 * Forced dispatch, accounting is useless.  Reset
  		 * accounting states and dump fifo_lists.  Note that
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1000
  		 * batch_data_dir is reset to BLK_RW_SYNC to avoid
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1001
1002
1003
1004
  		 * screwing write batch accounting as write batch
  		 * accounting occurs on W->R transition.
  		 */
  		int dispatched = 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1005
  		ad->batch_data_dir = BLK_RW_SYNC;
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1006
1007
  		ad->changed_batch = 0;
  		ad->new_batch = 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1008
1009
  		while (ad->next_rq[BLK_RW_SYNC]) {
  			as_move_to_dispatch(ad, ad->next_rq[BLK_RW_SYNC]);
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1010
1011
  			dispatched++;
  		}
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1012
  		ad->last_check_fifo[BLK_RW_SYNC] = jiffies;
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1013

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1014
1015
  		while (ad->next_rq[BLK_RW_ASYNC]) {
  			as_move_to_dispatch(ad, ad->next_rq[BLK_RW_ASYNC]);
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1016
1017
  			dispatched++;
  		}
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1018
  		ad->last_check_fifo[BLK_RW_ASYNC] = jiffies;
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1019
1020
1021
  
  		return dispatched;
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1022
  	/* Signal that the write batch was uncontended, so we can't time it */
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1023
  	if (ad->batch_data_dir == BLK_RW_ASYNC && !reads) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1024
1025
1026
1027
1028
1029
1030
1031
1032
  		if (ad->current_write_count == 0 || !writes)
  			ad->write_batch_idled = 1;
  	}
  
  	if (!(reads || writes)
  		|| ad->antic_status == ANTIC_WAIT_REQ
  		|| ad->antic_status == ANTIC_WAIT_NEXT
  		|| ad->changed_batch)
  		return 0;
f5b3db001   Nick Piggin   [PATCH] as: coope...
1033
  	if (!(reads && writes && as_batch_expired(ad))) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1034
1035
1036
  		/*
  		 * batch is still running or no reads or no writes
  		 */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1037
  		rq = ad->next_rq[ad->batch_data_dir];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1038

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1039
1040
  		if (ad->batch_data_dir == BLK_RW_SYNC && ad->antic_expire) {
  			if (as_fifo_expired(ad, BLK_RW_SYNC))
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1041
  				goto fifo_expired;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1042
  			if (as_can_anticipate(ad, rq)) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1043
1044
1045
1046
  				as_antic_waitreq(ad);
  				return 0;
  			}
  		}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1047
  		if (rq) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1048
1049
1050
  			/* we have a "next request" */
  			if (reads && !writes)
  				ad->current_batch_expires =
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1051
  					jiffies + ad->batch_expire[BLK_RW_SYNC];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
  			goto dispatch_request;
  		}
  	}
  
  	/*
  	 * at this point we are not running a batch. select the appropriate
  	 * data direction (read / write)
  	 */
  
  	if (reads) {
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1062
  		BUG_ON(RB_EMPTY_ROOT(&ad->sort_list[BLK_RW_SYNC]));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1063

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1064
  		if (writes && ad->batch_data_dir == BLK_RW_SYNC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1065
1066
1067
1068
  			/*
  			 * Last batch was a read, switch to writes
  			 */
  			goto dispatch_writes;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1069
  		if (ad->batch_data_dir == BLK_RW_ASYNC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1070
1071
1072
  			WARN_ON(ad->new_batch);
  			ad->changed_batch = 1;
  		}
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1073
1074
  		ad->batch_data_dir = BLK_RW_SYNC;
  		rq = rq_entry_fifo(ad->fifo_list[BLK_RW_SYNC].next);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
  		ad->last_check_fifo[ad->batch_data_dir] = jiffies;
  		goto dispatch_request;
  	}
  
  	/*
  	 * the last batch was a read
  	 */
  
  	if (writes) {
  dispatch_writes:
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1085
  		BUG_ON(RB_EMPTY_ROOT(&ad->sort_list[BLK_RW_ASYNC]));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1086

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1087
  		if (ad->batch_data_dir == BLK_RW_SYNC) {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1088
1089
1090
1091
1092
1093
1094
1095
1096
  			ad->changed_batch = 1;
  
  			/*
  			 * new_batch might be 1 when the queue runs out of
  			 * reads. A subsequent submission of a write might
  			 * cause a change of batch before the read is finished.
  			 */
  			ad->new_batch = 0;
  		}
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1097
  		ad->batch_data_dir = BLK_RW_ASYNC;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1098
1099
  		ad->current_write_count = ad->write_batch_count;
  		ad->write_batch_idled = 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1100
1101
  		rq = rq_entry_fifo(ad->fifo_list[BLK_RW_ASYNC].next);
  		ad->last_check_fifo[BLK_RW_ASYNC] = jiffies;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
  		goto dispatch_request;
  	}
  
  	BUG();
  	return 0;
  
  dispatch_request:
  	/*
  	 * If a request has expired, service it.
  	 */
  
  	if (as_fifo_expired(ad, ad->batch_data_dir)) {
  fifo_expired:
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1115
  		rq = rq_entry_fifo(ad->fifo_list[ad->batch_data_dir].next);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1116
1117
1118
1119
1120
1121
1122
  	}
  
  	if (ad->changed_batch) {
  		WARN_ON(ad->new_batch);
  
  		if (ad->nr_dispatched)
  			return 0;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1123
  		if (ad->batch_data_dir == BLK_RW_ASYNC)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1124
  			ad->current_batch_expires = jiffies +
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1125
  					ad->batch_expire[BLK_RW_ASYNC];
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1126
1127
1128
1129
1130
1131
1132
  		else
  			ad->new_batch = 1;
  
  		ad->changed_batch = 0;
  	}
  
  	/*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1133
  	 * rq is the selected appropriate request.
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1134
  	 */
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1135
  	as_move_to_dispatch(ad, rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1136
1137
1138
  
  	return 1;
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1139
  /*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1140
   * add rq to rbtree and fifo
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1141
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1142
  static void as_add_request(struct request_queue *q, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1143
  {
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1144
  	struct as_data *ad = q->elevator->elevator_data;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1145
  	int data_dir;
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1146
  	RQ_SET_STATE(rq, AS_RQ_NEW);
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1147

9e2585a8a   Jens Axboe   [PATCH] as-iosche...
1148
  	data_dir = rq_is_sync(rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1149

b5deef901   Jens Axboe   [PATCH] Make sure...
1150
  	rq->elevator_private = as_get_io_context(q->node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1151

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1152
1153
1154
  	if (RQ_IOC(rq)) {
  		as_update_iohist(ad, RQ_IOC(rq)->aic, rq);
  		atomic_inc(&RQ_IOC(rq)->aic->nr_queued);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1155
  	}
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1156
  	as_add_rq_rb(ad, rq);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1157

ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
1158
  	/*
8896f3c03   Aaron Carroll   as-iosched: fix i...
1159
  	 * set expire time and add to fifo list
ef9be1d33   Tejun Heo   [BLOCK] as-iosche...
1160
  	 */
d4f2f4629   Jens Axboe   [PATCH] as-iosche...
1161
1162
  	rq_set_fifo_time(rq, jiffies + ad->fifo_expire[data_dir]);
  	list_add_tail(&rq->queuelist, &ad->fifo_list[data_dir]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1163

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1164
1165
  	as_update_rq(ad, rq); /* keep state machine up to date */
  	RQ_SET_STATE(rq, AS_RQ_QUEUED);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1166
  }
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1167
  static void as_activate_request(struct request_queue *q, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1168
  {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1169
1170
1171
1172
  	WARN_ON(RQ_STATE(rq) != AS_RQ_DISPATCHED);
  	RQ_SET_STATE(rq, AS_RQ_REMOVED);
  	if (RQ_IOC(rq) && RQ_IOC(rq)->aic)
  		atomic_dec(&RQ_IOC(rq)->aic->nr_dispatched);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1173
  }
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1174
  static void as_deactivate_request(struct request_queue *q, struct request *rq)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1175
  {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1176
1177
1178
1179
  	WARN_ON(RQ_STATE(rq) != AS_RQ_REMOVED);
  	RQ_SET_STATE(rq, AS_RQ_DISPATCHED);
  	if (RQ_IOC(rq) && RQ_IOC(rq)->aic)
  		atomic_inc(&RQ_IOC(rq)->aic->nr_dispatched);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1180
1181
1182
1183
1184
1185
1186
1187
  }
  
  /*
   * as_queue_empty tells us if there are requests left in the device. It may
   * not be the case that a driver can get the next request even if the queue
   * is not empty - it is used in the block layer to check for plugging and
   * merging opportunities
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1188
  static int as_queue_empty(struct request_queue *q)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1189
1190
  {
  	struct as_data *ad = q->elevator->elevator_data;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1191
1192
  	return list_empty(&ad->fifo_list[BLK_RW_ASYNC])
  		&& list_empty(&ad->fifo_list[BLK_RW_SYNC]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1193
  }
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1194
  static int
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1195
  as_merge(struct request_queue *q, struct request **req, struct bio *bio)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1196
1197
1198
1199
  {
  	struct as_data *ad = q->elevator->elevator_data;
  	sector_t rb_key = bio->bi_sector + bio_sectors(bio);
  	struct request *__rq;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1200
1201
1202
1203
  
  	/*
  	 * check for front merge
  	 */
e37f346e3   Jens Axboe   [PATCH] as-iosche...
1204
  	__rq = elv_rb_find(&ad->sort_list[bio_data_dir(bio)], rb_key);
9817064b6   Jens Axboe   [PATCH] elevator:...
1205
1206
1207
  	if (__rq && elv_rq_merge_ok(__rq, bio)) {
  		*req = __rq;
  		return ELEVATOR_FRONT_MERGE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1208
1209
1210
  	}
  
  	return ELEVATOR_NO_MERGE;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1211
  }
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1212
1213
  static void as_merged_request(struct request_queue *q, struct request *req,
  			      int type)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1214
1215
  {
  	struct as_data *ad = q->elevator->elevator_data;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1216
1217
  
  	/*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1218
1219
  	 * if the merge was a front merge, we need to reposition request
  	 */
e37f346e3   Jens Axboe   [PATCH] as-iosche...
1220
  	if (type == ELEVATOR_FRONT_MERGE) {
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1221
1222
  		as_del_rq_rb(ad, req);
  		as_add_rq_rb(ad, req);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1223
1224
1225
1226
1227
1228
  		/*
  		 * Note! At this stage of this and the next function, our next
  		 * request may not be optimal - eg the request may have "grown"
  		 * behind the disk head. We currently don't bother adjusting.
  		 */
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1229
  }
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1230
  static void as_merged_requests(struct request_queue *q, struct request *req,
f5b3db001   Nick Piggin   [PATCH] as: coope...
1231
  			 	struct request *next)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1232
  {
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1233
  	/*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1234
1235
  	 * if next expires before rq, assign its expire time to arq
  	 * and move into next position (next will be deleted) in fifo
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1236
  	 */
d4f2f4629   Jens Axboe   [PATCH] as-iosche...
1237
1238
1239
1240
  	if (!list_empty(&req->queuelist) && !list_empty(&next->queuelist)) {
  		if (time_before(rq_fifo_time(next), rq_fifo_time(req))) {
  			list_move(&req->queuelist, &next->queuelist);
  			rq_set_fifo_time(req, rq_fifo_time(next));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1241
1242
1243
1244
  		}
  	}
  
  	/*
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1245
1246
1247
  	 * kill knowledge of next, this one is a goner
  	 */
  	as_remove_queued_request(q, next);
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1248
  	as_put_io_context(next);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1249

8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1250
  	RQ_SET_STATE(next, AS_RQ_MERGED);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
  }
  
  /*
   * This is executed in a "deferred" process context, by kblockd. It calls the
   * driver's request_fn so the driver can submit that request.
   *
   * IMPORTANT! This guy will reenter the elevator, so set up all queue global
   * state before calling, and don't rely on any state over calls.
   *
   * FIXME! dispatch queue is not a queue at all!
   */
65f27f384   David Howells   WorkStruct: Pass ...
1262
  static void as_work_handler(struct work_struct *work)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1263
  {
65f27f384   David Howells   WorkStruct: Pass ...
1264
  	struct as_data *ad = container_of(work, struct as_data, antic_work);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1265

a7f557923   Tejun Heo   block: kill blk_s...
1266
  	blk_run_queue(ad->q);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1267
  }
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1268
  static int as_may_queue(struct request_queue *q, int rw)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1269
1270
1271
1272
1273
1274
  {
  	int ret = ELV_MQUEUE_MAY;
  	struct as_data *ad = q->elevator->elevator_data;
  	struct io_context *ioc;
  	if (ad->antic_status == ANTIC_WAIT_REQ ||
  			ad->antic_status == ANTIC_WAIT_NEXT) {
b5deef901   Jens Axboe   [PATCH] Make sure...
1275
  		ioc = as_get_io_context(q->node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1276
1277
1278
1279
1280
1281
1282
  		if (ad->io_context == ioc)
  			ret = ELV_MQUEUE_MUST;
  		put_io_context(ioc);
  	}
  
  	return ret;
  }
b374d18a4   Jens Axboe   block: get rid of...
1283
  static void as_exit_queue(struct elevator_queue *e)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1284
1285
1286
1287
  {
  	struct as_data *ad = e->elevator_data;
  
  	del_timer_sync(&ad->antic_timer);
64d01dc9e   Cheng Renquan   block: use cancel...
1288
  	cancel_work_sync(&ad->antic_work);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1289

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1290
1291
  	BUG_ON(!list_empty(&ad->fifo_list[BLK_RW_SYNC]));
  	BUG_ON(!list_empty(&ad->fifo_list[BLK_RW_ASYNC]));
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1292

1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1293
  	put_io_context(ad->io_context);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1294
1295
1296
1297
  	kfree(ad);
  }
  
  /*
8a8e674cb   Jens Axboe   [PATCH] as-iosche...
1298
   * initialize elevator private data (as_data).
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1299
   */
165125e1e   Jens Axboe   [BLOCK] Get rid o...
1300
  static void *as_init_queue(struct request_queue *q)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1301
1302
  {
  	struct as_data *ad;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1303

94f6030ca   Christoph Lameter   Slab allocators: ...
1304
  	ad = kmalloc_node(sizeof(*ad), GFP_KERNEL | __GFP_ZERO, q->node);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1305
  	if (!ad)
bc1c11697   Jens Axboe   [PATCH] elevator ...
1306
  		return NULL;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1307
1308
  
  	ad->q = q; /* Identify what queue the data belongs to */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1309
1310
1311
1312
  	/* anticipatory scheduling helpers */
  	ad->antic_timer.function = as_antic_timeout;
  	ad->antic_timer.data = (unsigned long)q;
  	init_timer(&ad->antic_timer);
65f27f384   David Howells   WorkStruct: Pass ...
1313
  	INIT_WORK(&ad->antic_work, as_work_handler);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1314

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1315
1316
1317
1318
1319
1320
  	INIT_LIST_HEAD(&ad->fifo_list[BLK_RW_SYNC]);
  	INIT_LIST_HEAD(&ad->fifo_list[BLK_RW_ASYNC]);
  	ad->sort_list[BLK_RW_SYNC] = RB_ROOT;
  	ad->sort_list[BLK_RW_ASYNC] = RB_ROOT;
  	ad->fifo_expire[BLK_RW_SYNC] = default_read_expire;
  	ad->fifo_expire[BLK_RW_ASYNC] = default_write_expire;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1321
  	ad->antic_expire = default_antic_expire;
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1322
1323
  	ad->batch_expire[BLK_RW_SYNC] = default_read_batch_expire;
  	ad->batch_expire[BLK_RW_ASYNC] = default_write_batch_expire;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1324

1d6bfbdf3   Jens Axboe   as-iosched: get r...
1325
1326
  	ad->current_batch_expires = jiffies + ad->batch_expire[BLK_RW_SYNC];
  	ad->write_batch_count = ad->batch_expire[BLK_RW_ASYNC] / 10;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1327
1328
  	if (ad->write_batch_count < 2)
  		ad->write_batch_count = 2;
bc1c11697   Jens Axboe   [PATCH] elevator ...
1329
  	return ad;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1330
1331
1332
1333
1334
  }
  
  /*
   * sysfs parts below
   */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1335
1336
1337
1338
  
  /*
   * Print @var into @page as an unsigned decimal number followed by a
   * newline.
   *
   * Returns the number of characters written, not counting the
   * terminating NUL.
   */
  static ssize_t
  as_var_show(unsigned int var, char *page)
  {
  	/* %u matches the unsigned parameter; %d would show large values as negative */
  	return sprintf(page, "%u\n", var);
  }
  
  /*
   * Parse the leading base-10 number in @page and store it in *@var.
   *
   * The position where parsing stopped is not inspected, and @count is
   * returned unconditionally.
   */
  static ssize_t
  as_var_store(unsigned long *var, const char *page, size_t count)
  {
  	char *end;

  	*var = simple_strtoul(page, &end, 10);

  	return count;
  }
b374d18a4   Jens Axboe   block: get rid of...
1350
  static ssize_t est_time_show(struct elevator_queue *e, char *page)
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1351
  {
3d1ab40f4   Al Viro   [PATCH] elevator_...
1352
  	struct as_data *ad = e->elevator_data;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1353
  	int pos = 0;
f5b3db001   Nick Piggin   [PATCH] as: coope...
1354
1355
1356
1357
1358
1359
1360
  	pos += sprintf(page+pos, "%lu %% exit probability
  ",
  				100*ad->exit_prob/256);
  	pos += sprintf(page+pos, "%lu %% probability of exiting without a "
  				"cooperating process submitting IO
  ",
  				100*ad->exit_no_coop/256);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1361
1362
  	pos += sprintf(page+pos, "%lu ms new thinktime
  ", ad->new_ttime_mean);
f5b3db001   Nick Piggin   [PATCH] as: coope...
1363
1364
1365
  	pos += sprintf(page+pos, "%llu sectors new seek distance
  ",
  				(unsigned long long)ad->new_seek_mean);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1366
1367
1368
1369
1370
  
  	return pos;
  }
  
  #define SHOW_FUNCTION(__FUNC, __VAR)				\
b374d18a4   Jens Axboe   block: get rid of...
1371
  static ssize_t __FUNC(struct elevator_queue *e, char *page)	\
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1372
  {								\
3d1ab40f4   Al Viro   [PATCH] elevator_...
1373
  	struct as_data *ad = e->elevator_data;			\
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1374
1375
  	return as_var_show(jiffies_to_msecs((__VAR)), (page));	\
  }
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1376
1377
  SHOW_FUNCTION(as_read_expire_show, ad->fifo_expire[BLK_RW_SYNC]);
  SHOW_FUNCTION(as_write_expire_show, ad->fifo_expire[BLK_RW_ASYNC]);
e572ec7e4   Al Viro   [PATCH] fix rmmod...
1378
  SHOW_FUNCTION(as_antic_expire_show, ad->antic_expire);
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1379
1380
  SHOW_FUNCTION(as_read_batch_expire_show, ad->batch_expire[BLK_RW_SYNC]);
  SHOW_FUNCTION(as_write_batch_expire_show, ad->batch_expire[BLK_RW_ASYNC]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1381
1382
1383
  #undef SHOW_FUNCTION
  
  #define STORE_FUNCTION(__FUNC, __PTR, MIN, MAX)				\
b374d18a4   Jens Axboe   block: get rid of...
1384
  static ssize_t __FUNC(struct elevator_queue *e, const char *page, size_t count)	\
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1385
  {									\
3d1ab40f4   Al Viro   [PATCH] elevator_...
1386
1387
  	struct as_data *ad = e->elevator_data;				\
  	int ret = as_var_store(__PTR, (page), count);			\
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1388
1389
1390
1391
1392
1393
1394
  	if (*(__PTR) < (MIN))						\
  		*(__PTR) = (MIN);					\
  	else if (*(__PTR) > (MAX))					\
  		*(__PTR) = (MAX);					\
  	*(__PTR) = msecs_to_jiffies(*(__PTR));				\
  	return ret;							\
  }
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1395
1396
1397
  STORE_FUNCTION(as_read_expire_store, &ad->fifo_expire[BLK_RW_SYNC], 0, INT_MAX);
  STORE_FUNCTION(as_write_expire_store,
  			&ad->fifo_expire[BLK_RW_ASYNC], 0, INT_MAX);
e572ec7e4   Al Viro   [PATCH] fix rmmod...
1398
1399
  STORE_FUNCTION(as_antic_expire_store, &ad->antic_expire, 0, INT_MAX);
  STORE_FUNCTION(as_read_batch_expire_store,
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1400
  			&ad->batch_expire[BLK_RW_SYNC], 0, INT_MAX);
e572ec7e4   Al Viro   [PATCH] fix rmmod...
1401
  STORE_FUNCTION(as_write_batch_expire_store,
1d6bfbdf3   Jens Axboe   as-iosched: get r...
1402
  			&ad->batch_expire[BLK_RW_ASYNC], 0, INT_MAX);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1403
  #undef STORE_FUNCTION
e572ec7e4   Al Viro   [PATCH] fix rmmod...
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
  /*
   * AS_ATTR(attr) builds a read/write attribute called "attr" (readable by
   * everyone, writable by the owner) wired to as_<attr>_show and
   * as_<attr>_store.
   */
  #define AS_ATTR(attr)							\
  	__ATTR(attr, S_IRUGO | S_IWUSR, as_##attr##_show, as_##attr##_store)

  /*
   * Attribute table for this scheduler: the read-only est_time report
   * followed by the five tunables, terminated by __ATTR_NULL.
   */
  static struct elv_fs_entry as_attrs[] = {
  	__ATTR_RO(est_time),

  	AS_ATTR(read_expire),
  	AS_ATTR(write_expire),
  	AS_ATTR(antic_expire),
  	AS_ATTR(read_batch_expire),
  	AS_ATTR(write_batch_expire),

  	__ATTR_NULL
  };
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1416
1417
1418
1419
1420
  static struct elevator_type iosched_as = {
  	.ops = {
  		.elevator_merge_fn = 		as_merge,
  		.elevator_merged_fn =		as_merged_request,
  		.elevator_merge_req_fn =	as_merged_requests,
b4878f245   Jens Axboe   [PATCH] 02/05: up...
1421
1422
1423
  		.elevator_dispatch_fn =		as_dispatch_request,
  		.elevator_add_req_fn =		as_add_request,
  		.elevator_activate_req_fn =	as_activate_request,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1424
1425
1426
  		.elevator_deactivate_req_fn = 	as_deactivate_request,
  		.elevator_queue_empty_fn =	as_queue_empty,
  		.elevator_completed_req_fn =	as_completed_request,
e37f346e3   Jens Axboe   [PATCH] as-iosche...
1427
1428
  		.elevator_former_req_fn =	elv_rb_former_request,
  		.elevator_latter_req_fn =	elv_rb_latter_request,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1429
1430
1431
  		.elevator_may_queue_fn =	as_may_queue,
  		.elevator_init_fn =		as_init_queue,
  		.elevator_exit_fn =		as_exit_queue,
e17a9489b   Al Viro   [PATCH] stop elv_...
1432
  		.trim =				as_trim,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1433
  	},
3d1ab40f4   Al Viro   [PATCH] elevator_...
1434
  	.elevator_attrs = as_attrs,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1435
1436
1437
1438
1439
1440
  	.elevator_name = "anticipatory",
  	.elevator_owner = THIS_MODULE,
  };
  
  /*
   * Module init: register the anticipatory elevator type.
   * Always returns 0.
   */
  static int __init as_init(void)
  {
  	elv_register(&iosched_as);
  	return 0;
  }
  
  /*
   * Module exit: unregister the elevator type, then, if ioc_count still
   * reads non-zero, block until the on-stack completion published through
   * ioc_gone is signalled.  Ends with synchronize_rcu().
   */
  static void __exit as_exit(void)
  {
  	DECLARE_COMPLETION_ONSTACK(all_gone);

  	elv_unregister(&iosched_as);

  	/*
  	 * Publish the completion first: the store to ioc_gone has to be
  	 * visible before ioc_count is read below.
  	 */
  	ioc_gone = &all_gone;
  	smp_wmb();

  	if (elv_ioc_count_read(ioc_count) != 0)
  		wait_for_completion(&all_gone);

  	synchronize_rcu();
  }
  
  /*
   * Register as_init/as_exit as this module's init and exit routines and
   * declare the module's author, license and description.
   */
  module_init(as_init);
  module_exit(as_exit);
  
  MODULE_AUTHOR("Nick Piggin");
  MODULE_LICENSE("GPL");
  MODULE_DESCRIPTION("anticipatory IO scheduler");