kernel/trace/ring_buffer.c

  /*
   * Generic ring buffer
   *
   * Copyright (C) 2008 Steven Rostedt <srostedt@redhat.com>
   */
  #include <linux/ring_buffer.h>
#include <linux/trace_clock.h>
#include <linux/spinlock.h>
#include <linux/debugfs.h>
#include <linux/uaccess.h>
#include <linux/hardirq.h>
#include <linux/kmemcheck.h>
#include <linux/module.h>
#include <linux/percpu.h>
#include <linux/mutex.h>
#include <linux/slab.h>
#include <linux/init.h>
#include <linux/hash.h>
#include <linux/list.h>
#include <linux/cpu.h>
#include <linux/fs.h>

#include <asm/local.h>
#include "trace.h"

/*
 * The ring buffer header is special. We must manually keep it up to date.
 */
  int ring_buffer_print_entry_header(struct trace_seq *s)
  {
  	int ret;

	ret = trace_seq_printf(s, "# compressed entry header\n");
	ret = trace_seq_printf(s, "\ttype_len    :    5 bits\n");
	ret = trace_seq_printf(s, "\ttime_delta  :   27 bits\n");
	ret = trace_seq_printf(s, "\tarray       :   32 bits\n");
	ret = trace_seq_printf(s, "\n");
	ret = trace_seq_printf(s, "\tpadding     : type == %d\n",
			       RINGBUF_TYPE_PADDING);
	ret = trace_seq_printf(s, "\ttime_extend : type == %d\n",
			       RINGBUF_TYPE_TIME_EXTEND);
	ret = trace_seq_printf(s, "\tdata max type_len  == %d\n",
			       RINGBUF_TYPE_DATA_TYPE_LEN_MAX);
  
  	return ret;
  }
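
/*
 * Illustrative sketch, not part of the original file: reading the
 * compressed header fields described above straight from an event.
 * The rb_sketch_* name is hypothetical; only the ring_buffer_event
 * layout from <linux/ring_buffer.h> is assumed.
 */
static inline void rb_sketch_show_event_header(struct trace_seq *s,
					       struct ring_buffer_event *event)
{
	trace_seq_printf(s, "type_len=%u time_delta=%u\n",
			 (unsigned int)event->type_len,
			 (unsigned int)event->time_delta);
}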
  
  /*
   * The ring buffer is made up of a list of pages. A separate list of pages is
   * allocated for each CPU. A writer may only write to a buffer that is
   * associated with the CPU it is currently executing on.  A reader may read
   * from any per cpu buffer.
   *
   * The reader is special. For each per cpu buffer, the reader has its own
   * reader page. When a reader has read the entire reader page, this reader
   * page is swapped with another page in the ring buffer.
   *
   * Now, as long as the writer is off the reader page, the reader can do what
   * ever it wants with that page. The writer will never write to that page
   * again (as long as it is out of the ring buffer).
   *
   * Here's some silly ASCII art.
   *
   *   +------+
   *   |reader|          RING BUFFER
   *   |page  |
   *   +------+        +---+   +---+   +---+
   *                   |   |-->|   |-->|   |
   *                   +---+   +---+   +---+
   *                     ^               |
   *                     |               |
   *                     +---------------+
   *
   *
   *   +------+
   *   |reader|          RING BUFFER
   *   |page  |------------------v
   *   +------+        +---+   +---+   +---+
   *                   |   |-->|   |-->|   |
   *                   +---+   +---+   +---+
   *                     ^               |
   *                     |               |
   *                     +---------------+
   *
   *
   *   +------+
   *   |reader|          RING BUFFER
   *   |page  |------------------v
   *   +------+        +---+   +---+   +---+
   *      ^            |   |-->|   |-->|   |
   *      |            +---+   +---+   +---+
   *      |                              |
   *      |                              |
   *      +------------------------------+
   *
   *
   *   +------+
   *   |buffer|          RING BUFFER
   *   |page  |------------------v
   *   +------+        +---+   +---+   +---+
   *      ^            |   |   |   |-->|   |
   *      |   New      +---+   +---+   +---+
   *      |  Reader------^               |
   *      |   page                       |
   *      +------------------------------+
   *
   *
   * After we make this swap, the reader can hand this page off to the splice
   * code and be done with it. It can even allocate a new page if it needs to
   * and swap that into the ring buffer.
   *
   * We will be using cmpxchg soon to make all this lockless.
   *
   */
  
  /*
   * A fast way to enable or disable all ring buffers is to
   * call tracing_on or tracing_off. Turning off the ring buffers
   * prevents all ring buffers from being recorded to.
   * Turning this switch on, makes it OK to write to the
   * ring buffer, if the ring buffer is enabled itself.
   *
   * There are three layers that must be on in order to write
   * to the ring buffer.
   *
   * 1) This global flag must be set.
   * 2) The ring buffer must be enabled for recording.
   * 3) The per cpu buffer must be enabled for recording.
   *
   * In case of an anomaly, this global flag has a bit set that
   * will permanently disable all ring buffers.
   */
  
  /*
   * Global flag to disable all recording to ring buffers
   *  This has two bits: ON, DISABLED
   *
   *  ON   DISABLED
   * ---- ----------
   *   0      0        : ring buffers are off
   *   1      0        : ring buffers are on
   *   X      1        : ring buffers are permanently disabled
   */
  
  enum {
  	RB_BUFFERS_ON_BIT	= 0,
  	RB_BUFFERS_DISABLED_BIT	= 1,
  };
  
  enum {
  	RB_BUFFERS_ON		= 1 << RB_BUFFERS_ON_BIT,
  	RB_BUFFERS_DISABLED	= 1 << RB_BUFFERS_DISABLED_BIT,
  };
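
/*
 * Illustrative sketch, not part of the original file: how the two
 * flag bits above combine, following the table in the comment. The
 * rb_sketch_* name is hypothetical.
 */
static inline int rb_sketch_buffers_writable(unsigned long flags)
{
	if (flags & RB_BUFFERS_DISABLED)
		return 0;			/* permanently disabled */
	return !!(flags & RB_BUFFERS_ON);	/* on only if the ON bit is set */
}
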
static unsigned long ring_buffer_flags __read_mostly = RB_BUFFERS_ON;

#define BUF_PAGE_HDR_SIZE offsetof(struct buffer_data_page, data)

  /**
   * tracing_on - enable all tracing buffers
   *
   * This function enables all tracing buffers that may have been
   * disabled with tracing_off.
   */
  void tracing_on(void)
  {
	set_bit(RB_BUFFERS_ON_BIT, &ring_buffer_flags);
}
EXPORT_SYMBOL_GPL(tracing_on);

/**
 * tracing_off - turn off all tracing buffers
 *
 * This function stops all tracing buffers from recording data.
 * It does not disable any overhead the tracers themselves may
 * be causing. This function simply causes all recording to
 * the ring buffers to fail.
 */
void tracing_off(void)
{
	clear_bit(RB_BUFFERS_ON_BIT, &ring_buffer_flags);
}
EXPORT_SYMBOL_GPL(tracing_off);
  
  /**
   * tracing_off_permanent - permanently disable ring buffers
   *
   * This function, once called, will disable all ring buffers
 * permanently.
 */
void tracing_off_permanent(void)
{
	set_bit(RB_BUFFERS_DISABLED_BIT, &ring_buffer_flags);
}

  /**
   * tracing_is_on - show state of ring buffers enabled
   */
  int tracing_is_on(void)
  {
  	return ring_buffer_flags == RB_BUFFERS_ON;
  }
  EXPORT_SYMBOL_GPL(tracing_is_on);

#define RB_EVNT_HDR_SIZE (offsetof(struct ring_buffer_event, array))
#define RB_ALIGNMENT		4U
#define RB_MAX_SMALL_DATA	(RB_ALIGNMENT * RINGBUF_TYPE_DATA_TYPE_LEN_MAX)
#define RB_EVNT_MIN_SIZE	8U	/* two 32bit words */

#if !defined(CONFIG_64BIT) || defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS)
# define RB_FORCE_8BYTE_ALIGNMENT	0
# define RB_ARCH_ALIGNMENT		RB_ALIGNMENT
#else
# define RB_FORCE_8BYTE_ALIGNMENT	1
# define RB_ARCH_ALIGNMENT		8U
#endif

/* define RINGBUF_TYPE_DATA for 'case RINGBUF_TYPE_DATA:' */
#define RINGBUF_TYPE_DATA 0 ... RINGBUF_TYPE_DATA_TYPE_LEN_MAX

enum {
	RB_LEN_TIME_EXTEND = 8,
	RB_LEN_TIME_STAMP = 16,
};

#define skip_time_extend(event) \
	((struct ring_buffer_event *)((char *)event + RB_LEN_TIME_EXTEND))

static inline int rb_null_event(struct ring_buffer_event *event)
{
	return event->type_len == RINGBUF_TYPE_PADDING && !event->time_delta;
}

static void rb_event_set_padding(struct ring_buffer_event *event)
{
	/* padding has a NULL time_delta */
	event->type_len = RINGBUF_TYPE_PADDING;
	event->time_delta = 0;
}

static unsigned
rb_event_data_length(struct ring_buffer_event *event)
{
	unsigned length;

	if (event->type_len)
		length = event->type_len * RB_ALIGNMENT;
	else
		length = event->array[0];
	return length + RB_EVNT_HDR_SIZE;
}

/*
 * Return the length of the given event. Will return
 * the length of the time extend if the event is a
 * time extend.
 */
static inline unsigned
rb_event_length(struct ring_buffer_event *event)
{
	switch (event->type_len) {
	case RINGBUF_TYPE_PADDING:
		if (rb_null_event(event))
			/* undefined */
			return -1;
		return  event->array[0] + RB_EVNT_HDR_SIZE;

	case RINGBUF_TYPE_TIME_EXTEND:
		return RB_LEN_TIME_EXTEND;

	case RINGBUF_TYPE_TIME_STAMP:
		return RB_LEN_TIME_STAMP;

	case RINGBUF_TYPE_DATA:
		return rb_event_data_length(event);
	default:
		BUG();
	}
	/* not hit */
	return 0;
}

  /*
   * Return total length of time extend and data,
   *   or just the event length for all other events.
   */
  static inline unsigned
  rb_event_ts_length(struct ring_buffer_event *event)
  {
  	unsigned len = 0;
  
  	if (event->type_len == RINGBUF_TYPE_TIME_EXTEND) {
  		/* time extends include the data event after it */
  		len = RB_LEN_TIME_EXTEND;
  		event = skip_time_extend(event);
  	}
  	return len + rb_event_length(event);
  }
/**
 * ring_buffer_event_length - return the length of the event
 * @event: the event to get the length of
 *
 * Returns the size of the data load of a data event.
 * If the event is something other than a data event, it
 * returns the size of the event itself. With the exception
 * of a TIME EXTEND, where it still returns the size of the
 * data load of the data event after it.
 */
unsigned ring_buffer_event_length(struct ring_buffer_event *event)
{
	unsigned length;

	if (event->type_len == RINGBUF_TYPE_TIME_EXTEND)
		event = skip_time_extend(event);

	length = rb_event_length(event);
	if (event->type_len > RINGBUF_TYPE_DATA_TYPE_LEN_MAX)
		return length;
	length -= RB_EVNT_HDR_SIZE;
	if (length > RB_MAX_SMALL_DATA + sizeof(event->array[0]))
		length -= sizeof(event->array[0]);
	return length;
}
EXPORT_SYMBOL_GPL(ring_buffer_event_length);

/* inline for ring buffer fast paths */
static void *
rb_event_data(struct ring_buffer_event *event)
{
	if (event->type_len == RINGBUF_TYPE_TIME_EXTEND)
		event = skip_time_extend(event);
	BUG_ON(event->type_len > RINGBUF_TYPE_DATA_TYPE_LEN_MAX);
	/* If length is in len field, then array[0] has the data */
	if (event->type_len)
		return (void *)&event->array[0];
	/* Otherwise length is in array[0] and array[1] has the data */
	return (void *)&event->array[1];
}

/**
 * ring_buffer_event_data - return the data of the event
 * @event: the event to get the data from
 */
void *ring_buffer_event_data(struct ring_buffer_event *event)
{
	return rb_event_data(event);
}
EXPORT_SYMBOL_GPL(ring_buffer_event_data);

#define for_each_buffer_cpu(buffer, cpu)		\
	for_each_cpu(cpu, buffer->cpumask)

#define TS_SHIFT	27
#define TS_MASK		((1ULL << TS_SHIFT) - 1)
#define TS_DELTA_TEST	(~TS_MASK)

/* Flag when events were overwritten */
#define RB_MISSED_EVENTS	(1 << 31)
/* Missed count stored at end */
#define RB_MISSED_STORED	(1 << 30)

  struct buffer_data_page {
	u64		 time_stamp;	/* page time stamp */
	local_t		 commit;	/* write committed index */
	unsigned char	 data[];	/* data of buffer page */
};

  /*
   * Note, the buffer_page list must be first. The buffer pages
   * are allocated in cache lines, which means that each buffer
   * page will be at the beginning of a cache line, and thus
   * the least significant bits will be zero. We use this to
   * add flags in the list struct pointers, to make the ring buffer
   * lockless.
   */
struct buffer_page {
	struct list_head list;		/* list of buffer pages */
	local_t		 write;		/* index for next write */
	unsigned	 read;		/* index for next read */
	local_t		 entries;	/* entries on this page */
	unsigned long	 real_end;	/* real end of data */
	struct buffer_data_page *page;	/* Actual data page */
};

  /*
   * The buffer page counters, write and entries, must be reset
   * atomically when crossing page boundaries. To synchronize this
   * update, two counters are inserted into the number. One is
   * the actual counter for the write position or count on the page.
   *
   * The other is a counter of updaters. Before an update happens
   * the update partition of the counter is incremented. This will
   * allow the updater to update the counter atomically.
   *
   * The counter is 20 bits, and the state data is 12.
   */
  #define RB_WRITE_MASK		0xfffff
  #define RB_WRITE_INTCNT		(1 << 20)
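
/*
 * Illustrative sketch, not part of the original file: splitting the
 * combined counter into its two parts, per the layout described above
 * (low 20 bits are the write index, upper 12 bits count updaters).
 * The rb_sketch_* names are hypothetical.
 */
static inline unsigned long rb_sketch_write_index(unsigned long write)
{
	return write & RB_WRITE_MASK;		/* position/count on the page */
}

static inline unsigned long rb_sketch_nr_updaters(unsigned long write)
{
	return write / RB_WRITE_INTCNT;		/* nested updaters in flight */
}
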
static void rb_init_page(struct buffer_data_page *bpage)
{
	local_set(&bpage->commit, 0);
}

  /**
   * ring_buffer_page_len - the size of data on the page.
   * @page: The page to read
   *
   * Returns the amount of data on the page, including buffer page header.
   */
size_t ring_buffer_page_len(void *page)
{
	return local_read(&((struct buffer_data_page *)page)->commit)
		+ BUF_PAGE_HDR_SIZE;
}

/*
 * Also stolen from mm/slob.c. Thanks to Mathieu Desnoyers for pointing
 * this issue out.
 */
static void free_buffer_page(struct buffer_page *bpage)
{
	free_page((unsigned long)bpage->page);
	kfree(bpage);
}
  
  /*
   * We need to fit the time_stamp delta into 27 bits.
   */
  static inline int test_time_stamp(u64 delta)
  {
  	if (delta & TS_DELTA_TEST)
  		return 1;
  	return 0;
  }
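
/*
 * Illustrative sketch, not part of the original file: how a full
 * timestamp splits against the 27-bit delta limit tested above.
 * The rb_sketch_* names are hypothetical.
 */
static inline u64 rb_sketch_ts_delta(u64 ts)
{
	return ts & TS_MASK;		/* low 27 bits fit in a time_delta */
}

static inline u64 rb_sketch_ts_top(u64 ts)
{
	return ts >> TS_SHIFT;		/* the rest needs a time extend event */
}
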
#define BUF_PAGE_SIZE (PAGE_SIZE - BUF_PAGE_HDR_SIZE)

/* Max payload is BUF_PAGE_SIZE - header (8bytes) */
#define BUF_MAX_DATA_SIZE (BUF_PAGE_SIZE - (sizeof(u32) * 2))

int ring_buffer_print_page_header(struct trace_seq *s)
{
	struct buffer_data_page field;
	int ret;

	ret = trace_seq_printf(s, "\tfield: u64 timestamp;\t"
			       "offset:0;\tsize:%u;\tsigned:%u;\n",
			       (unsigned int)sizeof(field.time_stamp),
			       (unsigned int)is_signed_type(u64));

	ret = trace_seq_printf(s, "\tfield: local_t commit;\t"
			       "offset:%u;\tsize:%u;\tsigned:%u;\n",
			       (unsigned int)offsetof(typeof(field), commit),
			       (unsigned int)sizeof(field.commit),
			       (unsigned int)is_signed_type(long));

	ret = trace_seq_printf(s, "\tfield: int overwrite;\t"
			       "offset:%u;\tsize:%u;\tsigned:%u;\n",
			       (unsigned int)offsetof(typeof(field), commit),
			       1,
			       (unsigned int)is_signed_type(long));

	ret = trace_seq_printf(s, "\tfield: char data;\t"
			       "offset:%u;\tsize:%u;\tsigned:%u;\n",
			       (unsigned int)offsetof(typeof(field), data),
			       (unsigned int)BUF_PAGE_SIZE,
			       (unsigned int)is_signed_type(char));

	return ret;
}

/*
 * head_page == tail_page && head == tail then buffer is empty.
 */
struct ring_buffer_per_cpu {
	int				cpu;
	atomic_t			record_disabled;
	struct ring_buffer		*buffer;
	raw_spinlock_t			reader_lock;	/* serialize readers */
	arch_spinlock_t			lock;
	struct lock_class_key		lock_key;
	struct list_head		*pages;
	struct buffer_page		*head_page;	/* read from head */
	struct buffer_page		*tail_page;	/* write to tail */
	struct buffer_page		*commit_page;	/* committed pages */
	struct buffer_page		*reader_page;
	unsigned long			lost_events;
	unsigned long			last_overrun;
	local_t				entries_bytes;
	local_t				commit_overrun;
	local_t				overrun;
	local_t				entries;
	local_t				committing;
	local_t				commits;
	unsigned long			read;
	unsigned long			read_bytes;
	u64				write_stamp;
	u64				read_stamp;
};
  
  struct ring_buffer {
	unsigned			pages;
	unsigned			flags;
	int				cpus;
	atomic_t			record_disabled;
	cpumask_var_t			cpumask;

	struct lock_class_key		*reader_lock_key;

	struct mutex			mutex;

	struct ring_buffer_per_cpu	**buffers;

#ifdef CONFIG_HOTPLUG_CPU
	struct notifier_block		cpu_notify;
#endif
	u64				(*clock)(void);
};
  
  struct ring_buffer_iter {
  	struct ring_buffer_per_cpu	*cpu_buffer;
  	unsigned long			head;
  	struct buffer_page		*head_page;
	struct buffer_page		*cache_reader_page;
	unsigned long			cache_read;
	u64				read_stamp;
};

  /* buffer may be either ring_buffer or ring_buffer_per_cpu */
  #define RB_WARN_ON(b, cond)						\
  	({								\
  		int _____ret = unlikely(cond);				\
  		if (_____ret) {						\
  			if (__same_type(*(b), struct ring_buffer_per_cpu)) { \
  				struct ring_buffer_per_cpu *__b =	\
  					(void *)b;			\
  				atomic_inc(&__b->buffer->record_disabled); \
  			} else						\
  				atomic_inc(&b->record_disabled);	\
  			WARN_ON(1);					\
  		}							\
  		_____ret;						\
	})

/* Up this if you want to test the TIME_EXTENTS and normalization */
#define DEBUG_SHIFT 0

static inline u64 rb_time_stamp(struct ring_buffer *buffer)
{
	/* shift to debug/test normalization and TIME_EXTENTS */
	return buffer->clock() << DEBUG_SHIFT;
}

u64 ring_buffer_time_stamp(struct ring_buffer *buffer, int cpu)
{
	u64 time;

	preempt_disable_notrace();
	time = rb_time_stamp(buffer);
  	preempt_enable_no_resched_notrace();
  
  	return time;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_time_stamp);
  
  void ring_buffer_normalize_time_stamp(struct ring_buffer *buffer,
  				      int cpu, u64 *ts)
  {
  	/* Just stupid testing the normalize function and deltas */
  	*ts >>= DEBUG_SHIFT;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_normalize_time_stamp);
  /*
   * Making the ring buffer lockless makes things tricky.
   * Writes only happen on the CPU that they are on, so they only
   * need to worry about interrupts. Reads, however, can happen on
   * any CPU.
   *
   * The reader page is always off the ring buffer, but when the
   * reader finishes with a page, it needs to swap its page with
   * a new one from the buffer. The reader needs to take from
   * the head (writes go to the tail). But if a writer is in overwrite
   * mode and wraps, it must push the head page forward.
   *
   * Here lies the problem.
   *
   * The reader must be careful to replace only the head page, and
   * not another one. As described at the top of the file in the
   * ASCII art, the reader sets its old page to point to the next
   * page after head. It then sets the page after head to point to
   * the old reader page. But if the writer moves the head page
   * during this operation, the reader could end up with the tail.
   *
   * We use cmpxchg to help prevent this race. We also do something
   * special with the page before head. We set the LSB to 1.
   *
   * When the writer must push the page forward, it will clear the
   * bit that points to the head page, move the head, and then set
   * the bit that points to the new head page.
   *
   * We also don't want an interrupt coming in and moving the head
   * page on another writer. Thus we use the second LSB to catch
   * that too. Thus:
   *
   * head->list->prev->next        bit 1          bit 0
   *                              -------        -------
   * Normal page                     0              0
   * Points to head page             0              1
   * New head page                   1              0
   *
   * Note we can not trust the prev pointer of the head page, because:
   *
   * +----+       +-----+        +-----+
   * |    |------>|  T  |---X--->|  N  |
   * |    |<------|     |        |     |
   * +----+       +-----+        +-----+
   *   ^                           ^ |
   *   |          +-----+          | |
   *   +----------|  R  |----------+ |
   *              |     |<-----------+
   *              +-----+
   *
   * Key:  ---X-->  HEAD flag set in pointer
   *         T      Tail page
   *         R      Reader page
   *         N      Next page
   *
   * (see __rb_reserve_next() to see where this happens)
   *
   *  What the above shows is that the reader just swapped out
   *  the reader page with a page in the buffer, but before it
   *  could make the new header point back to the new page added
   *  it was preempted by a writer. The writer moved forward onto
   *  the new page added by the reader and is about to move forward
   *  again.
   *
   *  You can see, it is legitimate for the previous pointer of
   *  the head (or any page) not to point back to itself. But only
   *  temporarily.
   */
  
  #define RB_PAGE_NORMAL		0UL
  #define RB_PAGE_HEAD		1UL
  #define RB_PAGE_UPDATE		2UL
  
  
  #define RB_FLAG_MASK		3UL
  
  /* PAGE_MOVED is not part of the mask */
  #define RB_PAGE_MOVED		4UL
  
  /*
   * rb_list_head - remove any bit
   */
  static struct list_head *rb_list_head(struct list_head *list)
  {
  	unsigned long val = (unsigned long)list;
  
  	return (struct list_head *)(val & ~RB_FLAG_MASK);
  }
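
/*
 * Illustrative sketch, not part of the original file: the complement
 * of rb_list_head() - pull out just the flag bits carried in the low
 * bits of a list pointer, per the table above. The rb_sketch_* name
 * is hypothetical.
 */
static inline unsigned long rb_sketch_list_flags(struct list_head *list)
{
	return (unsigned long)list & RB_FLAG_MASK;
}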
  
  /*
   * rb_is_head_page - test if the given page is the head page
   *
   * Because the reader may move the head_page pointer, we can
   * not trust what the head page is (it may be pointing to
   * the reader page). But if the next page is a header page,
   * its flags will be non zero.
   */
  static inline int
  rb_is_head_page(struct ring_buffer_per_cpu *cpu_buffer,
  		struct buffer_page *page, struct list_head *list)
  {
  	unsigned long val;
  
  	val = (unsigned long)list->next;
  
  	if ((val & ~RB_FLAG_MASK) != (unsigned long)&page->list)
  		return RB_PAGE_MOVED;
  
  	return val & RB_FLAG_MASK;
  }
  
  /*
   * rb_is_reader_page
   *
   * The unique thing about the reader page is that, if the
   * writer is ever on it, the previous pointer never points
   * back to the reader page.
   */
  static int rb_is_reader_page(struct buffer_page *page)
  {
  	struct list_head *list = page->list.prev;
  
  	return rb_list_head(list->next) != &page->list;
  }
  
  /*
   * rb_set_list_to_head - set a list_head to be pointing to head.
   */
  static void rb_set_list_to_head(struct ring_buffer_per_cpu *cpu_buffer,
  				struct list_head *list)
  {
  	unsigned long *ptr;
  
  	ptr = (unsigned long *)&list->next;
  	*ptr |= RB_PAGE_HEAD;
  	*ptr &= ~RB_PAGE_UPDATE;
  }
  
  /*
   * rb_head_page_activate - sets up head page
   */
  static void rb_head_page_activate(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	struct buffer_page *head;
  
  	head = cpu_buffer->head_page;
  	if (!head)
  		return;
  
  	/*
  	 * Set the previous list pointer to have the HEAD flag.
  	 */
  	rb_set_list_to_head(cpu_buffer, head->list.prev);
  }
  
  static void rb_list_head_clear(struct list_head *list)
  {
  	unsigned long *ptr = (unsigned long *)&list->next;
  
  	*ptr &= ~RB_FLAG_MASK;
  }
  
  /*
   * rb_head_page_deactivate - clears head page ptr (for free list)
   */
  static void
  rb_head_page_deactivate(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	struct list_head *hd;
  
  	/* Go through the whole list and clear any pointers found. */
  	rb_list_head_clear(cpu_buffer->pages);
  
  	list_for_each(hd, cpu_buffer->pages)
  		rb_list_head_clear(hd);
  }
  
  static int rb_head_page_set(struct ring_buffer_per_cpu *cpu_buffer,
  			    struct buffer_page *head,
  			    struct buffer_page *prev,
  			    int old_flag, int new_flag)
  {
  	struct list_head *list;
  	unsigned long val = (unsigned long)&head->list;
  	unsigned long ret;
  
  	list = &prev->list;
  
  	val &= ~RB_FLAG_MASK;
  	ret = cmpxchg((unsigned long *)&list->next,
  		      val | old_flag, val | new_flag);
  
  	/* check if the reader took the page */
  	if ((ret & ~RB_FLAG_MASK) != val)
  		return RB_PAGE_MOVED;
  
  	return ret & RB_FLAG_MASK;
  }
  
  static int rb_head_page_set_update(struct ring_buffer_per_cpu *cpu_buffer,
  				   struct buffer_page *head,
  				   struct buffer_page *prev,
  				   int old_flag)
  {
  	return rb_head_page_set(cpu_buffer, head, prev,
  				old_flag, RB_PAGE_UPDATE);
  }
  
  static int rb_head_page_set_head(struct ring_buffer_per_cpu *cpu_buffer,
  				 struct buffer_page *head,
  				 struct buffer_page *prev,
  				 int old_flag)
  {
  	return rb_head_page_set(cpu_buffer, head, prev,
  				old_flag, RB_PAGE_HEAD);
  }
  
  static int rb_head_page_set_normal(struct ring_buffer_per_cpu *cpu_buffer,
  				   struct buffer_page *head,
  				   struct buffer_page *prev,
  				   int old_flag)
  {
  	return rb_head_page_set(cpu_buffer, head, prev,
  				old_flag, RB_PAGE_NORMAL);
  }
  
  static inline void rb_inc_page(struct ring_buffer_per_cpu *cpu_buffer,
  			       struct buffer_page **bpage)
  {
  	struct list_head *p = rb_list_head((*bpage)->list.next);
  
  	*bpage = list_entry(p, struct buffer_page, list);
  }
  
  static struct buffer_page *
  rb_set_head_page(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	struct buffer_page *head;
  	struct buffer_page *page;
  	struct list_head *list;
  	int i;
  
  	if (RB_WARN_ON(cpu_buffer, !cpu_buffer->head_page))
  		return NULL;
  
  	/* sanity check */
  	list = cpu_buffer->pages;
  	if (RB_WARN_ON(cpu_buffer, rb_list_head(list->prev->next) != list))
  		return NULL;
  
  	page = head = cpu_buffer->head_page;
  	/*
  	 * It is possible that the writer moves the header behind
  	 * where we started, and we miss in one loop.
  	 * A second loop should grab the header, but we'll do
  	 * three loops just because I'm paranoid.
  	 */
  	for (i = 0; i < 3; i++) {
  		do {
  			if (rb_is_head_page(cpu_buffer, page, page->list.prev)) {
  				cpu_buffer->head_page = page;
  				return page;
  			}
  			rb_inc_page(cpu_buffer, &page);
  		} while (page != head);
  	}
  
  	RB_WARN_ON(cpu_buffer, 1);
  
  	return NULL;
  }
  
  static int rb_head_page_replace(struct buffer_page *old,
  				struct buffer_page *new)
  {
  	unsigned long *ptr = (unsigned long *)&old->list.prev->next;
  	unsigned long val;
  	unsigned long ret;
  
  	val = *ptr & ~RB_FLAG_MASK;
  	val |= RB_PAGE_HEAD;
  	ret = cmpxchg(ptr, val, (unsigned long)&new->list);
  
  	return ret == val;
  }
  
  /*
   * rb_tail_page_update - move the tail page forward
   *
   * Returns 1 if moved tail page, 0 if someone else did.
   */
  static int rb_tail_page_update(struct ring_buffer_per_cpu *cpu_buffer,
  			       struct buffer_page *tail_page,
  			       struct buffer_page *next_page)
  {
  	struct buffer_page *old_tail;
  	unsigned long old_entries;
  	unsigned long old_write;
  	int ret = 0;
  
  	/*
  	 * The tail page now needs to be moved forward.
  	 *
  	 * We need to reset the tail page, but without messing
  	 * with possible erasing of data brought in by interrupts
  	 * that have moved the tail page and are currently on it.
  	 *
  	 * We add a counter to the write field to denote this.
  	 */
  	old_write = local_add_return(RB_WRITE_INTCNT, &next_page->write);
  	old_entries = local_add_return(RB_WRITE_INTCNT, &next_page->entries);
  
  	/*
  	 * Just make sure we have seen our old_write and synchronize
  	 * with any interrupts that come in.
  	 */
  	barrier();
  
  	/*
  	 * If the tail page is still the same as what we think
  	 * it is, then it is up to us to update the tail
  	 * pointer.
  	 */
  	if (tail_page == cpu_buffer->tail_page) {
  		/* Zero the write counter */
  		unsigned long val = old_write & ~RB_WRITE_MASK;
  		unsigned long eval = old_entries & ~RB_WRITE_MASK;
  
  		/*
  		 * This will only succeed if an interrupt did
  		 * not come in and change it. In which case, we
  		 * do not want to modify it.
  		 *
  		 * We add (void) to let the compiler know that we do not care
  		 * about the return value of these functions. We use the
  		 * cmpxchg to only update if an interrupt did not already
  		 * do it for us. If the cmpxchg fails, we don't care.
  		 */
  		(void)local_cmpxchg(&next_page->write, old_write, val);
  		(void)local_cmpxchg(&next_page->entries, old_entries, eval);
  
  		/*
  		 * No need to worry about races with clearing out the commit.
  		 * it only can increment when a commit takes place. But that
  		 * only happens in the outer most nested commit.
  		 */
  		local_set(&next_page->page->commit, 0);
  
  		old_tail = cmpxchg(&cpu_buffer->tail_page,
  				   tail_page, next_page);
  
  		if (old_tail == tail_page)
  			ret = 1;
  	}
  
  	return ret;
  }
  
  static int rb_check_bpage(struct ring_buffer_per_cpu *cpu_buffer,
  			  struct buffer_page *bpage)
  {
  	unsigned long val = (unsigned long)bpage;
  
  	if (RB_WARN_ON(cpu_buffer, val & RB_FLAG_MASK))
  		return 1;
  
  	return 0;
  }
  
  /**
   * rb_check_list - make sure a pointer to a list has the last bits zero
   */
  static int rb_check_list(struct ring_buffer_per_cpu *cpu_buffer,
  			 struct list_head *list)
  {
  	if (RB_WARN_ON(cpu_buffer, rb_list_head(list->prev) != list->prev))
  		return 1;
  	if (RB_WARN_ON(cpu_buffer, rb_list_head(list->next) != list->next))
  		return 1;
  	return 0;
  }
  /**
   * rb_check_pages - integrity check of buffer pages
   * @cpu_buffer: CPU buffer with pages to test
   *
   * As a safety measure we check to make sure the data pages have not
   * been corrupted.
   */
  static int rb_check_pages(struct ring_buffer_per_cpu *cpu_buffer)
  {
	struct list_head *head = cpu_buffer->pages;
	struct buffer_page *bpage, *tmp;

	rb_head_page_deactivate(cpu_buffer);

	if (RB_WARN_ON(cpu_buffer, head->next->prev != head))
		return -1;
	if (RB_WARN_ON(cpu_buffer, head->prev->next != head))
		return -1;

	if (rb_check_list(cpu_buffer, head))
		return -1;

	list_for_each_entry_safe(bpage, tmp, head, list) {
		if (RB_WARN_ON(cpu_buffer,
			       bpage->list.next->prev != &bpage->list))
			return -1;
		if (RB_WARN_ON(cpu_buffer,
			       bpage->list.prev->next != &bpage->list))
			return -1;
		if (rb_check_list(cpu_buffer, &bpage->list))
			return -1;
	}

	rb_head_page_activate(cpu_buffer);

	return 0;
}

static int rb_allocate_pages(struct ring_buffer_per_cpu *cpu_buffer,
			     unsigned nr_pages)
{
	struct buffer_page *bpage, *tmp;
	LIST_HEAD(pages);
	unsigned i;

	WARN_ON(!nr_pages);

	for (i = 0; i < nr_pages; i++) {
		struct page *page;
		/*
		 * __GFP_NORETRY flag makes sure that the allocation fails
		 * gracefully without invoking oom-killer and the system is
		 * not destabilized.
		 */
		bpage = kzalloc_node(ALIGN(sizeof(*bpage), cache_line_size()),
				    GFP_KERNEL | __GFP_NORETRY,
				    cpu_to_node(cpu_buffer->cpu));
		if (!bpage)
			goto free_pages;

		rb_check_bpage(cpu_buffer, bpage);

		list_add(&bpage->list, &pages);

		page = alloc_pages_node(cpu_to_node(cpu_buffer->cpu),
					GFP_KERNEL | __GFP_NORETRY, 0);
		if (!page)
			goto free_pages;
		bpage->page = page_address(page);
		rb_init_page(bpage->page);
	}

	/*
	 * The ring buffer page list is a circular list that does not
	 * start and end with a list head. All page list items point to
	 * other pages.
	 */
	cpu_buffer->pages = pages.next;
	list_del(&pages);

	rb_check_pages(cpu_buffer);

	return 0;

 free_pages:
	list_for_each_entry_safe(bpage, tmp, &pages, list) {
		list_del_init(&bpage->list);
		free_buffer_page(bpage);
  	}
  	return -ENOMEM;
  }
  
  static struct ring_buffer_per_cpu *
  rb_allocate_cpu_buffer(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
	struct buffer_page *bpage;
	struct page *page;
	int ret;

	cpu_buffer = kzalloc_node(ALIGN(sizeof(*cpu_buffer), cache_line_size()),
				  GFP_KERNEL, cpu_to_node(cpu));
	if (!cpu_buffer)
		return NULL;

	cpu_buffer->cpu = cpu;
	cpu_buffer->buffer = buffer;
	raw_spin_lock_init(&cpu_buffer->reader_lock);
	lockdep_set_class(&cpu_buffer->reader_lock, buffer->reader_lock_key);
	cpu_buffer->lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;

	bpage = kzalloc_node(ALIGN(sizeof(*bpage), cache_line_size()),
			    GFP_KERNEL, cpu_to_node(cpu));
	if (!bpage)
		goto fail_free_buffer;

	rb_check_bpage(cpu_buffer, bpage);

	cpu_buffer->reader_page = bpage;
	page = alloc_pages_node(cpu_to_node(cpu), GFP_KERNEL, 0);
	if (!page)
		goto fail_free_reader;
	bpage->page = page_address(page);
	rb_init_page(bpage->page);

	INIT_LIST_HEAD(&cpu_buffer->reader_page->list);

	ret = rb_allocate_pages(cpu_buffer, buffer->pages);
	if (ret < 0)
		goto fail_free_reader;

	cpu_buffer->head_page
		= list_entry(cpu_buffer->pages, struct buffer_page, list);
	cpu_buffer->tail_page = cpu_buffer->commit_page = cpu_buffer->head_page;

	rb_head_page_activate(cpu_buffer);

	return cpu_buffer;

 fail_free_reader:
	free_buffer_page(cpu_buffer->reader_page);

   fail_free_buffer:
  	kfree(cpu_buffer);
  	return NULL;
  }
  
  static void rb_free_cpu_buffer(struct ring_buffer_per_cpu *cpu_buffer)
  {
	struct list_head *head = cpu_buffer->pages;
	struct buffer_page *bpage, *tmp;

	free_buffer_page(cpu_buffer->reader_page);

	rb_head_page_deactivate(cpu_buffer);

	if (head) {
		list_for_each_entry_safe(bpage, tmp, head, list) {
			list_del_init(&bpage->list);
			free_buffer_page(bpage);
		}
		bpage = list_entry(head, struct buffer_page, list);
		free_buffer_page(bpage);
	}

	kfree(cpu_buffer);
}

#ifdef CONFIG_HOTPLUG_CPU
static int rb_cpu_notify(struct notifier_block *self,
			 unsigned long action, void *hcpu);
#endif

/**
 * ring_buffer_alloc - allocate a new ring_buffer
 * @size: the size in bytes per cpu that is needed.
 * @flags: attributes to set for the ring buffer.
 *
 * Currently the only flag that is available is the RB_FL_OVERWRITE
 * flag. This flag means that the buffer will overwrite old data
 * when the buffer wraps. If this flag is not set, the buffer will
 * drop data when the tail hits the head.
 */
struct ring_buffer *__ring_buffer_alloc(unsigned long size, unsigned flags,
					struct lock_class_key *key)
{
	struct ring_buffer *buffer;
	int bsize;
	int cpu;

	/* keep it in its own cache line */
	buffer = kzalloc(ALIGN(sizeof(*buffer), cache_line_size()),
			 GFP_KERNEL);
	if (!buffer)
		return NULL;

	if (!alloc_cpumask_var(&buffer->cpumask, GFP_KERNEL))
		goto fail_free_buffer;

	buffer->pages = DIV_ROUND_UP(size, BUF_PAGE_SIZE);
	buffer->flags = flags;
	buffer->clock = trace_clock_local;
	buffer->reader_lock_key = key;

	/* need at least two pages */
	if (buffer->pages < 2)
		buffer->pages = 2;

	/*
	 * In case of non-hotplug cpu, if the ring-buffer is allocated
	 * in early initcall, it will not be notified of secondary cpus.
	 * In that off case, we need to allocate for all possible cpus.
	 */
#ifdef CONFIG_HOTPLUG_CPU
	get_online_cpus();
	cpumask_copy(buffer->cpumask, cpu_online_mask);
#else
	cpumask_copy(buffer->cpumask, cpu_possible_mask);
#endif
	buffer->cpus = nr_cpu_ids;

	bsize = sizeof(void *) * nr_cpu_ids;
	buffer->buffers = kzalloc(ALIGN(bsize, cache_line_size()),
				  GFP_KERNEL);
	if (!buffer->buffers)
		goto fail_free_cpumask;

	for_each_buffer_cpu(buffer, cpu) {
		buffer->buffers[cpu] =
			rb_allocate_cpu_buffer(buffer, cpu);
		if (!buffer->buffers[cpu])
			goto fail_free_buffers;
	}

#ifdef CONFIG_HOTPLUG_CPU
	buffer->cpu_notify.notifier_call = rb_cpu_notify;
	buffer->cpu_notify.priority = 0;
	register_cpu_notifier(&buffer->cpu_notify);
#endif

	put_online_cpus();

  	mutex_init(&buffer->mutex);
  
  	return buffer;
  
   fail_free_buffers:
  	for_each_buffer_cpu(buffer, cpu) {
  		if (buffer->buffers[cpu])
  			rb_free_cpu_buffer(buffer->buffers[cpu]);
  	}
  	kfree(buffer->buffers);

 fail_free_cpumask:
	free_cpumask_var(buffer->cpumask);
	put_online_cpus();

 fail_free_buffer:
	kfree(buffer);
	return NULL;
}
EXPORT_SYMBOL_GPL(__ring_buffer_alloc);

/**
 * ring_buffer_free - free a ring buffer.
 * @buffer: the buffer to free.
 */
void
ring_buffer_free(struct ring_buffer *buffer)
{
	int cpu;

	get_online_cpus();

#ifdef CONFIG_HOTPLUG_CPU
	unregister_cpu_notifier(&buffer->cpu_notify);
#endif

	for_each_buffer_cpu(buffer, cpu)
		rb_free_cpu_buffer(buffer->buffers[cpu]);

	put_online_cpus();

	kfree(buffer->buffers);
	free_cpumask_var(buffer->cpumask);

	kfree(buffer);
}
EXPORT_SYMBOL_GPL(ring_buffer_free);

void ring_buffer_set_clock(struct ring_buffer *buffer,
			   u64 (*clock)(void))
{
	buffer->clock = clock;
}

static void rb_reset_cpu(struct ring_buffer_per_cpu *cpu_buffer);

static void
rb_remove_pages(struct ring_buffer_per_cpu *cpu_buffer, unsigned nr_pages)
{
	struct buffer_page *bpage;
	struct list_head *p;
	unsigned i;

	raw_spin_lock_irq(&cpu_buffer->reader_lock);
	rb_head_page_deactivate(cpu_buffer);

	for (i = 0; i < nr_pages; i++) {
		if (RB_WARN_ON(cpu_buffer, list_empty(cpu_buffer->pages)))
			goto out;
		p = cpu_buffer->pages->next;
		bpage = list_entry(p, struct buffer_page, list);
		list_del_init(&bpage->list);
		free_buffer_page(bpage);
	}
	if (RB_WARN_ON(cpu_buffer, list_empty(cpu_buffer->pages)))
		goto out;

	rb_reset_cpu(cpu_buffer);
	rb_check_pages(cpu_buffer);

out:
	raw_spin_unlock_irq(&cpu_buffer->reader_lock);
}
  
  static void
  rb_insert_pages(struct ring_buffer_per_cpu *cpu_buffer,
  		struct list_head *pages, unsigned nr_pages)
  {
044fa782e   Steven Rostedt   ring-buffer: chan...
1236
  	struct buffer_page *bpage;
7a8e76a38   Steven Rostedt   tracing: unified ...
1237
1238
  	struct list_head *p;
  	unsigned i;
5389f6fad   Thomas Gleixner   locking, tracing:...
1239
  	raw_spin_lock_irq(&cpu_buffer->reader_lock);
77ae365ec   Steven Rostedt   ring-buffer: make...
1240
  	rb_head_page_deactivate(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
1241
  	for (i = 0; i < nr_pages; i++) {
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
1242
  		if (RB_WARN_ON(cpu_buffer, list_empty(pages)))
292f60c0c   Julia Lawall   ring-buffer: Add ...
1243
  			goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
1244
  		p = pages->next;
044fa782e   Steven Rostedt   ring-buffer: chan...
1245
1246
  		bpage = list_entry(p, struct buffer_page, list);
  		list_del_init(&bpage->list);
3adc54fa8   Steven Rostedt   ring-buffer: make...
1247
  		list_add_tail(&bpage->list, cpu_buffer->pages);
7a8e76a38   Steven Rostedt   tracing: unified ...
1248
1249
  	}
  	rb_reset_cpu(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
1250
  	rb_check_pages(cpu_buffer);
292f60c0c   Julia Lawall   ring-buffer: Add ...
1251
  out:
5389f6fad   Thomas Gleixner   locking, tracing:...
1252
  	raw_spin_unlock_irq(&cpu_buffer->reader_lock);
7a8e76a38   Steven Rostedt   tracing: unified ...
1253
1254
1255
1256
1257
1258
1259
  }
  
  /**
   * ring_buffer_resize - resize the ring buffer
   * @buffer: the buffer to resize.
   * @size: the new size.
   *
7a8e76a38   Steven Rostedt   tracing: unified ...
1260
1261
1262
1263
1264
1265
1266
1267
   * Minimum size is 2 * BUF_PAGE_SIZE.
   *
   * Returns -1 on failure.
   */
  int ring_buffer_resize(struct ring_buffer *buffer, unsigned long size)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned nr_pages, rm_pages, new_pages;
044fa782e   Steven Rostedt   ring-buffer: chan...
1268
  	struct buffer_page *bpage, *tmp;
7a8e76a38   Steven Rostedt   tracing: unified ...
1269
  	unsigned long buffer_size;
7a8e76a38   Steven Rostedt   tracing: unified ...
1270
1271
  	LIST_HEAD(pages);
  	int i, cpu;
ee51a1de7   Ingo Molnar   tracing: fix mmio...
1272
1273
1274
1275
1276
  	/*
  	 * Always succeed at resizing a non-existent buffer:
  	 */
  	if (!buffer)
  		return size;
7a8e76a38   Steven Rostedt   tracing: unified ...
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
  	size = DIV_ROUND_UP(size, BUF_PAGE_SIZE);
  	size *= BUF_PAGE_SIZE;
  	buffer_size = buffer->pages * BUF_PAGE_SIZE;
  
  	/* we need a minimum of two pages */
  	if (size < BUF_PAGE_SIZE * 2)
  		size = BUF_PAGE_SIZE * 2;
  
  	if (size == buffer_size)
  		return size;
184210154   Steven Rostedt   ring-buffer: Use ...
1287
1288
1289
1290
  	atomic_inc(&buffer->record_disabled);
  
  	/* Make sure all writers are done with this buffer. */
  	synchronize_sched();
7a8e76a38   Steven Rostedt   tracing: unified ...
1291
  	mutex_lock(&buffer->mutex);
554f786e2   Steven Rostedt   ring-buffer: only...
1292
  	get_online_cpus();
7a8e76a38   Steven Rostedt   tracing: unified ...
1293
1294
1295
1296
1297
1298
  
  	nr_pages = DIV_ROUND_UP(size, BUF_PAGE_SIZE);
  
  	if (size < buffer_size) {
  
  		/* easy case, just free pages */
554f786e2   Steven Rostedt   ring-buffer: only...
1299
1300
  		if (RB_WARN_ON(buffer, nr_pages >= buffer->pages))
  			goto out_fail;
7a8e76a38   Steven Rostedt   tracing: unified ...
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
  
  		rm_pages = buffer->pages - nr_pages;
  
  		for_each_buffer_cpu(buffer, cpu) {
  			cpu_buffer = buffer->buffers[cpu];
  			rb_remove_pages(cpu_buffer, rm_pages);
  		}
  		goto out;
  	}
  
  	/*
  	 * This is a bit more difficult. We only want to add pages
  	 * when we can allocate enough for all CPUs. We do this
  	 * by allocating all the pages and storing them on a local
  	 * linked list. If we succeed in our allocation, then we
  	 * add these pages to the cpu_buffers. Otherwise we just free
  	 * them all and return -ENOMEM;
  	 */
554f786e2   Steven Rostedt   ring-buffer: only...
1319
1320
  	if (RB_WARN_ON(buffer, nr_pages <= buffer->pages))
  		goto out_fail;
f536aafc5   Steven Rostedt   ring-buffer: repl...
1321

7a8e76a38   Steven Rostedt   tracing: unified ...
1322
1323
1324
1325
  	new_pages = nr_pages - buffer->pages;
  
  	for_each_buffer_cpu(buffer, cpu) {
  		for (i = 0; i < new_pages; i++) {
7ea590640   Vaibhav Nagarnaik   tracing: Use NUMA...
1326
  			struct page *page;
d7ec4bfed   Vaibhav Nagarnaik   ring-buffer: Set ...
1327
1328
1329
1330
1331
  			/*
  			 * The __GFP_NORETRY flag makes sure that the allocation
  			 * fails gracefully without invoking the OOM killer, so
  			 * the system is not destabilized.
  			 */
044fa782e   Steven Rostedt   ring-buffer: chan...
1332
  			bpage = kzalloc_node(ALIGN(sizeof(*bpage),
e4c2ce82c   Steven Rostedt   ring_buffer: allo...
1333
  						  cache_line_size()),
d7ec4bfed   Vaibhav Nagarnaik   ring-buffer: Set ...
1334
1335
  					    GFP_KERNEL | __GFP_NORETRY,
  					    cpu_to_node(cpu));
044fa782e   Steven Rostedt   ring-buffer: chan...
1336
  			if (!bpage)
e4c2ce82c   Steven Rostedt   ring_buffer: allo...
1337
  				goto free_pages;
044fa782e   Steven Rostedt   ring-buffer: chan...
1338
  			list_add(&bpage->list, &pages);
d7ec4bfed   Vaibhav Nagarnaik   ring-buffer: Set ...
1339
1340
  			page = alloc_pages_node(cpu_to_node(cpu),
  						GFP_KERNEL | __GFP_NORETRY, 0);
7ea590640   Vaibhav Nagarnaik   tracing: Use NUMA...
1341
  			if (!page)
7a8e76a38   Steven Rostedt   tracing: unified ...
1342
  				goto free_pages;
7ea590640   Vaibhav Nagarnaik   tracing: Use NUMA...
1343
  			bpage->page = page_address(page);
044fa782e   Steven Rostedt   ring-buffer: chan...
1344
  			rb_init_page(bpage->page);
7a8e76a38   Steven Rostedt   tracing: unified ...
1345
1346
1347
1348
1349
1350
1351
  		}
  	}
  
  	for_each_buffer_cpu(buffer, cpu) {
  		cpu_buffer = buffer->buffers[cpu];
  		rb_insert_pages(cpu_buffer, &pages, new_pages);
  	}
554f786e2   Steven Rostedt   ring-buffer: only...
1352
1353
  	if (RB_WARN_ON(buffer, !list_empty(&pages)))
  		goto out_fail;
7a8e76a38   Steven Rostedt   tracing: unified ...
1354
1355
1356
  
   out:
  	buffer->pages = nr_pages;
554f786e2   Steven Rostedt   ring-buffer: only...
1357
  	put_online_cpus();
7a8e76a38   Steven Rostedt   tracing: unified ...
1358
  	mutex_unlock(&buffer->mutex);
184210154   Steven Rostedt   ring-buffer: Use ...
1359
  	atomic_dec(&buffer->record_disabled);
7a8e76a38   Steven Rostedt   tracing: unified ...
1360
1361
1362
  	return size;
  
   free_pages:
044fa782e   Steven Rostedt   ring-buffer: chan...
1363
1364
1365
  	list_for_each_entry_safe(bpage, tmp, &pages, list) {
  		list_del_init(&bpage->list);
  		free_buffer_page(bpage);
7a8e76a38   Steven Rostedt   tracing: unified ...
1366
  	}
554f786e2   Steven Rostedt   ring-buffer: only...
1367
  	put_online_cpus();
641d2f63c   Vegard Nossum   trace: introduce ...
1368
  	mutex_unlock(&buffer->mutex);
184210154   Steven Rostedt   ring-buffer: Use ...
1369
  	atomic_dec(&buffer->record_disabled);
7a8e76a38   Steven Rostedt   tracing: unified ...
1370
  	return -ENOMEM;
554f786e2   Steven Rostedt   ring-buffer: only...
1371
1372
1373
1374
1375
1376
1377
1378
  
  	/*
  	 * Something went totally wrong, and we are too paranoid
  	 * to even clean up the mess.
  	 */
   out_fail:
  	put_online_cpus();
  	mutex_unlock(&buffer->mutex);
184210154   Steven Rostedt   ring-buffer: Use ...
1379
  	atomic_dec(&buffer->record_disabled);
554f786e2   Steven Rostedt   ring-buffer: only...
1380
  	return -1;
7a8e76a38   Steven Rostedt   tracing: unified ...
1381
  }
c4f50183f   Robert Richter   ring_buffer: addi...
1382
  EXPORT_SYMBOL_GPL(ring_buffer_resize);
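
A sketch of how a caller might use the resize path above, assuming the current signature that takes a byte count and returns the page-rounded new size, or a negative value on failure; the helper name is hypothetical.

#include <linux/kernel.h>
#include <linux/ring_buffer.h>

/* hypothetical helper: grow @buffer to roughly @bytes per CPU */
static int example_resize(struct ring_buffer *buffer, unsigned long bytes)
{
	int ret;

	ret = ring_buffer_resize(buffer, bytes);
	if (ret < 0)
		return ret;	/* the old size is kept on failure */

	/* the result is rounded up to BUF_PAGE_SIZE and is at least two pages */
	pr_info("ring buffer resized to %d bytes per cpu\n", ret);
	return 0;
}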
7a8e76a38   Steven Rostedt   tracing: unified ...
1383

750912fa3   David Sharp   tracing: Add an '...
1384
1385
1386
1387
1388
1389
1390
1391
1392
1393
  void ring_buffer_change_overwrite(struct ring_buffer *buffer, int val)
  {
  	mutex_lock(&buffer->mutex);
  	if (val)
  		buffer->flags |= RB_FL_OVERWRITE;
  	else
  		buffer->flags &= ~RB_FL_OVERWRITE;
  	mutex_unlock(&buffer->mutex);
  }
  EXPORT_SYMBOL_GPL(ring_buffer_change_overwrite);
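
For completeness, a small hedged sketch of flipping a live buffer between overwrite and producer/consumer behaviour with the helper above; the wrapper name is hypothetical.

#include <linux/ring_buffer.h>
#include <linux/types.h>

/* @buffer is assumed to come from ring_buffer_alloc() */
static void example_set_overwrite(struct ring_buffer *buffer, bool overwrite)
{
	ring_buffer_change_overwrite(buffer, overwrite ? 1 : 0);
}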
8789a9e7d   Steven Rostedt   ring-buffer: read...
1394
  static inline void *
044fa782e   Steven Rostedt   ring-buffer: chan...
1395
  __rb_data_page_index(struct buffer_data_page *bpage, unsigned index)
8789a9e7d   Steven Rostedt   ring-buffer: read...
1396
  {
044fa782e   Steven Rostedt   ring-buffer: chan...
1397
  	return bpage->data + index;
8789a9e7d   Steven Rostedt   ring-buffer: read...
1398
  }
044fa782e   Steven Rostedt   ring-buffer: chan...
1399
  static inline void *__rb_page_index(struct buffer_page *bpage, unsigned index)
7a8e76a38   Steven Rostedt   tracing: unified ...
1400
  {
044fa782e   Steven Rostedt   ring-buffer: chan...
1401
  	return bpage->page->data + index;
7a8e76a38   Steven Rostedt   tracing: unified ...
1402
1403
1404
  }
  
  static inline struct ring_buffer_event *
d769041f8   Steven Rostedt   ring_buffer: impl...
1405
  rb_reader_event(struct ring_buffer_per_cpu *cpu_buffer)
7a8e76a38   Steven Rostedt   tracing: unified ...
1406
  {
6f807acd2   Steven Rostedt   ring-buffer: move...
1407
1408
1409
1410
1411
  	return __rb_page_index(cpu_buffer->reader_page,
  			       cpu_buffer->reader_page->read);
  }
  
  static inline struct ring_buffer_event *
7a8e76a38   Steven Rostedt   tracing: unified ...
1412
1413
  rb_iter_head_event(struct ring_buffer_iter *iter)
  {
6f807acd2   Steven Rostedt   ring-buffer: move...
1414
  	return __rb_page_index(iter->head_page, iter->head);
7a8e76a38   Steven Rostedt   tracing: unified ...
1415
  }
77ae365ec   Steven Rostedt   ring-buffer: make...
1416
  static inline unsigned long rb_page_write(struct buffer_page *bpage)
bf41a158c   Steven Rostedt   ring-buffer: make...
1417
  {
77ae365ec   Steven Rostedt   ring-buffer: make...
1418
  	return local_read(&bpage->write) & RB_WRITE_MASK;
bf41a158c   Steven Rostedt   ring-buffer: make...
1419
1420
1421
1422
  }
  
  static inline unsigned rb_page_commit(struct buffer_page *bpage)
  {
abc9b56d6   Steven Rostedt   ring-buffer: move...
1423
  	return local_read(&bpage->page->commit);
bf41a158c   Steven Rostedt   ring-buffer: make...
1424
  }
77ae365ec   Steven Rostedt   ring-buffer: make...
1425
1426
1427
1428
  static inline unsigned long rb_page_entries(struct buffer_page *bpage)
  {
  	return local_read(&bpage->entries) & RB_WRITE_MASK;
  }
25985edce   Lucas De Marchi   Fix common misspe...
1429
  /* Size is determined by what has been committed */
bf41a158c   Steven Rostedt   ring-buffer: make...
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
  static inline unsigned rb_page_size(struct buffer_page *bpage)
  {
  	return rb_page_commit(bpage);
  }
  
  static inline unsigned
  rb_commit_index(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	return rb_page_commit(cpu_buffer->commit_page);
  }
bf41a158c   Steven Rostedt   ring-buffer: make...
1440
1441
1442
1443
  static inline unsigned
  rb_event_index(struct ring_buffer_event *event)
  {
  	unsigned long addr = (unsigned long)event;
22f470f8d   Steven Rostedt   ring-buffer: use ...
1444
  	return (addr & ~PAGE_MASK) - BUF_PAGE_HDR_SIZE;
bf41a158c   Steven Rostedt   ring-buffer: make...
1445
  }
0f0c85fc8   Steven Rostedt   ring-buffer: smal...
1446
  static inline int
fa7439531   Steven Rostedt   ring-buffer: use ...
1447
1448
  rb_event_is_commit(struct ring_buffer_per_cpu *cpu_buffer,
  		   struct ring_buffer_event *event)
bf41a158c   Steven Rostedt   ring-buffer: make...
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
  {
  	unsigned long addr = (unsigned long)event;
  	unsigned long index;
  
  	index = rb_event_index(event);
  	addr &= PAGE_MASK;
  
  	return cpu_buffer->commit_page->page == (void *)addr &&
  		rb_commit_index(cpu_buffer) == index;
  }
34a148bf0   Andrew Morton   kernel/trace/ring...
1459
  static void
bf41a158c   Steven Rostedt   ring-buffer: make...
1460
  rb_set_commit_to_write(struct ring_buffer_per_cpu *cpu_buffer)
7a8e76a38   Steven Rostedt   tracing: unified ...
1461
  {
77ae365ec   Steven Rostedt   ring-buffer: make...
1462
  	unsigned long max_count;
bf41a158c   Steven Rostedt   ring-buffer: make...
1463
1464
1465
1466
1467
1468
1469
1470
  	/*
  	 * We only race with interrupts and NMIs on this CPU.
  	 * If we own the commit event, then we can commit
  	 * all others that interrupted us, since the interruptions
  	 * are in stack format (they finish before they come
  	 * back to us). This allows us to do a simple loop to
  	 * assign the commit to the tail.
  	 */
a8ccf1d6f   Steven Rostedt   ring-buffer: fix ...
1471
   again:
77ae365ec   Steven Rostedt   ring-buffer: make...
1472
  	max_count = cpu_buffer->buffer->pages * 100;
bf41a158c   Steven Rostedt   ring-buffer: make...
1473
  	while (cpu_buffer->commit_page != cpu_buffer->tail_page) {
77ae365ec   Steven Rostedt   ring-buffer: make...
1474
1475
1476
1477
1478
1479
1480
  		if (RB_WARN_ON(cpu_buffer, !(--max_count)))
  			return;
  		if (RB_WARN_ON(cpu_buffer,
  			       rb_is_reader_page(cpu_buffer->tail_page)))
  			return;
  		local_set(&cpu_buffer->commit_page->page->commit,
  			  rb_page_write(cpu_buffer->commit_page));
bf41a158c   Steven Rostedt   ring-buffer: make...
1481
  		rb_inc_page(cpu_buffer, &cpu_buffer->commit_page);
abc9b56d6   Steven Rostedt   ring-buffer: move...
1482
1483
  		cpu_buffer->write_stamp =
  			cpu_buffer->commit_page->page->time_stamp;
bf41a158c   Steven Rostedt   ring-buffer: make...
1484
1485
1486
1487
1488
  		/* add barrier to keep gcc from optimizing too much */
  		barrier();
  	}
  	while (rb_commit_index(cpu_buffer) !=
  	       rb_page_write(cpu_buffer->commit_page)) {
77ae365ec   Steven Rostedt   ring-buffer: make...
1489
1490
1491
1492
1493
1494
  
  		local_set(&cpu_buffer->commit_page->page->commit,
  			  rb_page_write(cpu_buffer->commit_page));
  		RB_WARN_ON(cpu_buffer,
  			   local_read(&cpu_buffer->commit_page->page->commit) &
  			   ~RB_WRITE_MASK);
bf41a158c   Steven Rostedt   ring-buffer: make...
1495
1496
  		barrier();
  	}
a8ccf1d6f   Steven Rostedt   ring-buffer: fix ...
1497
1498
1499
1500
1501
1502
1503
1504
1505
1506
1507
  
  	/* again, keep gcc from optimizing */
  	barrier();
  
  	/*
  	 * If an interrupt came in just after the first while loop
  	 * and pushed the tail page forward, we will be left with
  	 * a dangling commit that will never go forward.
  	 */
  	if (unlikely(cpu_buffer->commit_page != cpu_buffer->tail_page))
  		goto again;
7a8e76a38   Steven Rostedt   tracing: unified ...
1508
  }
d769041f8   Steven Rostedt   ring_buffer: impl...
1509
  static void rb_reset_reader_page(struct ring_buffer_per_cpu *cpu_buffer)
7a8e76a38   Steven Rostedt   tracing: unified ...
1510
  {
abc9b56d6   Steven Rostedt   ring-buffer: move...
1511
  	cpu_buffer->read_stamp = cpu_buffer->reader_page->page->time_stamp;
6f807acd2   Steven Rostedt   ring-buffer: move...
1512
  	cpu_buffer->reader_page->read = 0;
d769041f8   Steven Rostedt   ring_buffer: impl...
1513
  }
34a148bf0   Andrew Morton   kernel/trace/ring...
1514
  static void rb_inc_iter(struct ring_buffer_iter *iter)
d769041f8   Steven Rostedt   ring_buffer: impl...
1515
1516
1517
1518
1519
1520
1521
1522
1523
1524
  {
  	struct ring_buffer_per_cpu *cpu_buffer = iter->cpu_buffer;
  
  	/*
  	 * The iterator could be on the reader page (it starts there).
  	 * But the head could have moved, since the reader was
  	 * found. Check for this case and assign the iterator
  	 * to the head page instead of next.
  	 */
  	if (iter->head_page == cpu_buffer->reader_page)
77ae365ec   Steven Rostedt   ring-buffer: make...
1525
  		iter->head_page = rb_set_head_page(cpu_buffer);
d769041f8   Steven Rostedt   ring_buffer: impl...
1526
1527
  	else
  		rb_inc_page(cpu_buffer, &iter->head_page);
abc9b56d6   Steven Rostedt   ring-buffer: move...
1528
  	iter->read_stamp = iter->head_page->page->time_stamp;
7a8e76a38   Steven Rostedt   tracing: unified ...
1529
1530
  	iter->head = 0;
  }
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1531
1532
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
  /* Slow path, do not inline */
  static noinline struct ring_buffer_event *
  rb_add_time_stamp(struct ring_buffer_event *event, u64 delta)
  {
  	event->type_len = RINGBUF_TYPE_TIME_EXTEND;
  
  	/* Not the first event on the page? */
  	if (rb_event_index(event)) {
  		event->time_delta = delta & TS_MASK;
  		event->array[0] = delta >> TS_SHIFT;
  	} else {
  		/* nope, just zero it */
  		event->time_delta = 0;
  		event->array[0] = 0;
  	}
  
  	return skip_time_extend(event);
  }
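
To make the time-extend encoding above concrete, here is a stand-alone illustration (ordinary C, not kernel code) of how a delta too large for the 27-bit time_delta field is split across time_delta and array[0] and later reassembled the way rb_update_write_stamp does; the 27-bit width is an assumption mirroring TS_SHIFT.

#include <stdint.h>
#include <stdio.h>

#define EX_TS_SHIFT	27				/* assumed TS_SHIFT */
#define EX_TS_MASK	((1ULL << EX_TS_SHIFT) - 1)	/* assumed TS_MASK  */

int main(void)
{
	uint64_t delta = 3000000000ULL;	/* ~3 s in ns, does not fit in 27 bits */

	uint32_t time_delta = delta & EX_TS_MASK;	/* low bits  */
	uint32_t array0     = delta >> EX_TS_SHIFT;	/* high bits */

	/* a reader rebuilds the delta: (array[0] << TS_SHIFT) + time_delta */
	uint64_t back = ((uint64_t)array0 << EX_TS_SHIFT) + time_delta;

	printf("time_delta=%u array[0]=%u reassembled=%llu ok=%d\n",
	       time_delta, array0, (unsigned long long)back, back == delta);
	return 0;
}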
7a8e76a38   Steven Rostedt   tracing: unified ...
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
  /**
   * ring_buffer_update_event - update event type and data
   * @event: the event to update
   * @type: the type of event
   * @length: the size of the event field in the ring buffer
   *
   * Update the type and data fields of the event. The length
   * is the actual size that is written to the ring buffer,
   * and with this, we can determine what to place into the
   * data field.
   */
34a148bf0   Andrew Morton   kernel/trace/ring...
1560
  static void
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1561
1562
1563
  rb_update_event(struct ring_buffer_per_cpu *cpu_buffer,
  		struct ring_buffer_event *event, unsigned length,
  		int add_timestamp, u64 delta)
7a8e76a38   Steven Rostedt   tracing: unified ...
1564
  {
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1565
1566
1567
  	/* Only a commit updates the timestamp */
  	if (unlikely(!rb_event_is_commit(cpu_buffer, event)))
  		delta = 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
1568

69d1b839f   Steven Rostedt   ring-buffer: Bind...
1569
1570
1571
1572
1573
1574
1575
1576
  	/*
  	 * If we need to add a timestamp, then we
  	 * add it to the start of the reserved space.
  	 */
  	if (unlikely(add_timestamp)) {
  		event = rb_add_time_stamp(event, delta);
  		length -= RB_LEN_TIME_EXTEND;
  		delta = 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
1577
  	}
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1578
1579
1580
1581
1582
1583
1584
1585
  
  	event->time_delta = delta;
  	length -= RB_EVNT_HDR_SIZE;
  	if (length > RB_MAX_SMALL_DATA || RB_FORCE_8BYTE_ALIGNMENT) {
  		event->type_len = 0;
  		event->array[0] = length;
  	} else
  		event->type_len = DIV_ROUND_UP(length, RB_ALIGNMENT);
7a8e76a38   Steven Rostedt   tracing: unified ...
1586
  }
77ae365ec   Steven Rostedt   ring-buffer: make...
1587
1588
1589
1590
1591
1592
1593
1594
1595
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
1619
1620
1621
1622
1623
1624
1625
1626
1627
1628
1629
1630
1631
1632
  /*
   * rb_handle_head_page - writer hit the head page
   *
   * Returns: +1 to retry page
   *           0 to continue
   *          -1 on error
   */
  static int
  rb_handle_head_page(struct ring_buffer_per_cpu *cpu_buffer,
  		    struct buffer_page *tail_page,
  		    struct buffer_page *next_page)
  {
  	struct buffer_page *new_head;
  	int entries;
  	int type;
  	int ret;
  
  	entries = rb_page_entries(next_page);
  
  	/*
  	 * The hard part is here. We need to move the head
  	 * forward, and protect against both readers on
  	 * other CPUs and writers coming in via interrupts.
  	 */
  	type = rb_head_page_set_update(cpu_buffer, next_page, tail_page,
  				       RB_PAGE_HEAD);
  
  	/*
  	 * type can be one of four:
  	 *  NORMAL - an interrupt already moved it for us
  	 *  HEAD   - we are the first to get here.
  	 *  UPDATE - we are the interrupt interrupting
  	 *           a current move.
  	 *  MOVED  - a reader on another CPU moved the next
  	 *           pointer to its reader page. Give up
  	 *           and try again.
  	 */
  
  	switch (type) {
  	case RB_PAGE_HEAD:
  		/*
  		 * We changed the head to UPDATE, thus
  		 * it is our responsibility to update
  		 * the counters.
  		 */
  		local_add(entries, &cpu_buffer->overrun);
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
1633
  		local_sub(BUF_PAGE_SIZE, &cpu_buffer->entries_bytes);
77ae365ec   Steven Rostedt   ring-buffer: make...
1634
1635
1636
1637
1638
1639
1640
1641
1642
1643
1644
1645
1646
1647
1648
1649
1650
1651
1652
1653
1654
1655
1656
1657
1658
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
1669
1670
1671
1672
1673
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
1684
1685
1686
1687
1688
1689
1690
1691
1692
1693
1694
1695
1696
1697
1698
1699
1700
1701
1702
1703
1704
1705
1706
1707
1708
1709
1710
1711
1712
1713
1714
1715
1716
1717
1718
1719
1720
1721
1722
1723
1724
1725
1726
1727
1728
1729
1730
1731
1732
1733
1734
1735
1736
1737
1738
1739
1740
1741
1742
1743
  
  		/*
  		 * The entries will be zeroed out when we move the
  		 * tail page.
  		 */
  
  		/* still more to do */
  		break;
  
  	case RB_PAGE_UPDATE:
  		/*
  		 * This is an interrupt that interrupted the
  		 * previous update. Still more to do.
  		 */
  		break;
  	case RB_PAGE_NORMAL:
  		/*
  		 * An interrupt came in before the update
  		 * and processed this for us.
  		 * Nothing left to do.
  		 */
  		return 1;
  	case RB_PAGE_MOVED:
  		/*
  		 * The reader is on another CPU and just did
  		 * a swap with our next_page.
  		 * Try again.
  		 */
  		return 1;
  	default:
  		RB_WARN_ON(cpu_buffer, 1); /* WTF??? */
  		return -1;
  	}
  
  	/*
  	 * Now that we are here, the old head pointer is
  	 * set to UPDATE. This will keep the reader from
  	 * swapping the head page with the reader page.
  	 * The reader (on another CPU) will spin till
  	 * we are finished.
  	 *
  	 * We just need to protect against interrupts
  	 * doing the job. We will set the next pointer
  	 * to HEAD. After that, we set the old pointer
  	 * to NORMAL, but only if it was HEAD before.
  	 * Otherwise we are an interrupt, and only
  	 * want the outermost commit to reset it.
  	 */
  	new_head = next_page;
  	rb_inc_page(cpu_buffer, &new_head);
  
  	ret = rb_head_page_set_head(cpu_buffer, new_head, next_page,
  				    RB_PAGE_NORMAL);
  
  	/*
  	 * Valid returns are:
  	 *  HEAD   - an interrupt came in and already set it.
  	 *  NORMAL - One of two things:
  	 *            1) We really set it.
  	 *            2) A bunch of interrupts came in and moved
  	 *               the page forward again.
  	 */
  	switch (ret) {
  	case RB_PAGE_HEAD:
  	case RB_PAGE_NORMAL:
  		/* OK */
  		break;
  	default:
  		RB_WARN_ON(cpu_buffer, 1);
  		return -1;
  	}
  
  	/*
  	 * It is possible that an interrupt came in,
  	 * set the head up, then more interrupts came in
  	 * and moved it again. When we get back here,
  	 * the page would have been set to NORMAL but we
  	 * just set it back to HEAD.
  	 *
  	 * How do you detect this? Well, if that happened
  	 * the tail page would have moved.
  	 */
  	if (ret == RB_PAGE_NORMAL) {
  		/*
  		 * If the tail had moved past next, then we need
  		 * to reset the pointer.
  		 */
  		if (cpu_buffer->tail_page != tail_page &&
  		    cpu_buffer->tail_page != next_page)
  			rb_head_page_set_normal(cpu_buffer, new_head,
  						next_page,
  						RB_PAGE_HEAD);
  	}
  
  	/*
  	 * If this was the outermost commit (the one that
  	 * changed the original pointer from HEAD to UPDATE),
  	 * then it is up to us to reset it to NORMAL.
  	 */
  	if (type == RB_PAGE_HEAD) {
  		ret = rb_head_page_set_normal(cpu_buffer, next_page,
  					      tail_page,
  					      RB_PAGE_UPDATE);
  		if (RB_WARN_ON(cpu_buffer,
  			       ret != RB_PAGE_UPDATE))
  			return -1;
  	}
  
  	return 0;
  }
34a148bf0   Andrew Morton   kernel/trace/ring...
1744
  static unsigned rb_calculate_event_length(unsigned length)
7a8e76a38   Steven Rostedt   tracing: unified ...
1745
1746
1747
1748
1749
1750
  {
  	struct ring_buffer_event event; /* Used only for sizeof array */
  
  	/* zero length can cause confusions */
  	if (!length)
  		length = 1;
2271048d1   Steven Rostedt   ring-buffer: Do 8...
1751
  	if (length > RB_MAX_SMALL_DATA || RB_FORCE_8BYTE_ALIGNMENT)
7a8e76a38   Steven Rostedt   tracing: unified ...
1752
1753
1754
  		length += sizeof(event.array[0]);
  
  	length += RB_EVNT_HDR_SIZE;
2271048d1   Steven Rostedt   ring-buffer: Do 8...
1755
  	length = ALIGN(length, RB_ARCH_ALIGNMENT);
7a8e76a38   Steven Rostedt   tracing: unified ...
1756
1757
1758
  
  	return length;
  }
c7b093085   Steven Rostedt   ring-buffer: prev...
1759
1760
1761
1762
1763
1764
1765
1766
1767
1768
1769
1770
  static inline void
  rb_reset_tail(struct ring_buffer_per_cpu *cpu_buffer,
  	      struct buffer_page *tail_page,
  	      unsigned long tail, unsigned long length)
  {
  	struct ring_buffer_event *event;
  
  	/*
  	 * Only the event that crossed the page boundary
  	 * must fill the old tail_page with padding.
  	 */
  	if (tail >= BUF_PAGE_SIZE) {
b3230c8b4   Steven Rostedt   ring-buffer: Rese...
1771
1772
1773
1774
1775
1776
1777
  		/*
  		 * If the page was filled, then we still need
  		 * to update the real_end. Reset it to zero
  		 * and the reader will ignore it.
  		 */
  		if (tail == BUF_PAGE_SIZE)
  			tail_page->real_end = 0;
c7b093085   Steven Rostedt   ring-buffer: prev...
1778
1779
1780
1781
1782
  		local_sub(length, &tail_page->write);
  		return;
  	}
  
  	event = __rb_page_index(tail_page, tail);
b0b7065b6   Linus Torvalds   Merge branch 'tra...
1783
  	kmemcheck_annotate_bitfield(event, bitfield);
c7b093085   Steven Rostedt   ring-buffer: prev...
1784

c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
1785
1786
  	/* account for padding bytes */
  	local_add(BUF_PAGE_SIZE - tail, &cpu_buffer->entries_bytes);
c7b093085   Steven Rostedt   ring-buffer: prev...
1787
  	/*
ff0ff84a0   Steven Rostedt   ring-buffer: Add ...
1788
1789
1790
1791
1792
1793
1794
  	 * Save the original length to the meta data.
  	 * This will be used by the reader to update the lost
  	 * event counter.
  	 */
  	tail_page->real_end = tail;
  
  	/*
c7b093085   Steven Rostedt   ring-buffer: prev...
1795
1796
1797
1798
1799
1800
1801
1802
1803
1804
1805
1806
1807
1808
1809
1810
1811
1812
1813
1814
1815
1816
1817
1818
1819
1820
  	 * If this event is bigger than the minimum size, then
  	 * we need to be careful that we don't subtract the
  	 * write counter enough to allow another writer to slip
  	 * in on this page.
  	 * We put in a discarded commit instead, to make sure
  	 * that this space is not used again.
  	 *
  	 * If we are less than the minimum size, we don't need to
  	 * worry about it.
  	 */
  	if (tail > (BUF_PAGE_SIZE - RB_EVNT_MIN_SIZE)) {
  		/* No room for any events */
  
  		/* Mark the rest of the page with padding */
  		rb_event_set_padding(event);
  
  		/* Set the write back to the previous setting */
  		local_sub(length, &tail_page->write);
  		return;
  	}
  
  	/* Put in a discarded event */
  	event->array[0] = (BUF_PAGE_SIZE - tail) - RB_EVNT_HDR_SIZE;
  	event->type_len = RINGBUF_TYPE_PADDING;
  	/* time delta must be non zero */
  	event->time_delta = 1;
c7b093085   Steven Rostedt   ring-buffer: prev...
1821
1822
1823
1824
1825
  
  	/* Set write to end of buffer */
  	length = (tail + length) - BUF_PAGE_SIZE;
  	local_sub(length, &tail_page->write);
  }
6634ff26c   Steven Rostedt   ring-buffer: make...
1826

747e94ae3   Steven Rostedt   ring-buffer: Make...
1827
1828
1829
1830
  /*
   * This is the slow path, force gcc not to inline it.
   */
  static noinline struct ring_buffer_event *
6634ff26c   Steven Rostedt   ring-buffer: make...
1831
1832
  rb_move_tail(struct ring_buffer_per_cpu *cpu_buffer,
  	     unsigned long length, unsigned long tail,
e8bc43e84   Steven Rostedt   ring-buffer: Pass...
1833
  	     struct buffer_page *tail_page, u64 ts)
7a8e76a38   Steven Rostedt   tracing: unified ...
1834
  {
5a50e33cc   Steven Rostedt   ring-buffer: Move...
1835
  	struct buffer_page *commit_page = cpu_buffer->commit_page;
7a8e76a38   Steven Rostedt   tracing: unified ...
1836
  	struct ring_buffer *buffer = cpu_buffer->buffer;
77ae365ec   Steven Rostedt   ring-buffer: make...
1837
1838
  	struct buffer_page *next_page;
  	int ret;
aa20ae844   Steven Rostedt   ring-buffer: move...
1839
1840
  
  	next_page = tail_page;
aa20ae844   Steven Rostedt   ring-buffer: move...
1841
  	rb_inc_page(cpu_buffer, &next_page);
aa20ae844   Steven Rostedt   ring-buffer: move...
1842
1843
1844
1845
1846
1847
  	/*
  	 * If for some reason, we had an interrupt storm that made
  	 * it all the way around the buffer, bail, and warn
  	 * about it.
  	 */
  	if (unlikely(next_page == commit_page)) {
77ae365ec   Steven Rostedt   ring-buffer: make...
1848
  		local_inc(&cpu_buffer->commit_overrun);
aa20ae844   Steven Rostedt   ring-buffer: move...
1849
1850
  		goto out_reset;
  	}
77ae365ec   Steven Rostedt   ring-buffer: make...
1851
1852
1853
1854
1855
1856
1857
1858
1859
1860
1861
1862
1863
1864
1865
  	/*
  	 * This is where the fun begins!
  	 *
  	 * We are fighting against races between a reader that
  	 * could be on another CPU trying to swap its reader
  	 * page with the buffer head.
  	 *
  	 * We are also fighting against interrupts coming in and
  	 * moving the head or tail on us as well.
  	 *
  	 * If the next page is the head page then we have filled
  	 * the buffer, unless the commit page is still on the
  	 * reader page.
  	 */
  	if (rb_is_head_page(cpu_buffer, next_page, &tail_page->list)) {
aa20ae844   Steven Rostedt   ring-buffer: move...
1866

77ae365ec   Steven Rostedt   ring-buffer: make...
1867
1868
1869
1870
1871
1872
1873
1874
1875
1876
1877
1878
1879
1880
1881
1882
1883
1884
1885
1886
1887
1888
1889
1890
1891
1892
1893
1894
1895
1896
1897
1898
1899
1900
1901
1902
1903
  		/*
  		 * If the commit is not on the reader page, then
  		 * move the header page.
  		 */
  		if (!rb_is_reader_page(cpu_buffer->commit_page)) {
  			/*
  			 * If we are not in overwrite mode,
  			 * this is easy, just stop here.
  			 */
  			if (!(buffer->flags & RB_FL_OVERWRITE))
  				goto out_reset;
  
  			ret = rb_handle_head_page(cpu_buffer,
  						  tail_page,
  						  next_page);
  			if (ret < 0)
  				goto out_reset;
  			if (ret)
  				goto out_again;
  		} else {
  			/*
  			 * We need to be careful here too. The
  			 * commit page could still be on the reader
  			 * page. We could have a small buffer, and
  			 * have filled up the buffer with events
  			 * from interrupts and such, and wrapped.
  			 *
  			 * Note, if the tail page is also on the
  			 * reader_page, we let it move out.
  			 */
  			if (unlikely((cpu_buffer->commit_page !=
  				      cpu_buffer->tail_page) &&
  				     (cpu_buffer->commit_page ==
  				      cpu_buffer->reader_page))) {
  				local_inc(&cpu_buffer->commit_overrun);
  				goto out_reset;
  			}
aa20ae844   Steven Rostedt   ring-buffer: move...
1904
1905
  		}
  	}
77ae365ec   Steven Rostedt   ring-buffer: make...
1906
1907
1908
1909
1910
1911
  	ret = rb_tail_page_update(cpu_buffer, tail_page, next_page);
  	if (ret) {
  		/*
  		 * Nested commits always have zero deltas, so
  		 * just reread the time stamp
  		 */
e8bc43e84   Steven Rostedt   ring-buffer: Pass...
1912
1913
  		ts = rb_time_stamp(buffer);
  		next_page->page->time_stamp = ts;
aa20ae844   Steven Rostedt   ring-buffer: move...
1914
  	}
77ae365ec   Steven Rostedt   ring-buffer: make...
1915
   out_again:
aa20ae844   Steven Rostedt   ring-buffer: move...
1916

77ae365ec   Steven Rostedt   ring-buffer: make...
1917
  	rb_reset_tail(cpu_buffer, tail_page, tail, length);
aa20ae844   Steven Rostedt   ring-buffer: move...
1918
1919
1920
  
  	/* fail and let the caller try again */
  	return ERR_PTR(-EAGAIN);
45141d466   Steven Rostedt   ring-buffer: rena...
1921
   out_reset:
6f3b34402   Lai Jiangshan   ring_buffer: rese...
1922
  	/* reset write */
c7b093085   Steven Rostedt   ring-buffer: prev...
1923
  	rb_reset_tail(cpu_buffer, tail_page, tail, length);
6f3b34402   Lai Jiangshan   ring_buffer: rese...
1924

bf41a158c   Steven Rostedt   ring-buffer: make...
1925
  	return NULL;
7a8e76a38   Steven Rostedt   tracing: unified ...
1926
  }
6634ff26c   Steven Rostedt   ring-buffer: make...
1927
1928
  static struct ring_buffer_event *
  __rb_reserve_next(struct ring_buffer_per_cpu *cpu_buffer,
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1929
1930
  		  unsigned long length, u64 ts,
  		  u64 delta, int add_timestamp)
6634ff26c   Steven Rostedt   ring-buffer: make...
1931
  {
5a50e33cc   Steven Rostedt   ring-buffer: Move...
1932
  	struct buffer_page *tail_page;
6634ff26c   Steven Rostedt   ring-buffer: make...
1933
1934
  	struct ring_buffer_event *event;
  	unsigned long tail, write;
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1935
1936
1937
1938
1939
1940
1941
  	/*
  	 * If the time delta since the last event is too big to
  	 * hold in the time field of the event, then we append a
  	 * TIME EXTEND event ahead of the data event.
  	 */
  	if (unlikely(add_timestamp))
  		length += RB_LEN_TIME_EXTEND;
6634ff26c   Steven Rostedt   ring-buffer: make...
1942
1943
  	tail_page = cpu_buffer->tail_page;
  	write = local_add_return(length, &tail_page->write);
77ae365ec   Steven Rostedt   ring-buffer: make...
1944
1945
1946
  
  	/* set write to only the index of the write */
  	write &= RB_WRITE_MASK;
6634ff26c   Steven Rostedt   ring-buffer: make...
1947
1948
1949
  	tail = write - length;
  
  	/* See if we shot pass the end of this buffer page */
747e94ae3   Steven Rostedt   ring-buffer: Make...
1950
  	if (unlikely(write > BUF_PAGE_SIZE))
6634ff26c   Steven Rostedt   ring-buffer: make...
1951
  		return rb_move_tail(cpu_buffer, length, tail,
5a50e33cc   Steven Rostedt   ring-buffer: Move...
1952
  				    tail_page, ts);
6634ff26c   Steven Rostedt   ring-buffer: make...
1953
1954
  
  	/* We reserved something on the buffer */
6634ff26c   Steven Rostedt   ring-buffer: make...
1955
  	event = __rb_page_index(tail_page, tail);
1744a21d5   Vegard Nossum   trace: annotate b...
1956
  	kmemcheck_annotate_bitfield(event, bitfield);
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1957
  	rb_update_event(cpu_buffer, event, length, add_timestamp, delta);
6634ff26c   Steven Rostedt   ring-buffer: make...
1958

69d1b839f   Steven Rostedt   ring-buffer: Bind...
1959
  	local_inc(&tail_page->entries);
6634ff26c   Steven Rostedt   ring-buffer: make...
1960
1961
  
  	/*
fa7439531   Steven Rostedt   ring-buffer: use ...
1962
1963
  	 * If this is the first commit on the page, then update
  	 * its timestamp.
6634ff26c   Steven Rostedt   ring-buffer: make...
1964
  	 */
fa7439531   Steven Rostedt   ring-buffer: use ...
1965
  	if (!tail)
e8bc43e84   Steven Rostedt   ring-buffer: Pass...
1966
  		tail_page->page->time_stamp = ts;
6634ff26c   Steven Rostedt   ring-buffer: make...
1967

c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
1968
1969
  	/* account for these added bytes */
  	local_add(length, &cpu_buffer->entries_bytes);
6634ff26c   Steven Rostedt   ring-buffer: make...
1970
1971
  	return event;
  }
edd813bff   Steven Rostedt   ring-buffer: try ...
1972
1973
1974
1975
1976
1977
1978
1979
1980
1981
  static inline int
  rb_try_to_discard(struct ring_buffer_per_cpu *cpu_buffer,
  		  struct ring_buffer_event *event)
  {
  	unsigned long new_index, old_index;
  	struct buffer_page *bpage;
  	unsigned long index;
  	unsigned long addr;
  
  	new_index = rb_event_index(event);
69d1b839f   Steven Rostedt   ring-buffer: Bind...
1982
  	old_index = new_index + rb_event_ts_length(event);
edd813bff   Steven Rostedt   ring-buffer: try ...
1983
1984
1985
1986
1987
1988
  	addr = (unsigned long)event;
  	addr &= PAGE_MASK;
  
  	bpage = cpu_buffer->tail_page;
  
  	if (bpage->page == (void *)addr && rb_page_write(bpage) == old_index) {
77ae365ec   Steven Rostedt   ring-buffer: make...
1989
1990
  		unsigned long write_mask =
  			local_read(&bpage->write) & ~RB_WRITE_MASK;
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
1991
  		unsigned long event_length = rb_event_length(event);
edd813bff   Steven Rostedt   ring-buffer: try ...
1992
1993
1994
1995
1996
1997
  		/*
  		 * This is on the tail page. It is possible that
  		 * a write could come in and move the tail page
  		 * and write to the next page. That is fine
  		 * because we just shorten what is on this page.
  		 */
77ae365ec   Steven Rostedt   ring-buffer: make...
1998
1999
  		old_index += write_mask;
  		new_index += write_mask;
edd813bff   Steven Rostedt   ring-buffer: try ...
2000
  		index = local_cmpxchg(&bpage->write, old_index, new_index);
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
2001
2002
2003
  		if (index == old_index) {
  			/* update counters */
  			local_sub(event_length, &cpu_buffer->entries_bytes);
edd813bff   Steven Rostedt   ring-buffer: try ...
2004
  			return 1;
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
2005
  		}
edd813bff   Steven Rostedt   ring-buffer: try ...
2006
2007
2008
2009
2010
  	}
  
  	/* could not discard */
  	return 0;
  }
fa7439531   Steven Rostedt   ring-buffer: use ...
2011
2012
2013
2014
2015
  static void rb_start_commit(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	local_inc(&cpu_buffer->committing);
  	local_inc(&cpu_buffer->commits);
  }
d9abde213   Steven Rostedt   ring-buffer: Micr...
2016
  static inline void rb_end_commit(struct ring_buffer_per_cpu *cpu_buffer)
fa7439531   Steven Rostedt   ring-buffer: use ...
2017
2018
2019
2020
2021
2022
2023
2024
2025
2026
2027
2028
2029
2030
2031
2032
2033
2034
2035
2036
2037
2038
2039
2040
2041
2042
2043
2044
2045
2046
  {
  	unsigned long commits;
  
  	if (RB_WARN_ON(cpu_buffer,
  		       !local_read(&cpu_buffer->committing)))
  		return;
  
   again:
  	commits = local_read(&cpu_buffer->commits);
  	/* synchronize with interrupts */
  	barrier();
  	if (local_read(&cpu_buffer->committing) == 1)
  		rb_set_commit_to_write(cpu_buffer);
  
  	local_dec(&cpu_buffer->committing);
  
  	/* synchronize with interrupts */
  	barrier();
  
  	/*
  	 * Need to account for interrupts coming in between the
  	 * updating of the commit page and the clearing of the
  	 * committing counter.
  	 */
  	if (unlikely(local_read(&cpu_buffer->commits) != commits) &&
  	    !local_read(&cpu_buffer->committing)) {
  		local_inc(&cpu_buffer->committing);
  		goto again;
  	}
  }
7a8e76a38   Steven Rostedt   tracing: unified ...
2047
  static struct ring_buffer_event *
62f0b3eb5   Steven Rostedt   ring-buffer: chec...
2048
2049
  rb_reserve_next_event(struct ring_buffer *buffer,
  		      struct ring_buffer_per_cpu *cpu_buffer,
1cd8d7358   Steven Rostedt   ring-buffer: remo...
2050
  		      unsigned long length)
7a8e76a38   Steven Rostedt   tracing: unified ...
2051
2052
  {
  	struct ring_buffer_event *event;
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2053
  	u64 ts, delta;
818e3dd30   Steven Rostedt   tracing, ring-buf...
2054
  	int nr_loops = 0;
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2055
  	int add_timestamp;
140ff8912   Steven Rostedt   ring-buffer: Remo...
2056
  	u64 diff;
7a8e76a38   Steven Rostedt   tracing: unified ...
2057

fa7439531   Steven Rostedt   ring-buffer: use ...
2058
  	rb_start_commit(cpu_buffer);
85bac32c4   Steven Rostedt   ring-buffer: only...
2059
  #ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
62f0b3eb5   Steven Rostedt   ring-buffer: chec...
2060
2061
2062
2063
2064
2065
2066
2067
2068
2069
2070
2071
  	/*
  	 * Due to the ability to swap a cpu buffer out of a ring buffer,
  	 * it is possible it was swapped before we committed.
  	 * (committing stops a swap). We check for it here and
  	 * if it happened, we have to fail the write.
  	 */
  	barrier();
  	if (unlikely(ACCESS_ONCE(cpu_buffer->buffer) != buffer)) {
  		local_dec(&cpu_buffer->committing);
  		local_dec(&cpu_buffer->commits);
  		return NULL;
  	}
85bac32c4   Steven Rostedt   ring-buffer: only...
2072
  #endif
62f0b3eb5   Steven Rostedt   ring-buffer: chec...
2073

be957c447   Steven Rostedt   ring-buffer: move...
2074
  	length = rb_calculate_event_length(length);
bf41a158c   Steven Rostedt   ring-buffer: make...
2075
   again:
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2076
2077
  	add_timestamp = 0;
  	delta = 0;
818e3dd30   Steven Rostedt   tracing, ring-buf...
2078
2079
2080
2081
2082
2083
2084
2085
2086
  	/*
  	 * We allow for interrupts to reenter here and do a trace.
  	 * If one does, it will cause this original code to loop
  	 * back here. Even with heavy interrupts happening, this
  	 * should only happen a few times in a row. If this happens
  	 * 1000 times in a row, there must be either an interrupt
  	 * storm or we have something buggy.
  	 * Bail!
  	 */
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2087
  	if (RB_WARN_ON(cpu_buffer, ++nr_loops > 1000))
fa7439531   Steven Rostedt   ring-buffer: use ...
2088
  		goto out_fail;
818e3dd30   Steven Rostedt   tracing, ring-buf...
2089

6d3f1e12f   Jiri Olsa   tracing: Remove c...
2090
  	ts = rb_time_stamp(cpu_buffer->buffer);
140ff8912   Steven Rostedt   ring-buffer: Remo...
2091
  	diff = ts - cpu_buffer->write_stamp;
7a8e76a38   Steven Rostedt   tracing: unified ...
2092

140ff8912   Steven Rostedt   ring-buffer: Remo...
2093
2094
  	/* make sure this diff is calculated here */
  	barrier();
bf41a158c   Steven Rostedt   ring-buffer: make...
2095

140ff8912   Steven Rostedt   ring-buffer: Remo...
2096
2097
  	/* Did the write stamp get updated already? */
  	if (likely(ts >= cpu_buffer->write_stamp)) {
168b6b1d0   Steven Rostedt   ring-buffer: move...
2098
2099
  		delta = diff;
  		if (unlikely(test_time_stamp(delta))) {
31274d72f   Jiri Olsa   tracing: Explain ...
2100
2101
2102
2103
  			int local_clock_stable = 1;
  #ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
  			local_clock_stable = sched_clock_stable;
  #endif
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2104
  			WARN_ONCE(delta > (1ULL << 59),
31274d72f   Jiri Olsa   tracing: Explain ...
2105
2106
  				  KERN_WARNING "Delta way too big! %llu ts=%llu write stamp = %llu
  %s",
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2107
2108
  				  (unsigned long long)delta,
  				  (unsigned long long)ts,
31274d72f   Jiri Olsa   tracing: Explain ...
2109
2110
2111
2112
2113
2114
2115
2116
  				  (unsigned long long)cpu_buffer->write_stamp,
  				  local_clock_stable ? "" :
  				  "If you just came from a suspend/resume,
  "
  				  "please switch to the trace global clock:
  "
  				  "  echo global > /sys/kernel/debug/tracing/trace_clock
  ");
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2117
  			add_timestamp = 1;
7a8e76a38   Steven Rostedt   tracing: unified ...
2118
  		}
168b6b1d0   Steven Rostedt   ring-buffer: move...
2119
  	}
7a8e76a38   Steven Rostedt   tracing: unified ...
2120

69d1b839f   Steven Rostedt   ring-buffer: Bind...
2121
2122
  	event = __rb_reserve_next(cpu_buffer, length, ts,
  				  delta, add_timestamp);
168b6b1d0   Steven Rostedt   ring-buffer: move...
2123
  	if (unlikely(PTR_ERR(event) == -EAGAIN))
bf41a158c   Steven Rostedt   ring-buffer: make...
2124
  		goto again;
fa7439531   Steven Rostedt   ring-buffer: use ...
2125
2126
  	if (!event)
  		goto out_fail;
7a8e76a38   Steven Rostedt   tracing: unified ...
2127

7a8e76a38   Steven Rostedt   tracing: unified ...
2128
  	return event;
fa7439531   Steven Rostedt   ring-buffer: use ...
2129
2130
2131
2132
  
   out_fail:
  	rb_end_commit(cpu_buffer);
  	return NULL;
7a8e76a38   Steven Rostedt   tracing: unified ...
2133
  }
1155de47c   Paul Mundt   ring-buffer: Make...
2134
  #ifdef CONFIG_TRACING
aa18efb2a   Steven Rostedt   tracing: use recu...
2135
  #define TRACE_RECURSIVE_DEPTH 16
261842b7c   Steven Rostedt   tracing: add same...
2136

d9abde213   Steven Rostedt   ring-buffer: Micr...
2137
2138
  /* Keep this code out of the fast path cache */
  static noinline void trace_recursive_fail(void)
261842b7c   Steven Rostedt   tracing: add same...
2139
  {
aa18efb2a   Steven Rostedt   tracing: use recu...
2140
2141
  	/* Disable all tracing before we do anything else */
  	tracing_off_permanent();
261842b7c   Steven Rostedt   tracing: add same...
2142

7d7d2b803   Steven Rostedt   ring-buffer: fix ...
2143
  	printk_once(KERN_WARNING "Tracing recursion: depth[%ld]:"
aa18efb2a   Steven Rostedt   tracing: use recu...
2144
2145
  		    "HC[%lu]:SC[%lu]:NMI[%lu]
  ",
b1cff0ad1   Steven Rostedt   ftrace: Add inter...
2146
  		    trace_recursion_buffer(),
aa18efb2a   Steven Rostedt   tracing: use recu...
2147
2148
2149
  		    hardirq_count() >> HARDIRQ_SHIFT,
  		    softirq_count() >> SOFTIRQ_SHIFT,
  		    in_nmi());
261842b7c   Steven Rostedt   tracing: add same...
2150

aa18efb2a   Steven Rostedt   tracing: use recu...
2151
  	WARN_ON_ONCE(1);
d9abde213   Steven Rostedt   ring-buffer: Micr...
2152
2153
2154
2155
  }
  
  static inline int trace_recursive_lock(void)
  {
b1cff0ad1   Steven Rostedt   ftrace: Add inter...
2156
  	trace_recursion_inc();
d9abde213   Steven Rostedt   ring-buffer: Micr...
2157

b1cff0ad1   Steven Rostedt   ftrace: Add inter...
2158
  	if (likely(trace_recursion_buffer() < TRACE_RECURSIVE_DEPTH))
d9abde213   Steven Rostedt   ring-buffer: Micr...
2159
2160
2161
  		return 0;
  
  	trace_recursive_fail();
aa18efb2a   Steven Rostedt   tracing: use recu...
2162
  	return -1;
261842b7c   Steven Rostedt   tracing: add same...
2163
  }
d9abde213   Steven Rostedt   ring-buffer: Micr...
2164
  static inline void trace_recursive_unlock(void)
261842b7c   Steven Rostedt   tracing: add same...
2165
  {
b1cff0ad1   Steven Rostedt   ftrace: Add inter...
2166
  	WARN_ON_ONCE(!trace_recursion_buffer());
261842b7c   Steven Rostedt   tracing: add same...
2167

b1cff0ad1   Steven Rostedt   ftrace: Add inter...
2168
  	trace_recursion_dec();
261842b7c   Steven Rostedt   tracing: add same...
2169
  }
1155de47c   Paul Mundt   ring-buffer: Make...
2170
2171
2172
2173
2174
2175
  #else
  
  #define trace_recursive_lock()		(0)
  #define trace_recursive_unlock()	do { } while (0)
  
  #endif
7a8e76a38   Steven Rostedt   tracing: unified ...
2176
2177
2178
2179
  /**
   * ring_buffer_lock_reserve - reserve a part of the buffer
   * @buffer: the ring buffer to reserve from
   * @length: the length of the data to reserve (excluding event header)
7a8e76a38   Steven Rostedt   tracing: unified ...
2180
2181
2182
2183
2184
2185
2186
2187
2188
2189
2190
2191
   *
   * Returns a reserved event on the ring buffer to copy directly to.
   * The user of this interface will need to get the body to write into
   * and can use the ring_buffer_event_data() interface.
   *
   * The length is the length of the data needed, not the event length
   * which also includes the event header.
   *
   * Must be paired with ring_buffer_unlock_commit, unless NULL is returned.
   * If NULL is returned, then nothing has been allocated or locked.
   */
  struct ring_buffer_event *
0a9877514   Arnaldo Carvalho de Melo   ring_buffer: remo...
2192
  ring_buffer_lock_reserve(struct ring_buffer *buffer, unsigned long length)
7a8e76a38   Steven Rostedt   tracing: unified ...
2193
2194
2195
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct ring_buffer_event *event;
5168ae50a   Steven Rostedt   tracing: Remove f...
2196
  	int cpu;
7a8e76a38   Steven Rostedt   tracing: unified ...
2197

033601a32   Steven Rostedt   ring-buffer: add ...
2198
  	if (ring_buffer_flags != RB_BUFFERS_ON)
a35832446   Steven Rostedt   ring-buffer: buff...
2199
  		return NULL;
bf41a158c   Steven Rostedt   ring-buffer: make...
2200
  	/* If we are tracing schedule, we don't want to recurse */
5168ae50a   Steven Rostedt   tracing: Remove f...
2201
  	preempt_disable_notrace();
bf41a158c   Steven Rostedt   ring-buffer: make...
2202

52fbe9cde   Lai Jiangshan   ring-buffer: Move...
2203
2204
  	if (atomic_read(&buffer->record_disabled))
  		goto out_nocheck;
261842b7c   Steven Rostedt   tracing: add same...
2205
2206
  	if (trace_recursive_lock())
  		goto out_nocheck;
7a8e76a38   Steven Rostedt   tracing: unified ...
2207
  	cpu = raw_smp_processor_id();
9e01c1b74   Rusty Russell   cpumask: convert ...
2208
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
d769041f8   Steven Rostedt   ring_buffer: impl...
2209
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2210
2211
  
  	cpu_buffer = buffer->buffers[cpu];
7a8e76a38   Steven Rostedt   tracing: unified ...
2212
2213
  
  	if (atomic_read(&cpu_buffer->record_disabled))
d769041f8   Steven Rostedt   ring_buffer: impl...
2214
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2215

be957c447   Steven Rostedt   ring-buffer: move...
2216
  	if (length > BUF_MAX_DATA_SIZE)
bf41a158c   Steven Rostedt   ring-buffer: make...
2217
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2218

62f0b3eb5   Steven Rostedt   ring-buffer: chec...
2219
  	event = rb_reserve_next_event(buffer, cpu_buffer, length);
7a8e76a38   Steven Rostedt   tracing: unified ...
2220
  	if (!event)
d769041f8   Steven Rostedt   ring_buffer: impl...
2221
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2222
2223
  
  	return event;
d769041f8   Steven Rostedt   ring_buffer: impl...
2224
   out:
261842b7c   Steven Rostedt   tracing: add same...
2225
2226
2227
  	trace_recursive_unlock();
  
   out_nocheck:
5168ae50a   Steven Rostedt   tracing: Remove f...
2228
  	preempt_enable_notrace();
7a8e76a38   Steven Rostedt   tracing: unified ...
2229
2230
  	return NULL;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2231
  EXPORT_SYMBOL_GPL(ring_buffer_lock_reserve);
7a8e76a38   Steven Rostedt   tracing: unified ...
2232

a1863c212   Steven Rostedt   ring-buffer: do n...
2233
2234
  static void
  rb_update_write_stamp(struct ring_buffer_per_cpu *cpu_buffer,
7a8e76a38   Steven Rostedt   tracing: unified ...
2235
2236
  		      struct ring_buffer_event *event)
  {
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2237
  	u64 delta;
fa7439531   Steven Rostedt   ring-buffer: use ...
2238
2239
2240
2241
  	/*
  	 * The event first in the commit queue updates the
  	 * time stamp.
  	 */
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2242
2243
2244
2245
2246
2247
2248
2249
2250
2251
2252
2253
2254
2255
2256
2257
  	if (rb_event_is_commit(cpu_buffer, event)) {
  		/*
  		 * A commit event that is first on a page
  		 * updates the write timestamp with the page stamp
  		 */
  		if (!rb_event_index(event))
  			cpu_buffer->write_stamp =
  				cpu_buffer->commit_page->page->time_stamp;
  		else if (event->type_len == RINGBUF_TYPE_TIME_EXTEND) {
  			delta = event->array[0];
  			delta <<= TS_SHIFT;
  			delta += event->time_delta;
  			cpu_buffer->write_stamp += delta;
  		} else
  			cpu_buffer->write_stamp += event->time_delta;
  	}
a1863c212   Steven Rostedt   ring-buffer: do n...
2258
  }
bf41a158c   Steven Rostedt   ring-buffer: make...
2259

a1863c212   Steven Rostedt   ring-buffer: do n...
2260
2261
2262
2263
2264
  static void rb_commit(struct ring_buffer_per_cpu *cpu_buffer,
  		      struct ring_buffer_event *event)
  {
  	local_inc(&cpu_buffer->entries);
  	rb_update_write_stamp(cpu_buffer, event);
fa7439531   Steven Rostedt   ring-buffer: use ...
2265
  	rb_end_commit(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
2266
2267
2268
2269
2270
2271
  }
  
  /**
   * ring_buffer_unlock_commit - commit a reserved event
   * @buffer: The buffer to commit to
   * @event: The event pointer to commit.
7a8e76a38   Steven Rostedt   tracing: unified ...
2272
2273
2274
2275
2276
2277
   *
   * This commits the data to the ring buffer, and releases any locks held.
   *
   * Must be paired with ring_buffer_lock_reserve.
   */
  int ring_buffer_unlock_commit(struct ring_buffer *buffer,
0a9877514   Arnaldo Carvalho de Melo   ring_buffer: remo...
2278
  			      struct ring_buffer_event *event)
7a8e76a38   Steven Rostedt   tracing: unified ...
2279
2280
2281
2282
2283
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	int cpu = raw_smp_processor_id();
  
  	cpu_buffer = buffer->buffers[cpu];
7a8e76a38   Steven Rostedt   tracing: unified ...
2284
  	rb_commit(cpu_buffer, event);
261842b7c   Steven Rostedt   tracing: add same...
2285
  	trace_recursive_unlock();
5168ae50a   Steven Rostedt   tracing: Remove f...
2286
  	preempt_enable_notrace();
7a8e76a38   Steven Rostedt   tracing: unified ...
2287
2288
2289
  
  	return 0;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2290
  EXPORT_SYMBOL_GPL(ring_buffer_unlock_commit);
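
Putting the reserve and commit halves together, a hedged sketch of the write path a client is expected to follow; ring_buffer_event_data() and trace_clock_local() are assumed to be the accessors declared in <linux/ring_buffer.h> and <linux/trace_clock.h>, and the entry layout is purely illustrative.

#include <linux/errno.h>
#include <linux/ring_buffer.h>
#include <linux/trace_clock.h>
#include <linux/types.h>

struct example_entry {
	u64	ts;
	int	value;
};

/* reserve space, fill the payload in place, then commit it */
static int example_write(struct ring_buffer *buffer, int value)
{
	struct ring_buffer_event *event;
	struct example_entry *entry;

	event = ring_buffer_lock_reserve(buffer, sizeof(*entry));
	if (!event)
		return -EBUSY;		/* buffer full or recording disabled */

	entry = ring_buffer_event_data(event);
	entry->ts = trace_clock_local();
	entry->value = value;

	return ring_buffer_unlock_commit(buffer, event);
}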
7a8e76a38   Steven Rostedt   tracing: unified ...
2291

f3b9aae16   Frederic Weisbecker   tracing/ring-buff...
2292
2293
  static inline void rb_event_discard(struct ring_buffer_event *event)
  {
69d1b839f   Steven Rostedt   ring-buffer: Bind...
2294
2295
  	if (event->type_len == RINGBUF_TYPE_TIME_EXTEND)
  		event = skip_time_extend(event);
334d4169a   Lai Jiangshan   ring_buffer: comp...
2296
2297
2298
  	/* array[0] holds the actual length for the discarded event */
  	event->array[0] = rb_event_data_length(event) - RB_EVNT_HDR_SIZE;
  	event->type_len = RINGBUF_TYPE_PADDING;
f3b9aae16   Frederic Weisbecker   tracing/ring-buff...
2299
2300
2301
2302
  	/* time delta must be non zero */
  	if (!event->time_delta)
  		event->time_delta = 1;
  }
a1863c212   Steven Rostedt   ring-buffer: do n...
2303
2304
2305
2306
2307
2308
2309
2310
2311
2312
2313
2314
2315
2316
2317
2318
2319
2320
2321
2322
2323
2324
2325
2326
2327
2328
2329
2330
2331
2332
2333
2334
2335
2336
2337
2338
2339
2340
2341
  /*
   * Decrement the entry count of the page that an event is on.
   * The event does not even need to exist, only the pointer
   * to the page it is on. This may only be called before the commit
   * takes place.
   */
  static inline void
  rb_decrement_entry(struct ring_buffer_per_cpu *cpu_buffer,
  		   struct ring_buffer_event *event)
  {
  	unsigned long addr = (unsigned long)event;
  	struct buffer_page *bpage = cpu_buffer->commit_page;
  	struct buffer_page *start;
  
  	addr &= PAGE_MASK;
  
  	/* Do the likely case first */
  	if (likely(bpage->page == (void *)addr)) {
  		local_dec(&bpage->entries);
  		return;
  	}
  
  	/*
  	 * Because the commit page may be on the reader page, we
  	 * start with the next page and end the loop check there.
  	 */
  	rb_inc_page(cpu_buffer, &bpage);
  	start = bpage;
  	do {
  		if (bpage->page == (void *)addr) {
  			local_dec(&bpage->entries);
  			return;
  		}
  		rb_inc_page(cpu_buffer, &bpage);
  	} while (bpage != start);
  
  	/* commit not part of this buffer?? */
  	RB_WARN_ON(cpu_buffer, 1);
  }
7a8e76a38   Steven Rostedt   tracing: unified ...
2342
  /**
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2343
2344
2345
2346
   * ring_buffer_commit_discard - discard an event that has not been committed
   * @buffer: the ring buffer
   * @event: non committed event to discard
   *
dc892f733   Steven Rostedt   ring-buffer: remo...
2347
2348
2349
2350
2351
2352
   * Sometimes an event that is in the ring buffer needs to be ignored.
   * This function lets the user discard an event in the ring buffer
   * and then that event will not be read later.
   *
   * This function only works if it is called before the item has been
   * committed. It will try to free the event from the ring buffer
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2353
2354
2355
2356
2357
2358
2359
2360
2361
2362
2363
2364
   * if another event has not been added behind it.
   *
   * If another event has been added behind it, it will set the event
   * up as discarded, and perform the commit.
   *
   * If this function is called, do not call ring_buffer_unlock_commit on
   * the event.
   */
  void ring_buffer_discard_commit(struct ring_buffer *buffer,
  				struct ring_buffer_event *event)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2365
2366
2367
  	int cpu;
  
  	/* The event is discarded regardless */
f3b9aae16   Frederic Weisbecker   tracing/ring-buff...
2368
  	rb_event_discard(event);
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2369

fa7439531   Steven Rostedt   ring-buffer: use ...
2370
2371
  	cpu = smp_processor_id();
  	cpu_buffer = buffer->buffers[cpu];
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2372
2373
2374
2375
2376
  	/*
  	 * This must only be called if the event has not been
  	 * committed yet. Thus we can assume that preemption
  	 * is still disabled.
  	 */
fa7439531   Steven Rostedt   ring-buffer: use ...
2377
  	RB_WARN_ON(buffer, !local_read(&cpu_buffer->committing));
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2378

a1863c212   Steven Rostedt   ring-buffer: do n...
2379
  	rb_decrement_entry(cpu_buffer, event);
0f2541d29   Steven Rostedt   ring-buffer: fix ...
2380
  	if (rb_try_to_discard(cpu_buffer, event))
edd813bff   Steven Rostedt   ring-buffer: try ...
2381
  		goto out;
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2382
2383
2384
  
  	/*
  	 * The commit is still visible by the reader, so we
a1863c212   Steven Rostedt   ring-buffer: do n...
2385
  	 * must still update the timestamp.
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2386
  	 */
a1863c212   Steven Rostedt   ring-buffer: do n...
2387
  	rb_update_write_stamp(cpu_buffer, event);
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2388
   out:
fa7439531   Steven Rostedt   ring-buffer: use ...
2389
  	rb_end_commit(cpu_buffer);
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2390

f3b9aae16   Frederic Weisbecker   tracing/ring-buff...
2391
  	trace_recursive_unlock();
5168ae50a   Steven Rostedt   tracing: Remove f...
2392
  	preempt_enable_notrace();
fa1b47dd8   Steven Rostedt   ring-buffer: add ...
2393
2394
2395
2396
2397
  
  }
  EXPORT_SYMBOL_GPL(ring_buffer_discard_commit);
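
/*
 * Illustrative sketch (not part of this file): discarding a reserved event
 * instead of committing it.  my_filter_reject() is a hypothetical predicate
 * that decides the event is unwanted after the data has been filled in.
 */
static void example_discard(struct ring_buffer *buffer,
			    void *data, unsigned long len)
{
	struct ring_buffer_event *event;
	void *body;

	event = ring_buffer_lock_reserve(buffer, len);
	if (!event)
		return;

	body = ring_buffer_event_data(event);
	memcpy(body, data, len);

	if (my_filter_reject(body, len))
		/* Do NOT call ring_buffer_unlock_commit() after this. */
		ring_buffer_discard_commit(buffer, event);
	else
		ring_buffer_unlock_commit(buffer, event);
}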
  
  /**
7a8e76a38   Steven Rostedt   tracing: unified ...
2398
2399
2400
2401
2402
2403
2404
2405
2406
2407
2408
2409
2410
2411
2412
2413
2414
2415
   * ring_buffer_write - write data to the buffer without reserving
   * @buffer: The ring buffer to write to.
   * @length: The length of the data being written (excluding the event header)
   * @data: The data to write to the buffer.
   *
   * This is like ring_buffer_lock_reserve and ring_buffer_unlock_commit as
   * one function. If you already have the data to write to the buffer, it
   * may be easier to simply call this function.
   *
   * Note, like ring_buffer_lock_reserve, the length is the length of the data
   * and not the length of the event which would hold the header.
   */
  int ring_buffer_write(struct ring_buffer *buffer,
  			unsigned long length,
  			void *data)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct ring_buffer_event *event;
7a8e76a38   Steven Rostedt   tracing: unified ...
2416
2417
  	void *body;
  	int ret = -EBUSY;
5168ae50a   Steven Rostedt   tracing: Remove f...
2418
  	int cpu;
7a8e76a38   Steven Rostedt   tracing: unified ...
2419

033601a32   Steven Rostedt   ring-buffer: add ...
2420
  	if (ring_buffer_flags != RB_BUFFERS_ON)
a35832446   Steven Rostedt   ring-buffer: buff...
2421
  		return -EBUSY;
5168ae50a   Steven Rostedt   tracing: Remove f...
2422
  	preempt_disable_notrace();
bf41a158c   Steven Rostedt   ring-buffer: make...
2423

52fbe9cde   Lai Jiangshan   ring-buffer: Move...
2424
2425
  	if (atomic_read(&buffer->record_disabled))
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2426
  	cpu = raw_smp_processor_id();
9e01c1b74   Rusty Russell   cpumask: convert ...
2427
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
d769041f8   Steven Rostedt   ring_buffer: impl...
2428
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2429
2430
  
  	cpu_buffer = buffer->buffers[cpu];
7a8e76a38   Steven Rostedt   tracing: unified ...
2431
2432
2433
  
  	if (atomic_read(&cpu_buffer->record_disabled))
  		goto out;
be957c447   Steven Rostedt   ring-buffer: move...
2434
2435
  	if (length > BUF_MAX_DATA_SIZE)
  		goto out;
62f0b3eb5   Steven Rostedt   ring-buffer: chec...
2436
  	event = rb_reserve_next_event(buffer, cpu_buffer, length);
7a8e76a38   Steven Rostedt   tracing: unified ...
2437
2438
2439
2440
2441
2442
2443
2444
2445
2446
2447
  	if (!event)
  		goto out;
  
  	body = rb_event_data(event);
  
  	memcpy(body, data, length);
  
  	rb_commit(cpu_buffer, event);
  
  	ret = 0;
   out:
5168ae50a   Steven Rostedt   tracing: Remove f...
2448
  	preempt_enable_notrace();
7a8e76a38   Steven Rostedt   tracing: unified ...
2449
2450
2451
  
  	return ret;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2452
  EXPORT_SYMBOL_GPL(ring_buffer_write);
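
/*
 * Illustrative sketch (not part of this file): when the payload already
 * exists, ring_buffer_write() replaces the reserve/commit pair.
 */
static int example_write_blob(struct ring_buffer *buffer,
			      const char *msg, unsigned long len)
{
	/* Length is the data size only; the event header is added internally. */
	return ring_buffer_write(buffer, len, (void *)msg);
}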
7a8e76a38   Steven Rostedt   tracing: unified ...
2453

34a148bf0   Andrew Morton   kernel/trace/ring...
2454
  static int rb_per_cpu_empty(struct ring_buffer_per_cpu *cpu_buffer)
bf41a158c   Steven Rostedt   ring-buffer: make...
2455
2456
  {
  	struct buffer_page *reader = cpu_buffer->reader_page;
77ae365ec   Steven Rostedt   ring-buffer: make...
2457
  	struct buffer_page *head = rb_set_head_page(cpu_buffer);
bf41a158c   Steven Rostedt   ring-buffer: make...
2458
  	struct buffer_page *commit = cpu_buffer->commit_page;
77ae365ec   Steven Rostedt   ring-buffer: make...
2459
2460
2461
  	/* In case of error, head will be NULL */
  	if (unlikely(!head))
  		return 1;
bf41a158c   Steven Rostedt   ring-buffer: make...
2462
2463
2464
2465
2466
  	return reader->read == rb_page_commit(reader) &&
  		(commit == reader ||
  		 (commit == head &&
  		  head->read == rb_page_commit(commit)));
  }
7a8e76a38   Steven Rostedt   tracing: unified ...
2467
  /**
7a8e76a38   Steven Rostedt   tracing: unified ...
2468
2469
2470
2471
2472
2473
2474
2475
2476
2477
2478
2479
   * ring_buffer_record_disable - stop all writes into the buffer
   * @buffer: The ring buffer to stop writes to.
   *
   * This prevents all writes to the buffer. Any attempt to write
   * to the buffer after this will fail and return NULL.
   *
   * The caller should call synchronize_sched() after this.
   */
  void ring_buffer_record_disable(struct ring_buffer *buffer)
  {
  	atomic_inc(&buffer->record_disabled);
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2480
  EXPORT_SYMBOL_GPL(ring_buffer_record_disable);
7a8e76a38   Steven Rostedt   tracing: unified ...
2481
2482
2483
2484
2485
2486
  
  /**
   * ring_buffer_record_enable - enable writes to the buffer
   * @buffer: The ring buffer to enable writes
   *
   * Note, multiple disables will need the same number of enables
c41b20e72   Adam Buchbinder   Fix misspellings ...
2487
   * to truly enable the writing (much like preempt_disable).
7a8e76a38   Steven Rostedt   tracing: unified ...
2488
2489
2490
2491
2492
   */
  void ring_buffer_record_enable(struct ring_buffer *buffer)
  {
  	atomic_dec(&buffer->record_disabled);
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2493
  EXPORT_SYMBOL_GPL(ring_buffer_record_enable);
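
/*
 * Illustrative sketch (not part of this file): quiescing writers before
 * inspecting the buffer.  Disables nest, so every disable needs a
 * matching enable.
 */
static void example_pause_recording(struct ring_buffer *buffer)
{
	ring_buffer_record_disable(buffer);
	/* Wait for writers already inside the reserve/commit window. */
	synchronize_sched();

	/* ... read or reset the buffer here ... */

	ring_buffer_record_enable(buffer);
}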
7a8e76a38   Steven Rostedt   tracing: unified ...
2494
2495
2496
2497
2498
2499
2500
2501
2502
2503
2504
2505
2506
2507
  
  /**
   * ring_buffer_record_disable_cpu - stop all writes into the cpu_buffer
   * @buffer: The ring buffer to stop writes to.
   * @cpu: The CPU buffer to stop
   *
   * This prevents all writes to the buffer. Any attempt to write
   * to the buffer after this will fail and return NULL.
   *
   * The caller should call synchronize_sched() after this.
   */
  void ring_buffer_record_disable_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
9e01c1b74   Rusty Russell   cpumask: convert ...
2508
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
2509
  		return;
7a8e76a38   Steven Rostedt   tracing: unified ...
2510
2511
2512
2513
  
  	cpu_buffer = buffer->buffers[cpu];
  	atomic_inc(&cpu_buffer->record_disabled);
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2514
  EXPORT_SYMBOL_GPL(ring_buffer_record_disable_cpu);
7a8e76a38   Steven Rostedt   tracing: unified ...
2515
2516
2517
2518
2519
2520
2521
  
  /**
   * ring_buffer_record_enable_cpu - enable writes to the buffer
   * @buffer: The ring buffer to enable writes
   * @cpu: The CPU to enable.
   *
   * Note, multiple disables will need the same number of enables
c41b20e72   Adam Buchbinder   Fix misspellings ...
2522
   * to truly enable the writing (much like preempt_disable).
7a8e76a38   Steven Rostedt   tracing: unified ...
2523
2524
2525
2526
   */
  void ring_buffer_record_enable_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
9e01c1b74   Rusty Russell   cpumask: convert ...
2527
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
2528
  		return;
7a8e76a38   Steven Rostedt   tracing: unified ...
2529
2530
2531
2532
  
  	cpu_buffer = buffer->buffers[cpu];
  	atomic_dec(&cpu_buffer->record_disabled);
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2533
  EXPORT_SYMBOL_GPL(ring_buffer_record_enable_cpu);
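
/*
 * Illustrative sketch (not part of this file): stopping writes on a single
 * CPU while the other CPUs keep tracing.
 */
static void example_pause_one_cpu(struct ring_buffer *buffer, int cpu)
{
	ring_buffer_record_disable_cpu(buffer, cpu);
	synchronize_sched();

	/* ... e.g. ring_buffer_reset_cpu(buffer, cpu) ... */

	ring_buffer_record_enable_cpu(buffer, cpu);
}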
7a8e76a38   Steven Rostedt   tracing: unified ...
2534

f6195aa09   Steven Rostedt   ring-buffer: Plac...
2535
2536
2537
2538
2539
2540
2541
2542
2543
2544
2545
2546
  /*
   * The total entries in the ring buffer is the running counter
   * of entries entered into the ring buffer, minus the sum of
   * the entries read from the ring buffer and the number of
   * entries that were overwritten.
   */
  static inline unsigned long
  rb_num_of_entries(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	return local_read(&cpu_buffer->entries) -
  		(local_read(&cpu_buffer->overrun) + cpu_buffer->read);
  }
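
/*
 * Illustrative numbers (not part of this file): with 1000 events written,
 * 100 already consumed by readers and 50 overwritten by the writer wrapping
 * around, rb_num_of_entries() reports 1000 - (50 + 100) = 850 events still
 * unread in the buffer.
 */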
7a8e76a38   Steven Rostedt   tracing: unified ...
2547
  /**
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
2548
2549
2550
2551
2552
2553
2554
2555
2556
2557
2558
2559
2560
2561
2562
   * ring_buffer_oldest_event_ts - get the oldest event timestamp from the buffer
   * @buffer: The ring buffer
   * @cpu: The per CPU buffer to read from.
   */
  unsigned long ring_buffer_oldest_event_ts(struct ring_buffer *buffer, int cpu)
  {
  	unsigned long flags;
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct buffer_page *bpage;
  	unsigned long ret;
  
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
  		return 0;
  
  	cpu_buffer = buffer->buffers[cpu];
7115e3fcf   Linus Torvalds   Merge branch 'per...
2563
  	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
2564
2565
2566
2567
2568
2569
2570
2571
2572
  	/*
  	 * if the tail is on reader_page, oldest time stamp is on the reader
  	 * page
  	 */
  	if (cpu_buffer->tail_page == cpu_buffer->reader_page)
  		bpage = cpu_buffer->reader_page;
  	else
  		bpage = rb_set_head_page(cpu_buffer);
  	ret = bpage->page->time_stamp;
7115e3fcf   Linus Torvalds   Merge branch 'per...
2573
  	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);
c64e148a3   Vaibhav Nagarnaik   trace: Add ring b...
2574
2575
2576
2577
2578
2579
2580
2581
2582
2583
2584
2585
2586
2587
2588
2589
2590
2591
2592
2593
2594
2595
2596
2597
2598
2599
  
  	return ret;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_oldest_event_ts);
  
  /**
   * ring_buffer_bytes_cpu - get the number of bytes consumed in a cpu buffer
   * @buffer: The ring buffer
   * @cpu: The per CPU buffer to read from.
   */
  unsigned long ring_buffer_bytes_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned long ret;
  
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
  		return 0;
  
  	cpu_buffer = buffer->buffers[cpu];
  	ret = local_read(&cpu_buffer->entries_bytes) - cpu_buffer->read_bytes;
  
  	return ret;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_bytes_cpu);
  
  /**
7a8e76a38   Steven Rostedt   tracing: unified ...
2600
2601
2602
2603
2604
2605
2606
   * ring_buffer_entries_cpu - get the number of entries in a cpu buffer
   * @buffer: The ring buffer
   * @cpu: The per CPU buffer to get the entries from.
   */
  unsigned long ring_buffer_entries_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
9e01c1b74   Rusty Russell   cpumask: convert ...
2607
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
2608
  		return 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
2609
2610
  
  	cpu_buffer = buffer->buffers[cpu];
554f786e2   Steven Rostedt   ring-buffer: only...
2611

f6195aa09   Steven Rostedt   ring-buffer: Plac...
2612
  	return rb_num_of_entries(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
2613
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2614
  EXPORT_SYMBOL_GPL(ring_buffer_entries_cpu);
7a8e76a38   Steven Rostedt   tracing: unified ...
2615
2616
2617
2618
2619
2620
2621
2622
2623
  
  /**
   * ring_buffer_overrun_cpu - get the number of overruns in a cpu_buffer
   * @buffer: The ring buffer
   * @cpu: The per CPU buffer to get the number of overruns from
   */
  unsigned long ring_buffer_overrun_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
8aabee573   Steven Rostedt   ring-buffer: remo...
2624
  	unsigned long ret;
7a8e76a38   Steven Rostedt   tracing: unified ...
2625

9e01c1b74   Rusty Russell   cpumask: convert ...
2626
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
2627
  		return 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
2628
2629
  
  	cpu_buffer = buffer->buffers[cpu];
77ae365ec   Steven Rostedt   ring-buffer: make...
2630
  	ret = local_read(&cpu_buffer->overrun);
554f786e2   Steven Rostedt   ring-buffer: only...
2631
2632
  
  	return ret;
7a8e76a38   Steven Rostedt   tracing: unified ...
2633
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2634
  EXPORT_SYMBOL_GPL(ring_buffer_overrun_cpu);
7a8e76a38   Steven Rostedt   tracing: unified ...
2635
2636
  
  /**
f0d2c681a   Steven Rostedt   ring-buffer: add ...
2637
2638
2639
2640
2641
2642
2643
2644
2645
2646
2647
2648
2649
2650
   * ring_buffer_commit_overrun_cpu - get the number of overruns caused by commits
   * @buffer: The ring buffer
   * @cpu: The per CPU buffer to get the number of overruns from
   */
  unsigned long
  ring_buffer_commit_overrun_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned long ret;
  
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
  		return 0;
  
  	cpu_buffer = buffer->buffers[cpu];
77ae365ec   Steven Rostedt   ring-buffer: make...
2651
  	ret = local_read(&cpu_buffer->commit_overrun);
f0d2c681a   Steven Rostedt   ring-buffer: add ...
2652
2653
2654
2655
2656
2657
  
  	return ret;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_commit_overrun_cpu);
  
  /**
7a8e76a38   Steven Rostedt   tracing: unified ...
2658
2659
2660
2661
2662
2663
2664
2665
2666
2667
2668
2669
2670
2671
2672
   * ring_buffer_entries - get the number of entries in a buffer
   * @buffer: The ring buffer
   *
   * Returns the total number of entries in the ring buffer
   * (all CPU entries)
   */
  unsigned long ring_buffer_entries(struct ring_buffer *buffer)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned long entries = 0;
  	int cpu;
  
  	/* if you care about this being correct, lock the buffer */
  	for_each_buffer_cpu(buffer, cpu) {
  		cpu_buffer = buffer->buffers[cpu];
f6195aa09   Steven Rostedt   ring-buffer: Plac...
2673
  		entries += rb_num_of_entries(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
2674
2675
2676
2677
  	}
  
  	return entries;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2678
  EXPORT_SYMBOL_GPL(ring_buffer_entries);
7a8e76a38   Steven Rostedt   tracing: unified ...
2679
2680
  
  /**
67b394f7f   Jiri Olsa   tracing: Fix comm...
2681
   * ring_buffer_overruns - get the number of overruns in buffer
7a8e76a38   Steven Rostedt   tracing: unified ...
2682
2683
2684
2685
2686
2687
2688
2689
2690
2691
2692
2693
2694
2695
   * @buffer: The ring buffer
   *
   * Returns the total number of overruns in the ring buffer
   * (all CPU entries)
   */
  unsigned long ring_buffer_overruns(struct ring_buffer *buffer)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned long overruns = 0;
  	int cpu;
  
  	/* if you care about this being correct, lock the buffer */
  	for_each_buffer_cpu(buffer, cpu) {
  		cpu_buffer = buffer->buffers[cpu];
77ae365ec   Steven Rostedt   ring-buffer: make...
2696
  		overruns += local_read(&cpu_buffer->overrun);
7a8e76a38   Steven Rostedt   tracing: unified ...
2697
2698
2699
2700
  	}
  
  	return overruns;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2701
  EXPORT_SYMBOL_GPL(ring_buffer_overruns);
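
/*
 * Illustrative sketch (not part of this file): dumping the bookkeeping
 * counters exported above.  The buffer is not locked here, so the numbers
 * are only approximate while writers are active.
 */
static void example_dump_stats(struct ring_buffer *buffer)
{
	int cpu;

	pr_info("total entries: %lu, total overruns: %lu\n",
		ring_buffer_entries(buffer), ring_buffer_overruns(buffer));

	for_each_online_cpu(cpu) {
		pr_info("cpu%d: %lu entries, %lu overruns, %lu commit overruns, %lu bytes\n",
			cpu,
			ring_buffer_entries_cpu(buffer, cpu),
			ring_buffer_overrun_cpu(buffer, cpu),
			ring_buffer_commit_overrun_cpu(buffer, cpu),
			ring_buffer_bytes_cpu(buffer, cpu));
	}
}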
7a8e76a38   Steven Rostedt   tracing: unified ...
2702

642edba5f   Steven Rostedt   ring-buffer: fix ...
2703
  static void rb_iter_reset(struct ring_buffer_iter *iter)
7a8e76a38   Steven Rostedt   tracing: unified ...
2704
2705
  {
  	struct ring_buffer_per_cpu *cpu_buffer = iter->cpu_buffer;
d769041f8   Steven Rostedt   ring_buffer: impl...
2706
2707
  	/* Iterator usage is expected to have record disabled */
  	if (list_empty(&cpu_buffer->reader_page->list)) {
77ae365ec   Steven Rostedt   ring-buffer: make...
2708
2709
2710
2711
  		iter->head_page = rb_set_head_page(cpu_buffer);
  		if (unlikely(!iter->head_page))
  			return;
  		iter->head = iter->head_page->read;
d769041f8   Steven Rostedt   ring_buffer: impl...
2712
2713
  	} else {
  		iter->head_page = cpu_buffer->reader_page;
6f807acd2   Steven Rostedt   ring-buffer: move...
2714
  		iter->head = cpu_buffer->reader_page->read;
d769041f8   Steven Rostedt   ring_buffer: impl...
2715
2716
2717
2718
  	}
  	if (iter->head)
  		iter->read_stamp = cpu_buffer->read_stamp;
  	else
abc9b56d6   Steven Rostedt   ring-buffer: move...
2719
  		iter->read_stamp = iter->head_page->page->time_stamp;
492a74f42   Steven Rostedt   ring-buffer: Chec...
2720
2721
  	iter->cache_reader_page = cpu_buffer->reader_page;
  	iter->cache_read = cpu_buffer->read;
642edba5f   Steven Rostedt   ring-buffer: fix ...
2722
  }
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
2723

642edba5f   Steven Rostedt   ring-buffer: fix ...
2724
2725
2726
2727
2728
2729
2730
2731
2732
  /**
   * ring_buffer_iter_reset - reset an iterator
   * @iter: The iterator to reset
   *
   * Resets the iterator, so that it will start from the beginning
   * again.
   */
  void ring_buffer_iter_reset(struct ring_buffer_iter *iter)
  {
554f786e2   Steven Rostedt   ring-buffer: only...
2733
  	struct ring_buffer_per_cpu *cpu_buffer;
642edba5f   Steven Rostedt   ring-buffer: fix ...
2734
  	unsigned long flags;
554f786e2   Steven Rostedt   ring-buffer: only...
2735
2736
2737
2738
  	if (!iter)
  		return;
  
  	cpu_buffer = iter->cpu_buffer;
5389f6fad   Thomas Gleixner   locking, tracing:...
2739
  	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);
642edba5f   Steven Rostedt   ring-buffer: fix ...
2740
  	rb_iter_reset(iter);
5389f6fad   Thomas Gleixner   locking, tracing:...
2741
  	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);
7a8e76a38   Steven Rostedt   tracing: unified ...
2742
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2743
  EXPORT_SYMBOL_GPL(ring_buffer_iter_reset);
7a8e76a38   Steven Rostedt   tracing: unified ...
2744
2745
2746
2747
2748
2749
2750
2751
2752
2753
  
  /**
   * ring_buffer_iter_empty - check if an iterator has no more to read
   * @iter: The iterator to check
   */
  int ring_buffer_iter_empty(struct ring_buffer_iter *iter)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  
  	cpu_buffer = iter->cpu_buffer;
bf41a158c   Steven Rostedt   ring-buffer: make...
2754
2755
  	return iter->head_page == cpu_buffer->commit_page &&
  		iter->head == rb_commit_index(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
2756
  }
c4f50183f   Robert Richter   ring_buffer: addi...
2757
  EXPORT_SYMBOL_GPL(ring_buffer_iter_empty);
7a8e76a38   Steven Rostedt   tracing: unified ...
2758
2759
2760
2761
2762
2763
  
  static void
  rb_update_read_stamp(struct ring_buffer_per_cpu *cpu_buffer,
  		     struct ring_buffer_event *event)
  {
  	u64 delta;
334d4169a   Lai Jiangshan   ring_buffer: comp...
2764
  	switch (event->type_len) {
7a8e76a38   Steven Rostedt   tracing: unified ...
2765
2766
2767
2768
2769
2770
2771
2772
2773
2774
2775
2776
2777
2778
2779
2780
2781
2782
2783
2784
2785
2786
2787
2788
2789
2790
2791
2792
2793
  	case RINGBUF_TYPE_PADDING:
  		return;
  
  	case RINGBUF_TYPE_TIME_EXTEND:
  		delta = event->array[0];
  		delta <<= TS_SHIFT;
  		delta += event->time_delta;
  		cpu_buffer->read_stamp += delta;
  		return;
  
  	case RINGBUF_TYPE_TIME_STAMP:
  		/* FIXME: not implemented */
  		return;
  
  	case RINGBUF_TYPE_DATA:
  		cpu_buffer->read_stamp += event->time_delta;
  		return;
  
  	default:
  		BUG();
  	}
  	return;
  }
  
  static void
  rb_update_iter_read_stamp(struct ring_buffer_iter *iter,
  			  struct ring_buffer_event *event)
  {
  	u64 delta;
334d4169a   Lai Jiangshan   ring_buffer: comp...
2794
  	switch (event->type_len) {
7a8e76a38   Steven Rostedt   tracing: unified ...
2795
2796
2797
2798
2799
2800
2801
2802
2803
2804
2805
2806
2807
2808
2809
2810
2811
2812
2813
2814
2815
2816
2817
  	case RINGBUF_TYPE_PADDING:
  		return;
  
  	case RINGBUF_TYPE_TIME_EXTEND:
  		delta = event->array[0];
  		delta <<= TS_SHIFT;
  		delta += event->time_delta;
  		iter->read_stamp += delta;
  		return;
  
  	case RINGBUF_TYPE_TIME_STAMP:
  		/* FIXME: not implemented */
  		return;
  
  	case RINGBUF_TYPE_DATA:
  		iter->read_stamp += event->time_delta;
  		return;
  
  	default:
  		BUG();
  	}
  	return;
  }
d769041f8   Steven Rostedt   ring_buffer: impl...
2818
2819
  static struct buffer_page *
  rb_get_reader_page(struct ring_buffer_per_cpu *cpu_buffer)
7a8e76a38   Steven Rostedt   tracing: unified ...
2820
  {
d769041f8   Steven Rostedt   ring_buffer: impl...
2821
  	struct buffer_page *reader = NULL;
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
2822
  	unsigned long overwrite;
d769041f8   Steven Rostedt   ring_buffer: impl...
2823
  	unsigned long flags;
818e3dd30   Steven Rostedt   tracing, ring-buf...
2824
  	int nr_loops = 0;
77ae365ec   Steven Rostedt   ring-buffer: make...
2825
  	int ret;
d769041f8   Steven Rostedt   ring_buffer: impl...
2826

3e03fb7f1   Steven Rostedt   ring-buffer: conv...
2827
  	local_irq_save(flags);
0199c4e68   Thomas Gleixner   locking: Convert ...
2828
  	arch_spin_lock(&cpu_buffer->lock);
d769041f8   Steven Rostedt   ring_buffer: impl...
2829
2830
  
   again:
818e3dd30   Steven Rostedt   tracing, ring-buf...
2831
2832
2833
2834
2835
2836
  	/*
  	 * This should normally only loop twice. But because the
  	 * start of the reader inserts an empty page, it causes
  	 * a case where we will loop three times. There should be no
  	 * reason to loop four times (that I know of).
  	 */
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2837
  	if (RB_WARN_ON(cpu_buffer, ++nr_loops > 3)) {
818e3dd30   Steven Rostedt   tracing, ring-buf...
2838
2839
2840
  		reader = NULL;
  		goto out;
  	}
d769041f8   Steven Rostedt   ring_buffer: impl...
2841
2842
2843
  	reader = cpu_buffer->reader_page;
  
  	/* If there's more to read, return this page */
bf41a158c   Steven Rostedt   ring-buffer: make...
2844
  	if (cpu_buffer->reader_page->read < rb_page_size(reader))
d769041f8   Steven Rostedt   ring_buffer: impl...
2845
2846
2847
  		goto out;
  
  	/* Never should we have an index greater than the size */
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2848
2849
2850
  	if (RB_WARN_ON(cpu_buffer,
  		       cpu_buffer->reader_page->read > rb_page_size(reader)))
  		goto out;
d769041f8   Steven Rostedt   ring_buffer: impl...
2851
2852
2853
  
  	/* check if we caught up to the tail */
  	reader = NULL;
bf41a158c   Steven Rostedt   ring-buffer: make...
2854
  	if (cpu_buffer->commit_page == cpu_buffer->reader_page)
d769041f8   Steven Rostedt   ring_buffer: impl...
2855
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
2856
2857
  
  	/*
d769041f8   Steven Rostedt   ring_buffer: impl...
2858
  	 * Reset the reader page to size zero.
7a8e76a38   Steven Rostedt   tracing: unified ...
2859
  	 */
77ae365ec   Steven Rostedt   ring-buffer: make...
2860
2861
2862
  	local_set(&cpu_buffer->reader_page->write, 0);
  	local_set(&cpu_buffer->reader_page->entries, 0);
  	local_set(&cpu_buffer->reader_page->page->commit, 0);
ff0ff84a0   Steven Rostedt   ring-buffer: Add ...
2863
  	cpu_buffer->reader_page->real_end = 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
2864

77ae365ec   Steven Rostedt   ring-buffer: make...
2865
2866
2867
2868
2869
   spin:
  	/*
  	 * Splice the empty reader page into the list around the head.
  	 */
  	reader = rb_set_head_page(cpu_buffer);
0e1ff5d72   Steven Rostedt   ring-buffer: Add ...
2870
  	cpu_buffer->reader_page->list.next = rb_list_head(reader->list.next);
d769041f8   Steven Rostedt   ring_buffer: impl...
2871
  	cpu_buffer->reader_page->list.prev = reader->list.prev;
bf41a158c   Steven Rostedt   ring-buffer: make...
2872

3adc54fa8   Steven Rostedt   ring-buffer: make...
2873
2874
2875
  	/*
  	 * cpu_buffer->pages just needs to point to the buffer, it
	 *  has no specific buffer page to point to. Let's move it out
25985edce   Lucas De Marchi   Fix common misspe...
2876
  	 *  of our way so we don't accidentally swap it.
3adc54fa8   Steven Rostedt   ring-buffer: make...
2877
2878
  	 */
  	cpu_buffer->pages = reader->list.prev;
77ae365ec   Steven Rostedt   ring-buffer: make...
2879
2880
  	/* The reader page will be pointing to the new head */
  	rb_set_list_to_head(cpu_buffer, &cpu_buffer->reader_page->list);
7a8e76a38   Steven Rostedt   tracing: unified ...
2881

77ae365ec   Steven Rostedt   ring-buffer: make...
2882
  	/*
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
2883
2884
2885
2886
2887
2888
2889
2890
2891
2892
2893
2894
  	 * We want to make sure we read the overruns after we set up our
  	 * pointers to the next object. The writer side does a
  	 * cmpxchg to cross pages which acts as the mb on the writer
  	 * side. Note, the reader will constantly fail the swap
  	 * while the writer is updating the pointers, so this
  	 * guarantees that the overwrite recorded here is the one we
  	 * want to compare with the last_overrun.
  	 */
  	smp_mb();
  	overwrite = local_read(&(cpu_buffer->overrun));
  
  	/*
77ae365ec   Steven Rostedt   ring-buffer: make...
2895
2896
2897
2898
2899
2900
2901
2902
2903
2904
2905
  	 * Here's the tricky part.
  	 *
  	 * We need to move the pointer past the header page.
  	 * But we can only do that if a writer is not currently
  	 * moving it. The page before the header page has the
  	 * flag bit '1' set if it is pointing to the page we want.
	 * But if the writer is in the process of moving it,
	 * then it will be '2' or already moved '0'.
  	 */
  
  	ret = rb_head_page_replace(reader, cpu_buffer->reader_page);
7a8e76a38   Steven Rostedt   tracing: unified ...
2906
2907
  
  	/*
77ae365ec   Steven Rostedt   ring-buffer: make...
2908
  	 * If we did not convert it, then we must try again.
7a8e76a38   Steven Rostedt   tracing: unified ...
2909
  	 */
77ae365ec   Steven Rostedt   ring-buffer: make...
2910
2911
  	if (!ret)
  		goto spin;
7a8e76a38   Steven Rostedt   tracing: unified ...
2912

77ae365ec   Steven Rostedt   ring-buffer: make...
2913
2914
2915
2916
2917
  	/*
  	 * Yeah! We succeeded in replacing the page.
  	 *
  	 * Now make the new head point back to the reader page.
  	 */
5ded3dc6a   David Sharp   ring-buffer: Wrap...
2918
  	rb_list_head(reader->list.next)->prev = &cpu_buffer->reader_page->list;
77ae365ec   Steven Rostedt   ring-buffer: make...
2919
  	rb_inc_page(cpu_buffer, &cpu_buffer->head_page);
d769041f8   Steven Rostedt   ring_buffer: impl...
2920
2921
2922
2923
  
  	/* Finally update the reader page to the new head */
  	cpu_buffer->reader_page = reader;
  	rb_reset_reader_page(cpu_buffer);
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
2924
2925
2926
2927
  	if (overwrite != cpu_buffer->last_overrun) {
  		cpu_buffer->lost_events = overwrite - cpu_buffer->last_overrun;
  		cpu_buffer->last_overrun = overwrite;
  	}
d769041f8   Steven Rostedt   ring_buffer: impl...
2928
2929
2930
  	goto again;
  
   out:
0199c4e68   Thomas Gleixner   locking: Convert ...
2931
  	arch_spin_unlock(&cpu_buffer->lock);
3e03fb7f1   Steven Rostedt   ring-buffer: conv...
2932
  	local_irq_restore(flags);
d769041f8   Steven Rostedt   ring_buffer: impl...
2933
2934
2935
2936
2937
2938
2939
2940
2941
2942
2943
  
  	return reader;
  }
  
  static void rb_advance_reader(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	struct ring_buffer_event *event;
  	struct buffer_page *reader;
  	unsigned length;
  
  	reader = rb_get_reader_page(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
2944

d769041f8   Steven Rostedt   ring_buffer: impl...
2945
  	/* This function should not be called when buffer is empty */
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2946
2947
  	if (RB_WARN_ON(cpu_buffer, !reader))
  		return;
7a8e76a38   Steven Rostedt   tracing: unified ...
2948

d769041f8   Steven Rostedt   ring_buffer: impl...
2949
  	event = rb_reader_event(cpu_buffer);
a1863c212   Steven Rostedt   ring-buffer: do n...
2950
  	if (event->type_len <= RINGBUF_TYPE_DATA_TYPE_LEN_MAX)
e4906eff9   Steven Rostedt   ring-buffer: conv...
2951
  		cpu_buffer->read++;
d769041f8   Steven Rostedt   ring_buffer: impl...
2952
2953
2954
2955
  
  	rb_update_read_stamp(cpu_buffer, event);
  
  	length = rb_event_length(event);
6f807acd2   Steven Rostedt   ring-buffer: move...
2956
  	cpu_buffer->reader_page->read += length;
7a8e76a38   Steven Rostedt   tracing: unified ...
2957
2958
2959
2960
  }
  
  static void rb_advance_iter(struct ring_buffer_iter *iter)
  {
7a8e76a38   Steven Rostedt   tracing: unified ...
2961
2962
2963
2964
2965
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct ring_buffer_event *event;
  	unsigned length;
  
  	cpu_buffer = iter->cpu_buffer;
7a8e76a38   Steven Rostedt   tracing: unified ...
2966
2967
2968
2969
  
  	/*
  	 * Check if we are at the end of the buffer.
  	 */
bf41a158c   Steven Rostedt   ring-buffer: make...
2970
  	if (iter->head >= rb_page_size(iter->head_page)) {
ea05b57cc   Steven Rostedt   ring-buffer: disc...
2971
2972
  		/* discarded commits can make the page empty */
  		if (iter->head_page == cpu_buffer->commit_page)
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2973
  			return;
d769041f8   Steven Rostedt   ring_buffer: impl...
2974
  		rb_inc_iter(iter);
7a8e76a38   Steven Rostedt   tracing: unified ...
2975
2976
2977
2978
2979
2980
2981
2982
2983
2984
2985
  		return;
  	}
  
  	event = rb_iter_head_event(iter);
  
  	length = rb_event_length(event);
  
  	/*
  	 * This should not be called to advance the header if we are
  	 * at the tail of the buffer.
  	 */
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2986
  	if (RB_WARN_ON(cpu_buffer,
f536aafc5   Steven Rostedt   ring-buffer: repl...
2987
  		       (iter->head_page == cpu_buffer->commit_page) &&
3e89c7bb9   Steven Rostedt   ring-buffer: clea...
2988
2989
  		       (iter->head + length > rb_commit_index(cpu_buffer))))
  		return;
7a8e76a38   Steven Rostedt   tracing: unified ...
2990
2991
2992
2993
2994
2995
  
  	rb_update_iter_read_stamp(iter, event);
  
  	iter->head += length;
  
  	/* check for end of page padding */
bf41a158c   Steven Rostedt   ring-buffer: make...
2996
2997
  	if ((iter->head >= rb_page_size(iter->head_page)) &&
  	    (iter->head_page != cpu_buffer->commit_page))
7a8e76a38   Steven Rostedt   tracing: unified ...
2998
2999
  		rb_advance_iter(iter);
  }
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3000
3001
3002
3003
  static int rb_lost_events(struct ring_buffer_per_cpu *cpu_buffer)
  {
  	return cpu_buffer->lost_events;
  }
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3004
  static struct ring_buffer_event *
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3005
3006
  rb_buffer_peek(struct ring_buffer_per_cpu *cpu_buffer, u64 *ts,
  	       unsigned long *lost_events)
7a8e76a38   Steven Rostedt   tracing: unified ...
3007
  {
7a8e76a38   Steven Rostedt   tracing: unified ...
3008
  	struct ring_buffer_event *event;
d769041f8   Steven Rostedt   ring_buffer: impl...
3009
  	struct buffer_page *reader;
818e3dd30   Steven Rostedt   tracing, ring-buf...
3010
  	int nr_loops = 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
3011

7a8e76a38   Steven Rostedt   tracing: unified ...
3012
   again:
818e3dd30   Steven Rostedt   tracing, ring-buf...
3013
  	/*
69d1b839f   Steven Rostedt   ring-buffer: Bind...
3014
3015
3016
3017
  	 * We repeat when a time extend is encountered.
  	 * Since the time extend is always attached to a data event,
  	 * we should never loop more than once.
  	 * (We never hit the following condition more than twice).
818e3dd30   Steven Rostedt   tracing, ring-buf...
3018
  	 */
69d1b839f   Steven Rostedt   ring-buffer: Bind...
3019
  	if (RB_WARN_ON(cpu_buffer, ++nr_loops > 2))
818e3dd30   Steven Rostedt   tracing, ring-buf...
3020
  		return NULL;
818e3dd30   Steven Rostedt   tracing, ring-buf...
3021

d769041f8   Steven Rostedt   ring_buffer: impl...
3022
3023
  	reader = rb_get_reader_page(cpu_buffer);
  	if (!reader)
7a8e76a38   Steven Rostedt   tracing: unified ...
3024
  		return NULL;
d769041f8   Steven Rostedt   ring_buffer: impl...
3025
  	event = rb_reader_event(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
3026

334d4169a   Lai Jiangshan   ring_buffer: comp...
3027
  	switch (event->type_len) {
7a8e76a38   Steven Rostedt   tracing: unified ...
3028
  	case RINGBUF_TYPE_PADDING:
2d622719f   Tom Zanussi   tracing: add ring...
3029
3030
3031
3032
3033
3034
3035
3036
3037
3038
  		if (rb_null_event(event))
  			RB_WARN_ON(cpu_buffer, 1);
  		/*
  		 * Because the writer could be discarding every
  		 * event it creates (which would probably be bad)
  		 * if we were to go back to "again" then we may never
  		 * catch up, and will trigger the warn on, or lock
  		 * the box. Return the padding, and we will release
  		 * the current locks, and try again.
  		 */
2d622719f   Tom Zanussi   tracing: add ring...
3039
  		return event;
7a8e76a38   Steven Rostedt   tracing: unified ...
3040
3041
3042
  
  	case RINGBUF_TYPE_TIME_EXTEND:
  		/* Internal data, OK to advance */
d769041f8   Steven Rostedt   ring_buffer: impl...
3043
  		rb_advance_reader(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
3044
3045
3046
3047
  		goto again;
  
  	case RINGBUF_TYPE_TIME_STAMP:
  		/* FIXME: not implemented */
d769041f8   Steven Rostedt   ring_buffer: impl...
3048
  		rb_advance_reader(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
3049
3050
3051
3052
3053
  		goto again;
  
  	case RINGBUF_TYPE_DATA:
  		if (ts) {
  			*ts = cpu_buffer->read_stamp + event->time_delta;
d8eeb2d3b   Robert Richter   ring-buffer: cons...
3054
  			ring_buffer_normalize_time_stamp(cpu_buffer->buffer,
37886f6a9   Steven Rostedt   ring-buffer: add ...
3055
  							 cpu_buffer->cpu, ts);
7a8e76a38   Steven Rostedt   tracing: unified ...
3056
  		}
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3057
3058
  		if (lost_events)
  			*lost_events = rb_lost_events(cpu_buffer);
7a8e76a38   Steven Rostedt   tracing: unified ...
3059
3060
3061
3062
3063
3064
3065
3066
  		return event;
  
  	default:
  		BUG();
  	}
  
  	return NULL;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3067
  EXPORT_SYMBOL_GPL(ring_buffer_peek);
7a8e76a38   Steven Rostedt   tracing: unified ...
3068

f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3069
3070
  static struct ring_buffer_event *
  rb_iter_peek(struct ring_buffer_iter *iter, u64 *ts)
7a8e76a38   Steven Rostedt   tracing: unified ...
3071
3072
3073
3074
  {
  	struct ring_buffer *buffer;
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct ring_buffer_event *event;
818e3dd30   Steven Rostedt   tracing, ring-buf...
3075
  	int nr_loops = 0;
7a8e76a38   Steven Rostedt   tracing: unified ...
3076

7a8e76a38   Steven Rostedt   tracing: unified ...
3077
3078
  	cpu_buffer = iter->cpu_buffer;
  	buffer = cpu_buffer->buffer;
492a74f42   Steven Rostedt   ring-buffer: Chec...
3079
3080
3081
3082
3083
3084
3085
3086
  	/*
  	 * Check if someone performed a consuming read to
  	 * the buffer. A consuming read invalidates the iterator
  	 * and we need to reset the iterator in this case.
  	 */
  	if (unlikely(iter->cache_read != cpu_buffer->read ||
  		     iter->cache_reader_page != cpu_buffer->reader_page))
  		rb_iter_reset(iter);
7a8e76a38   Steven Rostedt   tracing: unified ...
3087
   again:
3c05d7482   Steven Rostedt   ring-buffer: Chec...
3088
3089
  	if (ring_buffer_iter_empty(iter))
  		return NULL;
818e3dd30   Steven Rostedt   tracing, ring-buf...
3090
  	/*
69d1b839f   Steven Rostedt   ring-buffer: Bind...
3091
3092
3093
3094
  	 * We repeat when a time extend is encountered.
  	 * Since the time extend is always attached to a data event,
  	 * we should never loop more than once.
  	 * (We never hit the following condition more than twice).
818e3dd30   Steven Rostedt   tracing, ring-buf...
3095
  	 */
69d1b839f   Steven Rostedt   ring-buffer: Bind...
3096
  	if (RB_WARN_ON(cpu_buffer, ++nr_loops > 2))
818e3dd30   Steven Rostedt   tracing, ring-buf...
3097
  		return NULL;
818e3dd30   Steven Rostedt   tracing, ring-buf...
3098

7a8e76a38   Steven Rostedt   tracing: unified ...
3099
3100
  	if (rb_per_cpu_empty(cpu_buffer))
  		return NULL;
3c05d7482   Steven Rostedt   ring-buffer: Chec...
3101
3102
3103
3104
  	if (iter->head >= local_read(&iter->head_page->page->commit)) {
  		rb_inc_iter(iter);
  		goto again;
  	}
7a8e76a38   Steven Rostedt   tracing: unified ...
3105
  	event = rb_iter_head_event(iter);
334d4169a   Lai Jiangshan   ring_buffer: comp...
3106
  	switch (event->type_len) {
7a8e76a38   Steven Rostedt   tracing: unified ...
3107
  	case RINGBUF_TYPE_PADDING:
2d622719f   Tom Zanussi   tracing: add ring...
3108
3109
3110
3111
3112
3113
  		if (rb_null_event(event)) {
  			rb_inc_iter(iter);
  			goto again;
  		}
  		rb_advance_iter(iter);
  		return event;
7a8e76a38   Steven Rostedt   tracing: unified ...
3114
3115
3116
3117
3118
3119
3120
3121
3122
3123
3124
3125
3126
3127
  
  	case RINGBUF_TYPE_TIME_EXTEND:
  		/* Internal data, OK to advance */
  		rb_advance_iter(iter);
  		goto again;
  
  	case RINGBUF_TYPE_TIME_STAMP:
  		/* FIXME: not implemented */
  		rb_advance_iter(iter);
  		goto again;
  
  	case RINGBUF_TYPE_DATA:
  		if (ts) {
  			*ts = iter->read_stamp + event->time_delta;
37886f6a9   Steven Rostedt   ring-buffer: add ...
3128
3129
  			ring_buffer_normalize_time_stamp(buffer,
  							 cpu_buffer->cpu, ts);
7a8e76a38   Steven Rostedt   tracing: unified ...
3130
3131
3132
3133
3134
3135
3136
3137
3138
  		}
  		return event;
  
  	default:
  		BUG();
  	}
  
  	return NULL;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3139
  EXPORT_SYMBOL_GPL(ring_buffer_iter_peek);
7a8e76a38   Steven Rostedt   tracing: unified ...
3140

8d707e8eb   Steven Rostedt   ring-buffer: do n...
3141
3142
3143
3144
3145
3146
3147
3148
  static inline int rb_ok_to_lock(void)
  {
  	/*
  	 * If an NMI die dumps out the content of the ring buffer
  	 * do not grab locks. We also permanently disable the ring
	 * buffer. A one-time deal is all you get from reading
  	 * the ring buffer from an NMI.
  	 */
464e85eb0   Steven Rostedt   ring-buffer: do n...
3149
  	if (likely(!in_nmi()))
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3150
3151
3152
3153
3154
  		return 1;
  
  	tracing_off_permanent();
  	return 0;
  }
7a8e76a38   Steven Rostedt   tracing: unified ...
3155
  /**
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3156
3157
3158
3159
   * ring_buffer_peek - peek at the next event to be read
   * @buffer: The ring buffer to read
 * @cpu: The cpu to peek at
   * @ts: The timestamp counter of this event.
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3160
   * @lost_events: a variable to store if events were lost (may be NULL)
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3161
3162
3163
3164
3165
   *
   * This will return the event that will be read next, but does
   * not consume the data.
   */
  struct ring_buffer_event *
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3166
3167
  ring_buffer_peek(struct ring_buffer *buffer, int cpu, u64 *ts,
  		 unsigned long *lost_events)
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3168
3169
  {
  	struct ring_buffer_per_cpu *cpu_buffer = buffer->buffers[cpu];
8aabee573   Steven Rostedt   ring-buffer: remo...
3170
  	struct ring_buffer_event *event;
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3171
  	unsigned long flags;
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3172
  	int dolock;
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3173

554f786e2   Steven Rostedt   ring-buffer: only...
3174
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
3175
  		return NULL;
554f786e2   Steven Rostedt   ring-buffer: only...
3176

8d707e8eb   Steven Rostedt   ring-buffer: do n...
3177
  	dolock = rb_ok_to_lock();
2d622719f   Tom Zanussi   tracing: add ring...
3178
   again:
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3179
3180
  	local_irq_save(flags);
  	if (dolock)
5389f6fad   Thomas Gleixner   locking, tracing:...
3181
  		raw_spin_lock(&cpu_buffer->reader_lock);
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3182
  	event = rb_buffer_peek(cpu_buffer, ts, lost_events);
469535a59   Robert Richter   ring-buffer: Fix ...
3183
3184
  	if (event && event->type_len == RINGBUF_TYPE_PADDING)
  		rb_advance_reader(cpu_buffer);
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3185
  	if (dolock)
5389f6fad   Thomas Gleixner   locking, tracing:...
3186
  		raw_spin_unlock(&cpu_buffer->reader_lock);
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3187
  	local_irq_restore(flags);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3188

1b959e18c   Steven Rostedt   ring-buffer: remo...
3189
  	if (event && event->type_len == RINGBUF_TYPE_PADDING)
2d622719f   Tom Zanussi   tracing: add ring...
3190
  		goto again;
2d622719f   Tom Zanussi   tracing: add ring...
3191

f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3192
3193
3194
3195
3196
3197
3198
3199
3200
3201
3202
3203
3204
3205
3206
3207
3208
  	return event;
  }
  
  /**
   * ring_buffer_iter_peek - peek at the next event to be read
   * @iter: The ring buffer iterator
   * @ts: The timestamp counter of this event.
   *
   * This will return the event that will be read next, but does
   * not increment the iterator.
   */
  struct ring_buffer_event *
  ring_buffer_iter_peek(struct ring_buffer_iter *iter, u64 *ts)
  {
  	struct ring_buffer_per_cpu *cpu_buffer = iter->cpu_buffer;
  	struct ring_buffer_event *event;
  	unsigned long flags;
2d622719f   Tom Zanussi   tracing: add ring...
3209
   again:
5389f6fad   Thomas Gleixner   locking, tracing:...
3210
  	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3211
  	event = rb_iter_peek(iter, ts);
5389f6fad   Thomas Gleixner   locking, tracing:...
3212
  	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3213

1b959e18c   Steven Rostedt   ring-buffer: remo...
3214
  	if (event && event->type_len == RINGBUF_TYPE_PADDING)
2d622719f   Tom Zanussi   tracing: add ring...
3215
  		goto again;
2d622719f   Tom Zanussi   tracing: add ring...
3216

f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3217
3218
3219
3220
  	return event;
  }
  
  /**
7a8e76a38   Steven Rostedt   tracing: unified ...
3221
3222
   * ring_buffer_consume - return an event and consume it
   * @buffer: The ring buffer to get the next event from
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3223
3224
3225
   * @cpu: the cpu to read the buffer from
   * @ts: a variable to store the timestamp (may be NULL)
   * @lost_events: a variable to store if events were lost (may be NULL)
7a8e76a38   Steven Rostedt   tracing: unified ...
3226
3227
3228
3229
3230
3231
   *
   * Returns the next event in the ring buffer, and that event is consumed.
   * Meaning, that sequential reads will keep returning a different event,
   * and eventually empty the ring buffer if the producer is slower.
   */
  struct ring_buffer_event *
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3232
3233
  ring_buffer_consume(struct ring_buffer *buffer, int cpu, u64 *ts,
  		    unsigned long *lost_events)
7a8e76a38   Steven Rostedt   tracing: unified ...
3234
  {
554f786e2   Steven Rostedt   ring-buffer: only...
3235
3236
  	struct ring_buffer_per_cpu *cpu_buffer;
  	struct ring_buffer_event *event = NULL;
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3237
  	unsigned long flags;
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3238
3239
3240
  	int dolock;
  
  	dolock = rb_ok_to_lock();
7a8e76a38   Steven Rostedt   tracing: unified ...
3241

2d622719f   Tom Zanussi   tracing: add ring...
3242
   again:
554f786e2   Steven Rostedt   ring-buffer: only...
3243
3244
  	/* might be called in atomic */
  	preempt_disable();
9e01c1b74   Rusty Russell   cpumask: convert ...
3245
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
554f786e2   Steven Rostedt   ring-buffer: only...
3246
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
3247

554f786e2   Steven Rostedt   ring-buffer: only...
3248
  	cpu_buffer = buffer->buffers[cpu];
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3249
3250
  	local_irq_save(flags);
  	if (dolock)
5389f6fad   Thomas Gleixner   locking, tracing:...
3251
  		raw_spin_lock(&cpu_buffer->reader_lock);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3252

66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3253
3254
3255
  	event = rb_buffer_peek(cpu_buffer, ts, lost_events);
  	if (event) {
  		cpu_buffer->lost_events = 0;
469535a59   Robert Richter   ring-buffer: Fix ...
3256
  		rb_advance_reader(cpu_buffer);
66a8cb95e   Steven Rostedt   ring-buffer: Add ...
3257
  	}
7a8e76a38   Steven Rostedt   tracing: unified ...
3258

8d707e8eb   Steven Rostedt   ring-buffer: do n...
3259
  	if (dolock)
5389f6fad   Thomas Gleixner   locking, tracing:...
3260
  		raw_spin_unlock(&cpu_buffer->reader_lock);
8d707e8eb   Steven Rostedt   ring-buffer: do n...
3261
  	local_irq_restore(flags);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3262

554f786e2   Steven Rostedt   ring-buffer: only...
3263
3264
   out:
  	preempt_enable();
1b959e18c   Steven Rostedt   ring-buffer: remo...
3265
  	if (event && event->type_len == RINGBUF_TYPE_PADDING)
2d622719f   Tom Zanussi   tracing: add ring...
3266
  		goto again;
2d622719f   Tom Zanussi   tracing: add ring...
3267

7a8e76a38   Steven Rostedt   tracing: unified ...
3268
3269
  	return event;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3270
  EXPORT_SYMBOL_GPL(ring_buffer_consume);
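
/*
 * Illustrative sketch (not part of this file): draining one CPU's buffer
 * with the consuming-read interface.  Each successful call removes the
 * event, so the loop eventually empties the buffer if the writer stops.
 */
static void example_drain_cpu(struct ring_buffer *buffer, int cpu)
{
	struct ring_buffer_event *event;
	unsigned long lost;
	u64 ts;

	while ((event = ring_buffer_consume(buffer, cpu, &ts, &lost))) {
		if (lost)
			pr_info("cpu%d: lost %lu events\n", cpu, lost);
		pr_info("cpu%d: ts=%llu len=%u\n", cpu,
			(unsigned long long)ts,
			ring_buffer_event_length(event));
		/* ring_buffer_event_data(event) points at the payload. */
	}
}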
7a8e76a38   Steven Rostedt   tracing: unified ...
3271
3272
  
  /**
72c9ddfd4   David Miller   ring-buffer: Make...
3273
   * ring_buffer_read_prepare - Prepare for a non consuming read of the buffer
7a8e76a38   Steven Rostedt   tracing: unified ...
3274
3275
3276
   * @buffer: The ring buffer to read from
   * @cpu: The cpu buffer to iterate over
   *
72c9ddfd4   David Miller   ring-buffer: Make...
3277
3278
3279
   * This performs the initial preparations necessary to iterate
   * through the buffer.  Memory is allocated, buffer recording
   * is disabled, and the iterator pointer is returned to the caller.
7a8e76a38   Steven Rostedt   tracing: unified ...
3280
   *
72c9ddfd4   David Miller   ring-buffer: Make...
3281
3282
3283
3284
3285
3286
3287
3288
3289
3290
 * Disabling buffer recording prevents the reading from being
   * corrupted. This is not a consuming read, so a producer is not
   * expected.
   *
   * After a sequence of ring_buffer_read_prepare calls, the user is
   * expected to make at least one call to ring_buffer_prepare_sync.
   * Afterwards, ring_buffer_read_start is invoked to get things going
   * for real.
   *
 * This overall must be paired with ring_buffer_read_finish.
7a8e76a38   Steven Rostedt   tracing: unified ...
3291
3292
   */
  struct ring_buffer_iter *
72c9ddfd4   David Miller   ring-buffer: Make...
3293
  ring_buffer_read_prepare(struct ring_buffer *buffer, int cpu)
7a8e76a38   Steven Rostedt   tracing: unified ...
3294
3295
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
8aabee573   Steven Rostedt   ring-buffer: remo...
3296
  	struct ring_buffer_iter *iter;
7a8e76a38   Steven Rostedt   tracing: unified ...
3297

9e01c1b74   Rusty Russell   cpumask: convert ...
3298
  	if (!cpumask_test_cpu(cpu, buffer->cpumask))
8aabee573   Steven Rostedt   ring-buffer: remo...
3299
  		return NULL;
7a8e76a38   Steven Rostedt   tracing: unified ...
3300
3301
3302
  
  	iter = kmalloc(sizeof(*iter), GFP_KERNEL);
  	if (!iter)
8aabee573   Steven Rostedt   ring-buffer: remo...
3303
  		return NULL;
7a8e76a38   Steven Rostedt   tracing: unified ...
3304
3305
3306
3307
3308
3309
  
  	cpu_buffer = buffer->buffers[cpu];
  
  	iter->cpu_buffer = cpu_buffer;
  
  	atomic_inc(&cpu_buffer->record_disabled);
72c9ddfd4   David Miller   ring-buffer: Make...
3310
3311
3312
3313
3314
3315
3316
3317
3318
3319
3320
3321
3322
3323
3324
  
  	return iter;
  }
  EXPORT_SYMBOL_GPL(ring_buffer_read_prepare);
  
  /**
   * ring_buffer_read_prepare_sync - Synchronize a set of prepare calls
   *
   * All previously invoked ring_buffer_read_prepare calls to prepare
 * iterators will be synchronized.  Afterwards, ring_buffer_read_start
   * calls on those iterators are allowed.
   */
  void
  ring_buffer_read_prepare_sync(void)
  {
7a8e76a38   Steven Rostedt   tracing: unified ...
3325
  	synchronize_sched();
72c9ddfd4   David Miller   ring-buffer: Make...
3326
3327
3328
3329
3330
3331
3332
3333
3334
3335
3336
3337
3338
3339
3340
3341
3342
3343
3344
3345
3346
3347
3348
3349
  }
  EXPORT_SYMBOL_GPL(ring_buffer_read_prepare_sync);
  
  /**
   * ring_buffer_read_start - start a non consuming read of the buffer
   * @iter: The iterator returned by ring_buffer_read_prepare
   *
   * This finalizes the startup of an iteration through the buffer.
   * The iterator comes from a call to ring_buffer_read_prepare and
   * an intervening ring_buffer_read_prepare_sync must have been
   * performed.
   *
 * Must be paired with ring_buffer_read_finish.
   */
  void
  ring_buffer_read_start(struct ring_buffer_iter *iter)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
  	unsigned long flags;
  
  	if (!iter)
  		return;
  
  	cpu_buffer = iter->cpu_buffer;
7a8e76a38   Steven Rostedt   tracing: unified ...
3350

5389f6fad   Thomas Gleixner   locking, tracing:...
3351
  	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);
0199c4e68   Thomas Gleixner   locking: Convert ...
3352
  	arch_spin_lock(&cpu_buffer->lock);
642edba5f   Steven Rostedt   ring-buffer: fix ...
3353
  	rb_iter_reset(iter);
0199c4e68   Thomas Gleixner   locking: Convert ...
3354
  	arch_spin_unlock(&cpu_buffer->lock);
5389f6fad   Thomas Gleixner   locking, tracing:...
3355
  	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);
7a8e76a38   Steven Rostedt   tracing: unified ...
3356
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3357
  EXPORT_SYMBOL_GPL(ring_buffer_read_start);
7a8e76a38   Steven Rostedt   tracing: unified ...
3358
3359
3360
3361
3362
3363
3364
3365
3366
3367
3368
3369
3370
3371
3372
3373
  
  /**
 * ring_buffer_read_finish - finish reading the iterator of the buffer
 * @iter: The iterator retrieved by ring_buffer_read_start
   *
   * This re-enables the recording to the buffer, and frees the
   * iterator.
   */
  void
  ring_buffer_read_finish(struct ring_buffer_iter *iter)
  {
  	struct ring_buffer_per_cpu *cpu_buffer = iter->cpu_buffer;
  
  	atomic_dec(&cpu_buffer->record_disabled);
  	kfree(iter);
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3374
  EXPORT_SYMBOL_GPL(ring_buffer_read_finish);
7a8e76a38   Steven Rostedt   tracing: unified ...
3375
3376
3377
3378
3379
3380
3381
3382
3383
3384
3385
3386
  
  /**
   * ring_buffer_read - read the next item in the ring buffer by the iterator
   * @iter: The ring buffer iterator
   * @ts: The time stamp of the event read.
   *
   * This reads the next event in the ring buffer and increments the iterator.
   */
  struct ring_buffer_event *
  ring_buffer_read(struct ring_buffer_iter *iter, u64 *ts)
  {
  	struct ring_buffer_event *event;
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3387
3388
  	struct ring_buffer_per_cpu *cpu_buffer = iter->cpu_buffer;
  	unsigned long flags;
7a8e76a38   Steven Rostedt   tracing: unified ...
3389

5389f6fad   Thomas Gleixner   locking, tracing:...
3390
  	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);
7e9391cfe   Steven Rostedt   ring-buffer: fix ...
3391
   again:
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3392
  	event = rb_iter_peek(iter, ts);
7a8e76a38   Steven Rostedt   tracing: unified ...
3393
  	if (!event)
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3394
  		goto out;
7a8e76a38   Steven Rostedt   tracing: unified ...
3395

7e9391cfe   Steven Rostedt   ring-buffer: fix ...
3396
3397
  	if (event->type_len == RINGBUF_TYPE_PADDING)
  		goto again;
7a8e76a38   Steven Rostedt   tracing: unified ...
3398
  	rb_advance_iter(iter);
f83c9d0fe   Steven Rostedt   ring-buffer: add ...
3399
   out:
5389f6fad   Thomas Gleixner   locking, tracing:...
3400
  	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);
7a8e76a38   Steven Rostedt   tracing: unified ...
3401
3402
3403
  
  	return event;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3404
  EXPORT_SYMBOL_GPL(ring_buffer_read);
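
/*
 * Illustrative sketch (not part of this file): the full non-consuming
 * iterator sequence -- prepare, sync, start, read, finish.  Events stay
 * in the buffer; recording is disabled for the lifetime of the iterator.
 */
static void example_iterate_cpu(struct ring_buffer *buffer, int cpu)
{
	struct ring_buffer_iter *iter;
	struct ring_buffer_event *event;
	u64 ts;

	iter = ring_buffer_read_prepare(buffer, cpu);
	if (!iter)
		return;
	ring_buffer_read_prepare_sync();
	ring_buffer_read_start(iter);

	while ((event = ring_buffer_read(iter, &ts)))
		pr_info("cpu%d: ts=%llu len=%u\n", cpu,
			(unsigned long long)ts,
			ring_buffer_event_length(event));

	/* Re-enables recording and frees the iterator. */
	ring_buffer_read_finish(iter);
}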
7a8e76a38   Steven Rostedt   tracing: unified ...
3405
3406
3407
3408
3409
3410
3411
3412
3413
  
  /**
   * ring_buffer_size - return the size of the ring buffer (in bytes)
   * @buffer: The ring buffer.
   */
  unsigned long ring_buffer_size(struct ring_buffer *buffer)
  {
  	return BUF_PAGE_SIZE * buffer->pages;
  }
c4f50183f   Robert Richter   ring_buffer: addi...
3414
  EXPORT_SYMBOL_GPL(ring_buffer_size);
7a8e76a38   Steven Rostedt   tracing: unified ...
3415
3416
3417
3418
  
  static void
  rb_reset_cpu(struct ring_buffer_per_cpu *cpu_buffer)
  {
	rb_head_page_deactivate(cpu_buffer);

	cpu_buffer->head_page
		= list_entry(cpu_buffer->pages, struct buffer_page, list);
	local_set(&cpu_buffer->head_page->write, 0);
	local_set(&cpu_buffer->head_page->entries, 0);
	local_set(&cpu_buffer->head_page->page->commit, 0);

	cpu_buffer->head_page->read = 0;

	cpu_buffer->tail_page = cpu_buffer->head_page;
	cpu_buffer->commit_page = cpu_buffer->head_page;

	INIT_LIST_HEAD(&cpu_buffer->reader_page->list);
	local_set(&cpu_buffer->reader_page->write, 0);
	local_set(&cpu_buffer->reader_page->entries, 0);
	local_set(&cpu_buffer->reader_page->page->commit, 0);
	cpu_buffer->reader_page->read = 0;

	local_set(&cpu_buffer->commit_overrun, 0);
	local_set(&cpu_buffer->entries_bytes, 0);
	local_set(&cpu_buffer->overrun, 0);
	local_set(&cpu_buffer->entries, 0);
	local_set(&cpu_buffer->committing, 0);
	local_set(&cpu_buffer->commits, 0);
	cpu_buffer->read = 0;
	cpu_buffer->read_bytes = 0;

	cpu_buffer->write_stamp = 0;
	cpu_buffer->read_stamp = 0;

	cpu_buffer->lost_events = 0;
	cpu_buffer->last_overrun = 0;

	rb_head_page_activate(cpu_buffer);
}
  
  /**
   * ring_buffer_reset_cpu - reset a ring buffer per CPU buffer
   * @buffer: The ring buffer to reset a per cpu buffer of
   * @cpu: The CPU buffer to be reset
   */
  void ring_buffer_reset_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer = buffer->buffers[cpu];
  	unsigned long flags;
	if (!cpumask_test_cpu(cpu, buffer->cpumask))
		return;

	atomic_inc(&cpu_buffer->record_disabled);

	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);

	if (RB_WARN_ON(cpu_buffer, local_read(&cpu_buffer->committing)))
		goto out;

	arch_spin_lock(&cpu_buffer->lock);

	rb_reset_cpu(cpu_buffer);

	arch_spin_unlock(&cpu_buffer->lock);

 out:
	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);

	atomic_dec(&cpu_buffer->record_disabled);
}
EXPORT_SYMBOL_GPL(ring_buffer_reset_cpu);
  
  /**
   * ring_buffer_reset - reset a ring buffer
   * @buffer: The ring buffer to reset all cpu buffers
   */
  void ring_buffer_reset(struct ring_buffer *buffer)
  {
	int cpu;

	for_each_buffer_cpu(buffer, cpu)
		ring_buffer_reset_cpu(buffer, cpu);
}
EXPORT_SYMBOL_GPL(ring_buffer_reset);
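
/*
 * A minimal sketch of how the two reset entry points above are meant to be
 * used: drop everything recorded so far either on one CPU or on all of them.
 * The rb_example_* name is only for illustration; both helpers disable
 * recording internally while the reset runs.
 */
static void __maybe_unused
rb_example_discard(struct ring_buffer *buffer, int cpu)
{
	/* throw away the contents of a single CPU buffer ... */
	ring_buffer_reset_cpu(buffer, cpu);

	/* ... or of every per-CPU buffer in the ring buffer */
	ring_buffer_reset(buffer);
}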
  
  /**
 * ring_buffer_empty - is the ring buffer empty?
   * @buffer: The ring buffer to test
   */
  int ring_buffer_empty(struct ring_buffer *buffer)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
	unsigned long flags;
	int dolock;
	int cpu;
	int ret;

	dolock = rb_ok_to_lock();

	/* yes this is racy, but if you don't like the race, lock the buffer */
	for_each_buffer_cpu(buffer, cpu) {
		cpu_buffer = buffer->buffers[cpu];
		local_irq_save(flags);
		if (dolock)
			raw_spin_lock(&cpu_buffer->reader_lock);
		ret = rb_per_cpu_empty(cpu_buffer);
		if (dolock)
			raw_spin_unlock(&cpu_buffer->reader_lock);
		local_irq_restore(flags);

		if (!ret)
			return 0;
	}

	return 1;
}
EXPORT_SYMBOL_GPL(ring_buffer_empty);
  
  /**
   * ring_buffer_empty_cpu - is a cpu buffer of a ring buffer empty?
   * @buffer: The ring buffer
   * @cpu: The CPU buffer to test
   */
  int ring_buffer_empty_cpu(struct ring_buffer *buffer, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer;
	unsigned long flags;
	int dolock;
	int ret;

	if (!cpumask_test_cpu(cpu, buffer->cpumask))
		return 1;

	dolock = rb_ok_to_lock();

	cpu_buffer = buffer->buffers[cpu];
	local_irq_save(flags);
	if (dolock)
		raw_spin_lock(&cpu_buffer->reader_lock);
	ret = rb_per_cpu_empty(cpu_buffer);
	if (dolock)
		raw_spin_unlock(&cpu_buffer->reader_lock);
	local_irq_restore(flags);

	return ret;
}
EXPORT_SYMBOL_GPL(ring_buffer_empty_cpu);
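
/*
 * A minimal sketch of using the emptiness checks above. As the comment in
 * ring_buffer_empty() notes, the result is inherently racy, so treat it as a
 * hint (e.g. whether a reader should poll again or go to sleep). The
 * rb_example_* name and the cpu < 0 convention are only for illustration.
 */
static int __maybe_unused
rb_example_has_data(struct ring_buffer *buffer, int cpu)
{
	if (cpu < 0)
		return !ring_buffer_empty(buffer);	/* data on any CPU? */

	return !ring_buffer_empty_cpu(buffer, cpu);	/* data on this CPU? */
}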
  #ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
  /**
   * ring_buffer_swap_cpu - swap a CPU buffer between two ring buffers
   * @buffer_a: One buffer to swap with
 * @buffer_b: The other buffer to swap with
 * @cpu: the CPU of the buffers to swap
 *
 * This function is useful for tracers that want to take a "snapshot"
 * of a CPU buffer and have another backup buffer lying around.
 * It is expected that the tracer handles the cpu buffer not being
 * used at the moment.
   */
  int ring_buffer_swap_cpu(struct ring_buffer *buffer_a,
  			 struct ring_buffer *buffer_b, int cpu)
  {
  	struct ring_buffer_per_cpu *cpu_buffer_a;
  	struct ring_buffer_per_cpu *cpu_buffer_b;
	int ret = -EINVAL;

	if (!cpumask_test_cpu(cpu, buffer_a->cpumask) ||
	    !cpumask_test_cpu(cpu, buffer_b->cpumask))
		goto out;

	/* At least make sure the two buffers are somewhat the same */
	if (buffer_a->pages != buffer_b->pages)
		goto out;

	ret = -EAGAIN;

	if (ring_buffer_flags != RB_BUFFERS_ON)
		goto out;

	if (atomic_read(&buffer_a->record_disabled))
		goto out;

	if (atomic_read(&buffer_b->record_disabled))
		goto out;

	cpu_buffer_a = buffer_a->buffers[cpu];
	cpu_buffer_b = buffer_b->buffers[cpu];

	if (atomic_read(&cpu_buffer_a->record_disabled))
		goto out;

	if (atomic_read(&cpu_buffer_b->record_disabled))
		goto out;

	/*
	 * We can't do a synchronize_sched here because this
	 * function can be called in atomic context.
	 * Normally this will be called from the same CPU as cpu.
	 * If not it's up to the caller to protect this.
	 */
	atomic_inc(&cpu_buffer_a->record_disabled);
	atomic_inc(&cpu_buffer_b->record_disabled);

	ret = -EBUSY;
	if (local_read(&cpu_buffer_a->committing))
		goto out_dec;
	if (local_read(&cpu_buffer_b->committing))
		goto out_dec;

	buffer_a->buffers[cpu] = cpu_buffer_b;
	buffer_b->buffers[cpu] = cpu_buffer_a;

	cpu_buffer_b->buffer = buffer_a;
	cpu_buffer_a->buffer = buffer_b;

	ret = 0;

out_dec:
	atomic_dec(&cpu_buffer_a->record_disabled);
	atomic_dec(&cpu_buffer_b->record_disabled);
out:
	return ret;
}
EXPORT_SYMBOL_GPL(ring_buffer_swap_cpu);
  #endif /* CONFIG_RING_BUFFER_ALLOW_SWAP */
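
#ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
/*
 * A minimal sketch of the "snapshot" use case described above: the live
 * buffer's per-CPU buffer is swapped with the one from a spare buffer of the
 * same size, so the recorded data can be read from the spare while tracing
 * continues into the page set that was swapped in. The rb_example_* name and
 * the "live"/"snap" parameters are only for illustration; the caller must
 * have allocated the spare buffer itself.
 */
static int __maybe_unused rb_example_snapshot(struct ring_buffer *live,
					      struct ring_buffer *snap, int cpu)
{
	int ret;

	ret = ring_buffer_swap_cpu(live, snap, cpu);
	if (ret)	/* -EINVAL, -EAGAIN or -EBUSY, see above */
		return ret;

	/* "snap" now holds what "live" had recorded on this CPU */
	return 0;
}
#endif
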
  /**
   * ring_buffer_alloc_read_page - allocate a page to read from buffer
 * @buffer: the buffer to allocate for.
 * @cpu: the cpu to allocate the page for
   *
   * This function is used in conjunction with ring_buffer_read_page.
   * When reading a full page from the ring buffer, these functions
   * can be used to speed up the process. The calling function should
   * allocate a few pages first with this function. Then when it
   * needs to get pages from the ring buffer, it passes the result
   * of this function into ring_buffer_read_page, which will swap
   * the page that was allocated, with the read page of the buffer.
   *
   * Returns:
   *  The page allocated, or NULL on error.
   */
void *ring_buffer_alloc_read_page(struct ring_buffer *buffer, int cpu)
{
	struct buffer_data_page *bpage;
	struct page *page;

	page = alloc_pages_node(cpu_to_node(cpu),
				GFP_KERNEL | __GFP_NORETRY, 0);
	if (!page)
		return NULL;

	bpage = page_address(page);

	rb_init_page(bpage);

	return bpage;
}
EXPORT_SYMBOL_GPL(ring_buffer_alloc_read_page);
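
/*
 * A minimal sketch of the "allocate a few pages first" advice in the comment
 * above: set aside one read page per possible CPU so the read path never has
 * to allocate. The rb_example_* name and the caller-provided pages[] array
 * (sized nr_cpu_ids) are only for illustration; error unwinding is omitted.
 */
static int __maybe_unused
rb_example_alloc_pages(struct ring_buffer *buffer, void **pages)
{
	int cpu;

	for_each_possible_cpu(cpu) {
		pages[cpu] = ring_buffer_alloc_read_page(buffer, cpu);
		if (!pages[cpu])
			return -ENOMEM;
	}

	return 0;
}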
  
  /**
   * ring_buffer_free_read_page - free an allocated read page
 * @buffer: the buffer the page was allocated for
   * @data: the page to free
   *
   * Free a page allocated from ring_buffer_alloc_read_page.
   */
  void ring_buffer_free_read_page(struct ring_buffer *buffer, void *data)
  {
  	free_page((unsigned long)data);
  }
  EXPORT_SYMBOL_GPL(ring_buffer_free_read_page);
  
  /**
   * ring_buffer_read_page - extract a page from the ring buffer
   * @buffer: buffer to extract from
   * @data_page: the page to use allocated from ring_buffer_alloc_read_page
 * @len: amount to extract
 * @cpu: the cpu of the buffer to extract
 * @full: should the extraction only happen when the page is full.
 *
 * This function will pull out a page from the ring buffer and consume it.
 * @data_page must be the address of the variable that was returned
 * from ring_buffer_alloc_read_page. This is because the page might be used
 * to swap with a page in the ring buffer.
 *
 * for example:
 *	rpage = ring_buffer_alloc_read_page(buffer, cpu);
 *	if (!rpage)
 *		return error;
 *	ret = ring_buffer_read_page(buffer, &rpage, len, cpu, 0);
 *	if (ret >= 0)
 *		process_page(rpage, ret);
 *
 * When @full is set, the function will not succeed unless
 * the writer is off the reader page.
 *
 * Note: it is up to the calling functions to handle sleeps and wakeups.
 *  The ring buffer can be used anywhere in the kernel and can not
 *  blindly call wake_up. The layer that uses the ring buffer must be
 *  responsible for that.
 *
 * Returns:
 *  >=0 if data has been transferred, returns the offset of consumed data.
 *  <0 if no data has been transferred.
 */
  int ring_buffer_read_page(struct ring_buffer *buffer,
			  void **data_page, size_t len, int cpu, int full)
{
	struct ring_buffer_per_cpu *cpu_buffer = buffer->buffers[cpu];
	struct ring_buffer_event *event;
	struct buffer_data_page *bpage;
	struct buffer_page *reader;
	unsigned long missed_events;
	unsigned long flags;
	unsigned int commit;
	unsigned int read;
	u64 save_timestamp;
	int ret = -1;

	if (!cpumask_test_cpu(cpu, buffer->cpumask))
		goto out;

	/*
	 * If len is not big enough to hold the page header, then
	 * we can not copy anything.
	 */
	if (len <= BUF_PAGE_HDR_SIZE)
		goto out;

	len -= BUF_PAGE_HDR_SIZE;

	if (!data_page)
		goto out;

	bpage = *data_page;
	if (!bpage)
		goto out;

	raw_spin_lock_irqsave(&cpu_buffer->reader_lock, flags);

	reader = rb_get_reader_page(cpu_buffer);
	if (!reader)
		goto out_unlock;

	event = rb_reader_event(cpu_buffer);

	read = reader->read;
	commit = rb_page_commit(reader);

	/* Check if any events were dropped */
	missed_events = cpu_buffer->lost_events;

	/*
	 * If this page has been partially read or
	 * if len is not big enough to read the rest of the page or
	 * a writer is still on the page, then
	 * we must copy the data from the page to the buffer.
	 * Otherwise, we can simply swap the page with the one passed in.
	 */
	if (read || (len < (commit - read)) ||
	    cpu_buffer->reader_page == cpu_buffer->commit_page) {
		struct buffer_data_page *rpage = cpu_buffer->reader_page->page;
		unsigned int rpos = read;
		unsigned int pos = 0;
		unsigned int size;

		if (full)
			goto out_unlock;

		if (len > (commit - read))
			len = (commit - read);

		/* Always keep the time extend and data together */
		size = rb_event_ts_length(event);

		if (len < size)
			goto out_unlock;

		/* save the current timestamp, since the user will need it */
		save_timestamp = cpu_buffer->read_stamp;

		/* Need to copy one event at a time */
		do {
			/* We need the size of one event, because
			 * rb_advance_reader only advances by one event,
			 * whereas rb_event_ts_length may include the size of
			 * one or two events.
			 * We have already ensured there's enough space if this
			 * is a time extend. */
			size = rb_event_length(event);
			memcpy(bpage->data + pos, rpage->data + rpos, size);

			len -= size;

			rb_advance_reader(cpu_buffer);
			rpos = reader->read;
			pos += size;

			if (rpos >= commit)
				break;

			event = rb_reader_event(cpu_buffer);
			/* Always keep the time extend and data together */
			size = rb_event_ts_length(event);
		} while (len >= size);

		/* update bpage */
		local_set(&bpage->commit, pos);
		bpage->time_stamp = save_timestamp;

		/* we copied everything to the beginning */
		read = 0;
	} else {
		/* update the entry counter */
		cpu_buffer->read += rb_page_entries(reader);
		cpu_buffer->read_bytes += BUF_PAGE_SIZE;

		/* swap the pages */
		rb_init_page(bpage);
		bpage = reader->page;
		reader->page = *data_page;
		local_set(&reader->write, 0);
		local_set(&reader->entries, 0);
		reader->read = 0;
		*data_page = bpage;

		/*
		 * Use the real_end for the data size,
		 * This gives us a chance to store the lost events
		 * on the page.
		 */
		if (reader->real_end)
			local_set(&bpage->commit, reader->real_end);
	}
	ret = read;

	cpu_buffer->lost_events = 0;

	commit = local_read(&bpage->commit);
	/*
	 * Set a flag in the commit field if we lost events
	 */
	if (missed_events) {
		/* If there is room at the end of the page to save the
		 * missed events, then record it there.
		 */
		if (BUF_PAGE_SIZE - commit >= sizeof(missed_events)) {
			memcpy(&bpage->data[commit], &missed_events,
			       sizeof(missed_events));
			local_add(RB_MISSED_STORED, &bpage->commit);
			commit += sizeof(missed_events);
		}
		local_add(RB_MISSED_EVENTS, &bpage->commit);
	}

	/*
	 * This page may be off to user land. Zero it out here.
	 */
	if (commit < BUF_PAGE_SIZE)
		memset(&bpage->data[commit], 0, BUF_PAGE_SIZE - commit);

 out_unlock:
	raw_spin_unlock_irqrestore(&cpu_buffer->reader_lock, flags);

 out:
	return ret;
}
EXPORT_SYMBOL_GPL(ring_buffer_read_page);
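
/*
 * A minimal sketch tying the three page-read helpers above together: drain
 * one CPU buffer a page at a time. PAGE_SIZE is used for @len to match the
 * page handed out by ring_buffer_alloc_read_page(); the rb_example_* name
 * and the process_page() callback are only for illustration.
 */
static void __maybe_unused
rb_example_drain_cpu(struct ring_buffer *buffer, int cpu,
		     void (*process_page)(void *data, int offset))
{
	void *rpage;
	int ret;

	rpage = ring_buffer_alloc_read_page(buffer, cpu);
	if (!rpage)
		return;

	/* ret is the offset of the consumed data, or < 0 once nothing is left */
	while ((ret = ring_buffer_read_page(buffer, &rpage,
					    PAGE_SIZE, cpu, 0)) >= 0)
		process_page(rpage, ret);

	ring_buffer_free_read_page(buffer, rpage);
}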

  #ifdef CONFIG_TRACING
  static ssize_t
  rb_simple_read(struct file *filp, char __user *ubuf,
  	       size_t cnt, loff_t *ppos)
  {
	unsigned long *p = filp->private_data;
	char buf[64];
	int r;

	if (test_bit(RB_BUFFERS_DISABLED_BIT, p))
		r = sprintf(buf, "permanently disabled\n");
	else
		r = sprintf(buf, "%d\n", test_bit(RB_BUFFERS_ON_BIT, p));

	return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
}
  
  static ssize_t
  rb_simple_write(struct file *filp, const char __user *ubuf,
  		size_t cnt, loff_t *ppos)
  {
	unsigned long *p = filp->private_data;
	unsigned long val;
	int ret;

	ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
	if (ret)
		return ret;

	if (val)
		set_bit(RB_BUFFERS_ON_BIT, p);
	else
		clear_bit(RB_BUFFERS_ON_BIT, p);

	(*ppos)++;

	return cnt;
}

static const struct file_operations rb_simple_fops = {
	.open		= tracing_open_generic,
	.read		= rb_simple_read,
	.write		= rb_simple_write,
	.llseek		= default_llseek,
};
  
  
  static __init int rb_init_debugfs(void)
  {
  	struct dentry *d_tracer;

	d_tracer = tracing_init_dentry();

	trace_create_file("tracing_on", 0644, d_tracer,
			    &ring_buffer_flags, &rb_simple_fops);

	return 0;
}

fs_initcall(rb_init_debugfs);
#endif

#ifdef CONFIG_HOTPLUG_CPU
  static int rb_cpu_notify(struct notifier_block *self,
  			 unsigned long action, void *hcpu)
{
	struct ring_buffer *buffer =
		container_of(self, struct ring_buffer, cpu_notify);
	long cpu = (long)hcpu;

	switch (action) {
	case CPU_UP_PREPARE:
	case CPU_UP_PREPARE_FROZEN:
		if (cpumask_test_cpu(cpu, buffer->cpumask))
			return NOTIFY_OK;

		buffer->buffers[cpu] =
			rb_allocate_cpu_buffer(buffer, cpu);
		if (!buffer->buffers[cpu]) {
			WARN(1, "failed to allocate ring buffer on CPU %ld\n",
			     cpu);
			return NOTIFY_OK;
		}
		smp_wmb();
		cpumask_set_cpu(cpu, buffer->cpumask);
		break;
	case CPU_DOWN_PREPARE:
	case CPU_DOWN_PREPARE_FROZEN:
		/*
		 * Do nothing.
		 *  If we were to free the buffer, then the user would
		 *  lose any trace that was in the buffer.
		 */
		break;
	default:
		break;
	}
	return NOTIFY_OK;
}
#endif