Blame view

kernel/taskstats.c 15.8 KB
c757249af   Shailabh Nagar   [PATCH] per-task-...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
  /*
   * taskstats.c - Export per-task statistics to userland
   *
   * Copyright (C) Shailabh Nagar, IBM Corp. 2006
   *           (C) Balbir Singh,   IBM Corp. 2006
   *
   * This program is free software; you can redistribute it and/or modify
   * it under the terms of the GNU General Public License as published by
   * the Free Software Foundation; either version 2 of the License, or
   * (at your option) any later version.
   *
   * This program is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   * GNU General Public License for more details.
   *
   */
  
  #include <linux/kernel.h>
  #include <linux/taskstats_kern.h>
f3cef7a99   Jay Lan   [PATCH] csa: basi...
21
  #include <linux/tsacct_kern.h>
6f44993fe   Shailabh Nagar   [PATCH] per-task-...
22
  #include <linux/delayacct.h>
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
23
24
  #include <linux/cpumask.h>
  #include <linux/percpu.h>
5a0e3ad6a   Tejun Heo   include cleanup: ...
25
  #include <linux/slab.h>
846c7bb05   Balbir Singh   Add cgroupstats
26
27
28
29
  #include <linux/cgroupstats.h>
  #include <linux/cgroup.h>
  #include <linux/fs.h>
  #include <linux/file.h>
c757249af   Shailabh Nagar   [PATCH] per-task-...
30
31
  #include <net/genetlink.h>
  #include <asm/atomic.h>
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
32
33
34
35
36
  /*
   * Maximum length of a cpumask that can be specified in
   * the TASKSTATS_CMD_ATTR_REGISTER/DEREGISTER_CPUMASK attribute
   */
  #define TASKSTATS_CPUMASK_MAXLEN	(100+6*NR_CPUS)
b81f3ea92   Vegard Nossum   taskstats: remove...
37
  static DEFINE_PER_CPU(__u32, taskstats_seqnum);
c757249af   Shailabh Nagar   [PATCH] per-task-...
38
  static int family_registered;
e18b890bb   Christoph Lameter   [PATCH] slab: rem...
39
  struct kmem_cache *taskstats_cache;
c757249af   Shailabh Nagar   [PATCH] per-task-...
40
41
42
43
44
45
46
  
  /*
   * Generic netlink family shared by every message built in this file:
   * it is passed to genlmsg_put()/genlmsg_put_reply() in prepare_reply()
   * and registered, together with its ops, in taskstats_init().
   */
  static struct genl_family family = {
  	.id		= GENL_ID_GENERATE,
  	.name		= TASKSTATS_GENL_NAME,
  	.version	= TASKSTATS_GENL_VERSION,
  	.maxattr	= TASKSTATS_CMD_ATTR_MAX,
  };
b54452b07   Alexey Dobriyan   const: struct nla...
47
  static const struct nla_policy taskstats_cmd_get_policy[TASKSTATS_CMD_ATTR_MAX+1] = {
c757249af   Shailabh Nagar   [PATCH] per-task-...
48
49
  	[TASKSTATS_CMD_ATTR_PID]  = { .type = NLA_U32 },
  	[TASKSTATS_CMD_ATTR_TGID] = { .type = NLA_U32 },
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
50
51
  	[TASKSTATS_CMD_ATTR_REGISTER_CPUMASK] = { .type = NLA_STRING },
  	[TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK] = { .type = NLA_STRING },};
b54452b07   Alexey Dobriyan   const: struct nla...
52
  static const struct nla_policy cgroupstats_cmd_get_policy[CGROUPSTATS_CMD_ATTR_MAX+1] = {
846c7bb05   Balbir Singh   Add cgroupstats
53
54
  	[CGROUPSTATS_CMD_ATTR_FD] = { .type = NLA_U32 },
  };
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
55
56
57
  /*
   * One registered receiver of exit data on a particular cpu's listener list.
   */
  struct listener {
  	struct list_head list;	/* link in listener_list.list */
  	pid_t pid;		/* destination passed to genlmsg_unicast() */
  	char valid;		/* cleared when a send returns -ECONNREFUSED */
  };
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
60
61
62
63
64
65
66
67
68
69
70
  /*
   * Per-cpu set of listeners (one instance per cpu in listener_array).
   * @sem is taken for reading while exit data is being sent and for
   * writing whenever entries are added to or removed from @list.
   */
  struct listener_list {
  	struct rw_semaphore sem;
  	struct list_head list;
  };
  static DEFINE_PER_CPU(struct listener_list, listener_array);
  
  /*
   * Operation selector passed as @isadd to add_del_listener().
   */
  enum actions {
  	REGISTER,	/* add the caller as a listener on each cpu in the mask */
  	DEREGISTER,	/* remove the caller's listener entries */
  	CPU_DONT_CARE	/* not referenced in the visible part of this file */
  };
c757249af   Shailabh Nagar   [PATCH] per-task-...
71
72
  
  static int prepare_reply(struct genl_info *info, u8 cmd, struct sk_buff **skbp,
371674853   Oleg Nesterov   [PATCH] taskstats...
73
  				size_t size)
c757249af   Shailabh Nagar   [PATCH] per-task-...
74
75
76
77
78
79
80
  {
  	struct sk_buff *skb;
  	void *reply;
  
  	/*
  	 * If new attributes are added, please revisit this allocation
  	 */
3dabc7157   Thomas Graf   [GENL]: Add genlm...
81
  	skb = genlmsg_new(size, GFP_KERNEL);
c757249af   Shailabh Nagar   [PATCH] per-task-...
82
83
84
85
  	if (!skb)
  		return -ENOMEM;
  
  	if (!info) {
cd85fc58c   Christoph Lameter   taskstats: Use th...
86
  		int seq = this_cpu_inc_return(taskstats_seqnum) - 1;
c757249af   Shailabh Nagar   [PATCH] per-task-...
87

17c157c88   Thomas Graf   [GENL]: Add genlm...
88
  		reply = genlmsg_put(skb, 0, seq, &family, 0, cmd);
c757249af   Shailabh Nagar   [PATCH] per-task-...
89
  	} else
17c157c88   Thomas Graf   [GENL]: Add genlm...
90
  		reply = genlmsg_put_reply(skb, info, &family, 0, cmd);
c757249af   Shailabh Nagar   [PATCH] per-task-...
91
92
93
94
95
96
  	if (reply == NULL) {
  		nlmsg_free(skb);
  		return -EINVAL;
  	}
  
  	*skbp = skb;
c757249af   Shailabh Nagar   [PATCH] per-task-...
97
98
  	return 0;
  }
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
99
100
101
  /*
   * Finalize the generic netlink message in @skb and send it as a reply to
   * the requester described by @info.
   *
   * If finalizing fails, @skb is freed here and the error is returned;
   * otherwise the result of genlmsg_reply() is returned.
   */
  static int send_reply(struct sk_buff *skb, struct genl_info *info)
  {
  	struct genlmsghdr *hdr = nlmsg_data(nlmsg_hdr(skb));
  	int err = genlmsg_end(skb, genlmsg_data(hdr));

  	if (err >= 0)
  		return genlmsg_reply(skb, info);

  	nlmsg_free(skb);
  	return err;
  }
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
114
115
116
  /*
   * Send taskstats data in @skb to listeners registered for @cpu's exit data
   */
115085ea0   Oleg Nesterov   [PATCH] taskstats...
117
118
  static void send_cpu_listeners(struct sk_buff *skb,
  					struct listener_list *listeners)
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
119
  {
b529ccf27   Arnaldo Carvalho de Melo   [NETLINK]: Introd...
120
  	struct genlmsghdr *genlhdr = nlmsg_data(nlmsg_hdr(skb));
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
121
122
123
  	struct listener *s, *tmp;
  	struct sk_buff *skb_next, *skb_cur = skb;
  	void *reply = genlmsg_data(genlhdr);
d94a04151   Shailabh Nagar   [PATCH] taskstats...
124
  	int rc, delcount = 0;
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
125
126
127
128
  
  	rc = genlmsg_end(skb, reply);
  	if (rc < 0) {
  		nlmsg_free(skb);
d94a04151   Shailabh Nagar   [PATCH] taskstats...
129
  		return;
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
130
131
132
  	}
  
  	rc = 0;
bb129994c   Shailabh Nagar   [PATCH] Remove do...
133
  	down_read(&listeners->sem);
d94a04151   Shailabh Nagar   [PATCH] taskstats...
134
  	list_for_each_entry(s, &listeners->list, list) {
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
135
136
137
  		skb_next = NULL;
  		if (!list_is_last(&s->list, &listeners->list)) {
  			skb_next = skb_clone(skb_cur, GFP_KERNEL);
d94a04151   Shailabh Nagar   [PATCH] taskstats...
138
  			if (!skb_next)
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
139
  				break;
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
140
  		}
134e63756   Johannes Berg   genetlink: make n...
141
  		rc = genlmsg_unicast(&init_net, skb_cur, s->pid);
d94a04151   Shailabh Nagar   [PATCH] taskstats...
142
  		if (rc == -ECONNREFUSED) {
bb129994c   Shailabh Nagar   [PATCH] Remove do...
143
144
  			s->valid = 0;
  			delcount++;
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
145
146
147
  		}
  		skb_cur = skb_next;
  	}
bb129994c   Shailabh Nagar   [PATCH] Remove do...
148
  	up_read(&listeners->sem);
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
149

d94a04151   Shailabh Nagar   [PATCH] taskstats...
150
151
  	if (skb_cur)
  		nlmsg_free(skb_cur);
bb129994c   Shailabh Nagar   [PATCH] Remove do...
152
  	if (!delcount)
d94a04151   Shailabh Nagar   [PATCH] taskstats...
153
  		return;
bb129994c   Shailabh Nagar   [PATCH] Remove do...
154
155
156
157
158
159
160
161
162
163
  
  	/* Delete invalidated entries */
  	down_write(&listeners->sem);
  	list_for_each_entry_safe(s, tmp, &listeners->list, list) {
  		if (!s->valid) {
  			list_del(&s->list);
  			kfree(s);
  		}
  	}
  	up_write(&listeners->sem);
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
164
  }
3d9e0cf1f   Michael Holzheu   taskstats: split ...
165
  static void fill_stats(struct task_struct *tsk, struct taskstats *stats)
c757249af   Shailabh Nagar   [PATCH] per-task-...
166
  {
51de4d908   Oleg Nesterov   [PATCH] taskstats...
167
  	memset(stats, 0, sizeof(*stats));
c757249af   Shailabh Nagar   [PATCH] per-task-...
168
169
170
171
  	/*
  	 * Each accounting subsystem adds calls to its functions to
  	 * fill in relevant parts of struct taskstsats as follows
  	 *
7d94dddd4   Shailabh Nagar   [PATCH] make task...
172
  	 *	per-task-foo(stats, tsk);
c757249af   Shailabh Nagar   [PATCH] per-task-...
173
  	 */
7d94dddd4   Shailabh Nagar   [PATCH] make task...
174
  	delayacct_add_tsk(stats, tsk);
f3cef7a99   Jay Lan   [PATCH] csa: basi...
175
176
  
  	/* fill in basic acct fields */
6f44993fe   Shailabh Nagar   [PATCH] per-task-...
177
  	stats->version = TASKSTATS_VERSION;
b663a79c1   Maxim Uvarov   taskstats: add co...
178
179
  	stats->nvcsw = tsk->nvcsw;
  	stats->nivcsw = tsk->nivcsw;
f3cef7a99   Jay Lan   [PATCH] csa: basi...
180
  	bacct_add_tsk(stats, tsk);
6f44993fe   Shailabh Nagar   [PATCH] per-task-...
181

9acc18535   Jay Lan   [PATCH] csa: Exte...
182
183
  	/* fill in extended acct fields */
  	xacct_add_tsk(stats, tsk);
3d9e0cf1f   Michael Holzheu   taskstats: split ...
184
  }
9acc18535   Jay Lan   [PATCH] csa: Exte...
185

3d9e0cf1f   Michael Holzheu   taskstats: split ...
186
187
188
  /*
   * Look up the task with pid @pid and fill @stats with its statistics.
   *
   * A reference on the task is taken under rcu_read_lock() and dropped once
   * the statistics have been gathered. Returns 0 on success or -ESRCH if no
   * such task is found.
   */
  static int fill_stats_for_pid(pid_t pid, struct taskstats *stats)
  {
  	struct task_struct *task;

  	rcu_read_lock();
  	task = find_task_by_vpid(pid);
  	if (task)
  		get_task_struct(task);
  	rcu_read_unlock();

  	if (task == NULL)
  		return -ESRCH;

  	fill_stats(task, stats);
  	put_task_struct(task);

  	return 0;
  }
3d9e0cf1f   Michael Holzheu   taskstats: split ...
201
  /*
   * Fill @stats with the accumulated statistics of the thread group that
   * the task found for @tgid belongs to.
   *
   * The totals already saved in signal->stats (if any) are used as the
   * starting point; the counters of every thread that has not exited are
   * then added on top. stats->version is set even when the lookup fails.
   *
   * Returns 0 on success, or -ESRCH if the task cannot be found or its
   * sighand cannot be locked.
   */
  static int fill_stats_for_tgid(pid_t tgid, struct taskstats *stats)
  {
  	struct task_struct *start, *t;
  	unsigned long flags;
  	int rc = -ESRCH;

  	rcu_read_lock();
  	start = find_task_by_vpid(tgid);
  	if (start && lock_task_sighand(start, &flags)) {
  		if (start->signal->stats)
  			memcpy(stats, start->signal->stats, sizeof(*stats));
  		else
  			memset(stats, 0, sizeof(*stats));

  		/*
  		 * Add additional stats from live tasks except zombie thread
  		 * group leaders who are already counted with the dead tasks
  		 */
  		t = start;
  		do {
  			if (!t->exit_state) {
  				/*
  				 * Accounting subsystem can call its functions
  				 * here to fill in relevant parts of struct
  				 * taskstats as follows
  				 *
  				 *	per-task-foo(stats, tsk);
  				 */
  				delayacct_add_tsk(stats, t);

  				stats->nvcsw += t->nvcsw;
  				stats->nivcsw += t->nivcsw;
  			}
  		} while_each_thread(start, t);

  		unlock_task_sighand(start, &flags);
  		rc = 0;
  	}
  	rcu_read_unlock();

  	/*
  	 * Accounting subsystems can also add calls here to modify
  	 * fields of taskstats.
  	 */
  	stats->version = TASKSTATS_VERSION;

  	return rc;
  }
ad4ecbcba   Shailabh Nagar   [PATCH] delay acc...
250
251
252
  /*
   * Fold the statistics of the exiting task @tsk into its thread group's
   * signal->stats, if that structure has been allocated. Done under the
   * sighand siglock with interrupts disabled.
   */
  static void fill_tgid_exit(struct task_struct *tsk)
  {
  	unsigned long flags;

  	spin_lock_irqsave(&tsk->sighand->siglock, flags);
  	/*
  	 * Each accounting subsystem calls its functions here to
  	 * accumulate its per-task stats for tsk, into the per-tgid structure
  	 *
  	 *	per-task-foo(tsk->signal->stats, tsk);
  	 */
  	if (tsk->signal->stats)
  		delayacct_add_tsk(tsk->signal->stats, tsk);
  	spin_unlock_irqrestore(&tsk->sighand->siglock, flags);
  }
41c7bb958   Rusty Russell   cpumask: convert ...
268
  /*
   * Register or deregister @pid as a listener for exit data on every cpu
   * set in @mask.
   *
   * @isadd is REGISTER to add a listener entry per cpu; any other value
   * removes the first entry matching @pid from each cpu's list.
   *
   * Registration skips a cpu on which @pid already has a valid entry, so
   * repeated requests cannot grow the per-cpu lists without bound. If an
   * allocation fails part-way through, the entries for @pid on all cpus
   * in @mask are removed again and -ENOMEM is returned.
   *
   * Returns 0 on success, -EINVAL if @mask contains an impossible cpu,
   * or -ENOMEM on allocation failure.
   */
  static int add_del_listener(pid_t pid, const struct cpumask *mask, int isadd)
  {
  	struct listener_list *listeners;
  	struct listener *s, *tmp, *s2;
  	unsigned int cpu;
  	int ret = 0;

  	if (!cpumask_subset(mask, cpu_possible_mask))
  		return -EINVAL;

  	if (isadd == REGISTER) {
  		for_each_cpu(cpu, mask) {
  			s = kmalloc_node(sizeof(struct listener), GFP_KERNEL,
  					 cpu_to_node(cpu));
  			if (!s) {
  				/* report the failure instead of returning 0 */
  				ret = -ENOMEM;
  				goto cleanup;
  			}
  			s->pid = pid;
  			INIT_LIST_HEAD(&s->list);
  			s->valid = 1;

  			listeners = &per_cpu(listener_array, cpu);
  			down_write(&listeners->sem);
  			list_for_each_entry(s2, &listeners->list, list) {
  				if (s2->pid == pid && s2->valid)
  					goto exists;
  			}
  			list_add(&s->list, &listeners->list);
  			s = NULL;	/* now owned by the list */
  exists:
  			up_write(&listeners->sem);
  			kfree(s);	/* no-op unless a duplicate was found */
  		}
  		return 0;
  	}

  	/* Deregister or cleanup */
  cleanup:
  	for_each_cpu(cpu, mask) {
  		listeners = &per_cpu(listener_array, cpu);
  		down_write(&listeners->sem);
  		list_for_each_entry_safe(s, tmp, &listeners->list, list) {
  			if (s->pid == pid) {
  				list_del(&s->list);
  				kfree(s);
  				break;
  			}
  		}
  		up_write(&listeners->sem);
  	}
  	return ret;
  }
41c7bb958   Rusty Russell   cpumask: convert ...
311
  static int parse(struct nlattr *na, struct cpumask *mask)
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
  {
  	char *data;
  	int len;
  	int ret;
  
  	if (na == NULL)
  		return 1;
  	len = nla_len(na);
  	if (len > TASKSTATS_CPUMASK_MAXLEN)
  		return -E2BIG;
  	if (len < 1)
  		return -EINVAL;
  	data = kmalloc(len, GFP_KERNEL);
  	if (!data)
  		return -ENOMEM;
  	nla_strlcpy(data, na, len);
29c0177e6   Rusty Russell   cpumask: change c...
328
  	ret = cpulist_parse(data, mask);
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
329
330
331
  	kfree(data);
  	return ret;
  }
9ab020cf0   Jeff Mahoney   taskstats: use be...
332
  #if defined(CONFIG_64BIT) && !defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS)
4be2c95d1   Jeff Mahoney   taskstats: pad ta...
333
334
  #define TASKSTATS_NEEDS_PADDING 1
  #endif
51de4d908   Oleg Nesterov   [PATCH] taskstats...
335
  /*
   * Append an aggregate attribute to @skb consisting of the id @pid (as an
   * attribute of type @type) followed by space reserved for a struct
   * taskstats.
   *
   * @type is TASKSTATS_TYPE_PID or TASKSTATS_TYPE_TGID and selects the
   * matching TASKSTATS_TYPE_AGGR_* container.
   *
   * Returns a pointer to the reserved struct taskstats inside the message,
   * or NULL if any attribute could not be added.
   */
  static struct taskstats *mk_reply(struct sk_buff *skb, int type, u32 pid)
  {
  	struct nlattr *nest, *stats_attr;
  	int aggr;

  	if (type == TASKSTATS_TYPE_PID)
  		aggr = TASKSTATS_TYPE_AGGR_PID;
  	else
  		aggr = TASKSTATS_TYPE_AGGR_TGID;

  	/*
  	 * The taskstats structure is internally aligned on 8 byte
  	 * boundaries but the layout of the aggregate reply, with
  	 * two NLA headers and the pid (each 4 bytes), actually
  	 * force the entire structure to be unaligned. This causes
  	 * the kernel to issue unaligned access warnings on some
  	 * architectures like ia64. Unfortunately, some software out there
  	 * doesn't properly unroll the NLA packet and assumes that the start
  	 * of the taskstats structure will always be 20 bytes from the start
  	 * of the netlink payload. Aligning the start of the taskstats
  	 * structure breaks this software, which we don't want. So, for now
  	 * the alignment only happens on architectures that require it
  	 * and those users will have to update to fixed versions of those
  	 * packages. Space is reserved in the packet only when needed.
  	 * This ifdef should be removed in several years e.g. 2012 once
  	 * we can be confident that fixed versions are installed on most
  	 * systems. We add the padding before the aggregate since the
  	 * aggregate is already a defined type.
  	 */
  #ifdef TASKSTATS_NEEDS_PADDING
  	if (nla_put(skb, TASKSTATS_TYPE_NULL, 0, NULL) < 0)
  		return NULL;
  #endif
  	nest = nla_nest_start(skb, aggr);
  	if (nest == NULL)
  		return NULL;

  	if (nla_put(skb, type, sizeof(pid), &pid) < 0)
  		return NULL;

  	stats_attr = nla_reserve(skb, TASKSTATS_TYPE_STATS,
  				 sizeof(struct taskstats));
  	if (stats_attr == NULL)
  		return NULL;

  	nla_nest_end(skb, nest);
  	return nla_data(stats_attr);
  }
846c7bb05   Balbir Singh   Add cgroupstats
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
  static int cgroupstats_user_cmd(struct sk_buff *skb, struct genl_info *info)
  {
  	int rc = 0;
  	struct sk_buff *rep_skb;
  	struct cgroupstats *stats;
  	struct nlattr *na;
  	size_t size;
  	u32 fd;
  	struct file *file;
  	int fput_needed;
  
  	na = info->attrs[CGROUPSTATS_CMD_ATTR_FD];
  	if (!na)
  		return -EINVAL;
  
  	fd = nla_get_u32(info->attrs[CGROUPSTATS_CMD_ATTR_FD]);
  	file = fget_light(fd, &fput_needed);
f96159840   Adrian Bunk   kernel/taskstats....
397
398
  	if (!file)
  		return 0;
846c7bb05   Balbir Singh   Add cgroupstats
399

f96159840   Adrian Bunk   kernel/taskstats....
400
  	size = nla_total_size(sizeof(struct cgroupstats));
846c7bb05   Balbir Singh   Add cgroupstats
401

f96159840   Adrian Bunk   kernel/taskstats....
402
403
404
405
  	rc = prepare_reply(info, CGROUPSTATS_CMD_NEW, &rep_skb,
  				size);
  	if (rc < 0)
  		goto err;
846c7bb05   Balbir Singh   Add cgroupstats
406

f96159840   Adrian Bunk   kernel/taskstats....
407
408
409
410
  	na = nla_reserve(rep_skb, CGROUPSTATS_TYPE_CGROUP_STATS,
  				sizeof(struct cgroupstats));
  	stats = nla_data(na);
  	memset(stats, 0, sizeof(*stats));
846c7bb05   Balbir Singh   Add cgroupstats
411

f96159840   Adrian Bunk   kernel/taskstats....
412
413
414
415
  	rc = cgroupstats_build(stats, file->f_dentry);
  	if (rc < 0) {
  		nlmsg_free(rep_skb);
  		goto err;
846c7bb05   Balbir Singh   Add cgroupstats
416
  	}
134e63756   Johannes Berg   genetlink: make n...
417
  	rc = send_reply(rep_skb, info);
f96159840   Adrian Bunk   kernel/taskstats....
418

846c7bb05   Balbir Singh   Add cgroupstats
419
  err:
f96159840   Adrian Bunk   kernel/taskstats....
420
  	fput_light(file, fput_needed);
846c7bb05   Balbir Singh   Add cgroupstats
421
422
  	return rc;
  }
932331259   Michael Holzheu   taskstats: separa...
423
  static int cmd_attr_register_cpumask(struct genl_info *info)
c757249af   Shailabh Nagar   [PATCH] per-task-...
424
  {
41c7bb958   Rusty Russell   cpumask: convert ...
425
  	cpumask_var_t mask;
932331259   Michael Holzheu   taskstats: separa...
426
  	int rc;
41c7bb958   Rusty Russell   cpumask: convert ...
427
428
429
  
  	if (!alloc_cpumask_var(&mask, GFP_KERNEL))
  		return -ENOMEM;
41c7bb958   Rusty Russell   cpumask: convert ...
430
  	rc = parse(info->attrs[TASKSTATS_CMD_ATTR_REGISTER_CPUMASK], mask);
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
431
  	if (rc < 0)
932331259   Michael Holzheu   taskstats: separa...
432
433
434
435
436
437
438
439
440
441
442
  		goto out;
  	rc = add_del_listener(info->snd_pid, mask, REGISTER);
  out:
  	free_cpumask_var(mask);
  	return rc;
  }
  
  static int cmd_attr_deregister_cpumask(struct genl_info *info)
  {
  	cpumask_var_t mask;
  	int rc;
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
443

932331259   Michael Holzheu   taskstats: separa...
444
445
  	if (!alloc_cpumask_var(&mask, GFP_KERNEL))
  		return -ENOMEM;
41c7bb958   Rusty Russell   cpumask: convert ...
446
  	rc = parse(info->attrs[TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK], mask);
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
447
  	if (rc < 0)
932331259   Michael Holzheu   taskstats: separa...
448
449
450
  		goto out;
  	rc = add_del_listener(info->snd_pid, mask, DEREGISTER);
  out:
41c7bb958   Rusty Russell   cpumask: convert ...
451
  	free_cpumask_var(mask);
932331259   Michael Holzheu   taskstats: separa...
452
453
  	return rc;
  }
4be2c95d1   Jeff Mahoney   taskstats: pad ta...
454
455
456
457
458
459
460
461
462
463
464
  /*
   * Payload size needed for one aggregate built by mk_reply(): a u32 id
   * attribute, a struct taskstats attribute and one zero-length attribute
   * (presumably the nest header), plus a second zero-length attribute when
   * TASKSTATS_NEEDS_PADDING is defined.
   */
  static size_t taskstats_packet_size(void)
  {
  	size_t total = nla_total_size(0);

  	total += nla_total_size(sizeof(u32));
  	total += nla_total_size(sizeof(struct taskstats));
  #ifdef TASKSTATS_NEEDS_PADDING
  	total += nla_total_size(0); /* Padding for alignment */
  #endif
  	return total;
  }
932331259   Michael Holzheu   taskstats: separa...
465
466
467
468
469
470
471
  static int cmd_attr_pid(struct genl_info *info)
  {
  	struct taskstats *stats;
  	struct sk_buff *rep_skb;
  	size_t size;
  	u32 pid;
  	int rc;
c757249af   Shailabh Nagar   [PATCH] per-task-...
472

4be2c95d1   Jeff Mahoney   taskstats: pad ta...
473
  	size = taskstats_packet_size();
c757249af   Shailabh Nagar   [PATCH] per-task-...
474

371674853   Oleg Nesterov   [PATCH] taskstats...
475
  	rc = prepare_reply(info, TASKSTATS_CMD_NEW, &rep_skb, size);
c757249af   Shailabh Nagar   [PATCH] per-task-...
476
477
  	if (rc < 0)
  		return rc;
51de4d908   Oleg Nesterov   [PATCH] taskstats...
478
  	rc = -EINVAL;
932331259   Michael Holzheu   taskstats: separa...
479
480
481
  	pid = nla_get_u32(info->attrs[TASKSTATS_CMD_ATTR_PID]);
  	stats = mk_reply(rep_skb, TASKSTATS_TYPE_PID, pid);
  	if (!stats)
c757249af   Shailabh Nagar   [PATCH] per-task-...
482
  		goto err;
c757249af   Shailabh Nagar   [PATCH] per-task-...
483

3d9e0cf1f   Michael Holzheu   taskstats: split ...
484
  	rc = fill_stats_for_pid(pid, stats);
932331259   Michael Holzheu   taskstats: separa...
485
486
  	if (rc < 0)
  		goto err;
134e63756   Johannes Berg   genetlink: make n...
487
  	return send_reply(rep_skb, info);
c757249af   Shailabh Nagar   [PATCH] per-task-...
488
489
490
491
  err:
  	nlmsg_free(rep_skb);
  	return rc;
  }
932331259   Michael Holzheu   taskstats: separa...
492
493
494
495
496
497
498
  static int cmd_attr_tgid(struct genl_info *info)
  {
  	struct taskstats *stats;
  	struct sk_buff *rep_skb;
  	size_t size;
  	u32 tgid;
  	int rc;
4be2c95d1   Jeff Mahoney   taskstats: pad ta...
499
  	size = taskstats_packet_size();
932331259   Michael Holzheu   taskstats: separa...
500
501
502
503
504
505
506
507
508
509
  
  	rc = prepare_reply(info, TASKSTATS_CMD_NEW, &rep_skb, size);
  	if (rc < 0)
  		return rc;
  
  	rc = -EINVAL;
  	tgid = nla_get_u32(info->attrs[TASKSTATS_CMD_ATTR_TGID]);
  	stats = mk_reply(rep_skb, TASKSTATS_TYPE_TGID, tgid);
  	if (!stats)
  		goto err;
3d9e0cf1f   Michael Holzheu   taskstats: split ...
510
  	rc = fill_stats_for_tgid(tgid, stats);
932331259   Michael Holzheu   taskstats: separa...
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
  	if (rc < 0)
  		goto err;
  	return send_reply(rep_skb, info);
  err:
  	nlmsg_free(rep_skb);
  	return rc;
  }
  
  /*
   * Handler for TASKSTATS_CMD_GET: dispatch on the first attribute present,
   * checked in the order register-cpumask, deregister-cpumask, pid, tgid.
   * Returns -EINVAL if none of them is present.
   */
  static int taskstats_user_cmd(struct sk_buff *skb, struct genl_info *info)
  {
  	struct nlattr **attrs = info->attrs;

  	if (attrs[TASKSTATS_CMD_ATTR_REGISTER_CPUMASK])
  		return cmd_attr_register_cpumask(info);

  	if (attrs[TASKSTATS_CMD_ATTR_DEREGISTER_CPUMASK])
  		return cmd_attr_deregister_cpumask(info);

  	if (attrs[TASKSTATS_CMD_ATTR_PID])
  		return cmd_attr_pid(info);

  	if (attrs[TASKSTATS_CMD_ATTR_TGID])
  		return cmd_attr_tgid(info);

  	return -EINVAL;
  }
34ec12349   Oleg Nesterov   [PATCH] taskstats...
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
  /*
   * Make sure the thread group of @tsk has a signal->stats structure,
   * unless @tsk is the only thread in its group.
   *
   * The allocation is done outside the siglock and installed under it; if
   * signal->stats was set in the meantime the fresh allocation is freed.
   * Returns the group's signal->stats, which may be NULL.
   */
  static struct taskstats *taskstats_tgid_alloc(struct task_struct *tsk)
  {
  	struct signal_struct *sig = tsk->signal;
  	struct taskstats *fresh;

  	if (sig->stats || thread_group_empty(tsk))
  		return sig->stats;

  	/* No problem if kmem_cache_zalloc() fails */
  	fresh = kmem_cache_zalloc(taskstats_cache, GFP_KERNEL);

  	spin_lock_irq(&tsk->sighand->siglock);
  	if (!sig->stats) {
  		sig->stats = fresh;
  		fresh = NULL;
  	}
  	spin_unlock_irq(&tsk->sighand->siglock);

  	/* still set only if sig->stats was already populated */
  	if (fresh)
  		kmem_cache_free(taskstats_cache, fresh);

  	return sig->stats;
  }
c757249af   Shailabh Nagar   [PATCH] per-task-...
555
  /* Send pid data out on exit */
115085ea0   Oleg Nesterov   [PATCH] taskstats...
556
  void taskstats_exit(struct task_struct *tsk, int group_dead)
c757249af   Shailabh Nagar   [PATCH] per-task-...
557
558
  {
  	int rc;
115085ea0   Oleg Nesterov   [PATCH] taskstats...
559
  	struct listener_list *listeners;
51de4d908   Oleg Nesterov   [PATCH] taskstats...
560
  	struct taskstats *stats;
c757249af   Shailabh Nagar   [PATCH] per-task-...
561
  	struct sk_buff *rep_skb;
c757249af   Shailabh Nagar   [PATCH] per-task-...
562
563
  	size_t size;
  	int is_thread_group;
c757249af   Shailabh Nagar   [PATCH] per-task-...
564

4a279ff1e   Oleg Nesterov   [PATCH] taskstats...
565
  	if (!family_registered)
c757249af   Shailabh Nagar   [PATCH] per-task-...
566
  		return;
c757249af   Shailabh Nagar   [PATCH] per-task-...
567
568
569
  	/*
  	 * Size includes space for nested attributes
  	 */
4be2c95d1   Jeff Mahoney   taskstats: pad ta...
570
  	size = taskstats_packet_size();
c757249af   Shailabh Nagar   [PATCH] per-task-...
571

34ec12349   Oleg Nesterov   [PATCH] taskstats...
572
  	is_thread_group = !!taskstats_tgid_alloc(tsk);
4a279ff1e   Oleg Nesterov   [PATCH] taskstats...
573
574
575
576
577
578
  	if (is_thread_group) {
  		/* PID + STATS + TGID + STATS */
  		size = 2 * size;
  		/* fill the tsk->signal->stats structure */
  		fill_tgid_exit(tsk);
  	}
cd85fc58c   Christoph Lameter   taskstats: Use th...
579
  	listeners = __this_cpu_ptr(&listener_array);
115085ea0   Oleg Nesterov   [PATCH] taskstats...
580
581
  	if (list_empty(&listeners->list))
  		return;
371674853   Oleg Nesterov   [PATCH] taskstats...
582
  	rc = prepare_reply(NULL, TASKSTATS_CMD_NEW, &rep_skb, size);
c757249af   Shailabh Nagar   [PATCH] per-task-...
583
  	if (rc < 0)
51de4d908   Oleg Nesterov   [PATCH] taskstats...
584
  		return;
c757249af   Shailabh Nagar   [PATCH] per-task-...
585

51de4d908   Oleg Nesterov   [PATCH] taskstats...
586
587
  	stats = mk_reply(rep_skb, TASKSTATS_TYPE_PID, tsk->pid);
  	if (!stats)
371674853   Oleg Nesterov   [PATCH] taskstats...
588
  		goto err;
c757249af   Shailabh Nagar   [PATCH] per-task-...
589

3d9e0cf1f   Michael Holzheu   taskstats: split ...
590
  	fill_stats(tsk, stats);
c757249af   Shailabh Nagar   [PATCH] per-task-...
591

c757249af   Shailabh Nagar   [PATCH] per-task-...
592
  	/*
ad4ecbcba   Shailabh Nagar   [PATCH] delay acc...
593
  	 * Doesn't matter if tsk is the leader or the last group member leaving
c757249af   Shailabh Nagar   [PATCH] per-task-...
594
  	 */
68062b86f   Oleg Nesterov   [PATCH] taskstats...
595
  	if (!is_thread_group || !group_dead)
ad4ecbcba   Shailabh Nagar   [PATCH] delay acc...
596
  		goto send;
c757249af   Shailabh Nagar   [PATCH] per-task-...
597

51de4d908   Oleg Nesterov   [PATCH] taskstats...
598
599
  	stats = mk_reply(rep_skb, TASKSTATS_TYPE_TGID, tsk->tgid);
  	if (!stats)
371674853   Oleg Nesterov   [PATCH] taskstats...
600
  		goto err;
51de4d908   Oleg Nesterov   [PATCH] taskstats...
601
602
  
  	memcpy(stats, tsk->signal->stats, sizeof(*stats));
c757249af   Shailabh Nagar   [PATCH] per-task-...
603

ad4ecbcba   Shailabh Nagar   [PATCH] delay acc...
604
  send:
115085ea0   Oleg Nesterov   [PATCH] taskstats...
605
  	send_cpu_listeners(rep_skb, listeners);
ad4ecbcba   Shailabh Nagar   [PATCH] delay acc...
606
  	return;
371674853   Oleg Nesterov   [PATCH] taskstats...
607
  err:
c757249af   Shailabh Nagar   [PATCH] per-task-...
608
  	nlmsg_free(rep_skb);
c757249af   Shailabh Nagar   [PATCH] per-task-...
609
610
611
612
  }
  
  static struct genl_ops taskstats_ops = {
  	.cmd		= TASKSTATS_CMD_GET,
f9fd8914c   Shailabh Nagar   [PATCH] per-task ...
613
  	.doit		= taskstats_user_cmd,
c757249af   Shailabh Nagar   [PATCH] per-task-...
614
615
  	.policy		= taskstats_cmd_get_policy,
  };
846c7bb05   Balbir Singh   Add cgroupstats
616
617
618
619
620
  /*
   * Generic netlink operation for CGROUPSTATS_CMD_GET requests; registered
   * on the family in taskstats_init().
   */
  static struct genl_ops cgroupstats_ops = {
  	.cmd		= CGROUPSTATS_CMD_GET,
  	.doit		= cgroupstats_user_cmd,
  	.policy		= cgroupstats_cmd_get_policy,
  };
c757249af   Shailabh Nagar   [PATCH] per-task-...
621
622
623
  /*
   * Needed early in initialization: creates the taskstats slab cache and
   * initializes the listener list and its semaphore for every possible cpu.
   */
  void __init taskstats_init_early(void)
  {
  	unsigned int cpu;

  	taskstats_cache = KMEM_CACHE(taskstats, SLAB_PANIC);

  	for_each_possible_cpu(cpu) {
  		struct listener_list *ll = &per_cpu(listener_array, cpu);

  		INIT_LIST_HEAD(&ll->list);
  		init_rwsem(&ll->sem);
  	}
  }
  
  /*
   * Register the taskstats generic netlink family and its two operations.
   *
   * family_registered is set only after everything has been registered;
   * taskstats_exit() checks it before doing any work. On failure whatever
   * was registered so far is unregistered again and the error is returned.
   */
  static int __init taskstats_init(void)
  {
  	int rc;

  	rc = genl_register_family(&family);
  	if (rc)
  		return rc;

  	rc = genl_register_ops(&family, &taskstats_ops);
  	if (rc < 0)
  		goto err;

  	rc = genl_register_ops(&family, &cgroupstats_ops);
  	if (rc < 0)
  		goto err_cgroup_ops;

  	family_registered = 1;
  	printk("registered taskstats version %d\n", TASKSTATS_GENL_VERSION);
  	return 0;
  err_cgroup_ops:
  	genl_unregister_ops(&family, &taskstats_ops);
  err:
  	genl_unregister_family(&family);
  	return rc;
  }
  
  /*
   * late initcall ensures initialization of statistics collection
   * mechanisms precedes initialization of the taskstats interface
   */
  late_initcall(taskstats_init);