Blame view

net/sched/cls_cgroup.c 7.21 KB
f40092373   Thomas Graf   pkt_sched: Contro...
1
2
3
4
5
6
7
8
9
10
11
12
  /*
   * net/sched/cls_cgroup.c	Control Group Classifier
   *
   *		This program is free software; you can redistribute it and/or
   *		modify it under the terms of the GNU General Public License
   *		as published by the Free Software Foundation; either version
   *		2 of the License, or (at your option) any later version.
   *
   * Authors:	Thomas Graf <tgraf@suug.ch>
   */
  
  #include <linux/module.h>
5a0e3ad6a   Tejun Heo   include cleanup: ...
13
  #include <linux/slab.h>
f40092373   Thomas Graf   pkt_sched: Contro...
14
15
16
17
18
  #include <linux/types.h>
  #include <linux/string.h>
  #include <linux/errno.h>
  #include <linux/skbuff.h>
  #include <linux/cgroup.h>
f84517253   Herbert Xu   cls_cgroup: Store...
19
  #include <linux/rcupdate.h>
f40092373   Thomas Graf   pkt_sched: Contro...
20
21
  #include <net/rtnetlink.h>
  #include <net/pkt_cls.h>
f84517253   Herbert Xu   cls_cgroup: Store...
22
23
  #include <net/sock.h>
  #include <net/cls_cgroup.h>
f40092373   Thomas Graf   pkt_sched: Contro...
24

8e039d84b   Ben Blum   cgroups: net_cls ...
25
26
27
28
29
30
31
32
33
34
35
36
  /*
   * Forward declarations of the cgroup subsystem callbacks. They are
   * referenced by the net_cls_subsys initializer before their definitions
   * appear further down in this file.
   */
  static struct cgroup_subsys_state *cgrp_create(struct cgroup_subsys *ss,
  					       struct cgroup *cgrp);
  static void cgrp_destroy(struct cgroup_subsys *ss, struct cgroup *cgrp);
  static int cgrp_populate(struct cgroup_subsys *ss, struct cgroup *cgrp);
  
  /*
   * Descriptor of the "net_cls" cgroup subsystem.
   *
   * The create/destroy/populate hooks are the cgrp_* functions of this file.
   * subsys_id is only initialized here when CONFIG_NET_CLS_CGROUP is defined;
   * otherwise init_cgroup_cls() copies the id found in this structure after
   * cgroup_load_subsys() into net_cls_subsys_id.
   */
  struct cgroup_subsys net_cls_subsys = {
  	.name		= "net_cls",
  	.module		= THIS_MODULE,
  	.create		= cgrp_create,
  	.destroy	= cgrp_destroy,
  	.populate	= cgrp_populate,
  #ifdef CONFIG_NET_CLS_CGROUP
  	.subsys_id	= net_cls_subsys_id,
  #endif
  };
8e8ba8541   Li Zefan   cls_cgroup: clean...
40
  static inline struct cgroup_cls_state *cgrp_cls_state(struct cgroup *cgrp)
f40092373   Thomas Graf   pkt_sched: Contro...
41
  {
8e8ba8541   Li Zefan   cls_cgroup: clean...
42
43
44
45
46
47
48
49
  	return container_of(cgroup_subsys_state(cgrp, net_cls_subsys_id),
  			    struct cgroup_cls_state, css);
  }
  
  /*
   * Map a task to the net_cls state of the cgroup it belongs to.
   *
   * Looks up the task's css for net_cls_subsys_id and returns the enclosing
   * struct cgroup_cls_state. The caller in this file wraps the call in
   * rcu_read_lock()/rcu_read_unlock().
   */
  static inline struct cgroup_cls_state *task_cls_state(struct task_struct *p)
  {
  	struct cgroup_subsys_state *css;
  
  	css = task_subsys_state(p, net_cls_subsys_id);
  	return container_of(css, struct cgroup_cls_state, css);
  }
  
  static struct cgroup_subsys_state *cgrp_create(struct cgroup_subsys *ss,
  						 struct cgroup *cgrp)
  {
  	struct cgroup_cls_state *cs;
cc7ec456f   Eric Dumazet   net_sched: cleanups
56
57
  	cs = kzalloc(sizeof(*cs), GFP_KERNEL);
  	if (!cs)
f40092373   Thomas Graf   pkt_sched: Contro...
58
59
60
  		return ERR_PTR(-ENOMEM);
  
  	if (cgrp->parent)
8e8ba8541   Li Zefan   cls_cgroup: clean...
61
  		cs->classid = cgrp_cls_state(cgrp->parent)->classid;
f40092373   Thomas Graf   pkt_sched: Contro...
62
63
64
65
66
67
  
  	return &cs->css;
  }
  
  /*
   * .destroy hook: free the net_cls state that cgrp_create() allocated for
   * this cgroup.
   */
  static void cgrp_destroy(struct cgroup_subsys *ss, struct cgroup *cgrp)
  {
  	struct cgroup_cls_state *state = cgrp_cls_state(cgrp);
  
  	kfree(state);
  }
  
  static u64 read_classid(struct cgroup *cgrp, struct cftype *cft)
  {
8e8ba8541   Li Zefan   cls_cgroup: clean...
73
  	return cgrp_cls_state(cgrp)->classid;
f40092373   Thomas Graf   pkt_sched: Contro...
74
75
76
77
  }
  
  /*
   * write_u64 handler of the "classid" control file: store a new classid
   * for the cgroup.
   *
   * The 64-bit value is cast to u32 before being stored, so any upper bits
   * are discarded. Always returns 0.
   */
  static int write_classid(struct cgroup *cgrp, struct cftype *cft, u64 value)
  {
  	struct cgroup_cls_state *state = cgrp_cls_state(cgrp);
  
  	state->classid = (u32) value;
  
  	return 0;
  }
  
  /*
   * Control files added to each cgroup by cgrp_populate(): a single
   * "classid" entry backed by read_classid()/write_classid().
   */
  static struct cftype ss_files[] = {
  	{
  		.name = "classid",
  		.read_u64 = read_classid,
  		.write_u64 = write_classid,
  	},
  };
  
  /*
   * .populate hook: add every entry of ss_files to the cgroup and return
   * the result of cgroup_add_files().
   */
  static int cgrp_populate(struct cgroup_subsys *ss, struct cgroup *cgrp)
  {
  	int ret;
  
  	ret = cgroup_add_files(cgrp, ss, ss_files, ARRAY_SIZE(ss_files));
  
  	return ret;
  }
cc7ec456f   Eric Dumazet   net_sched: cleanups
94
  struct cls_cgroup_head {
f40092373   Thomas Graf   pkt_sched: Contro...
95
96
97
98
  	u32			handle;
  	struct tcf_exts		exts;
  	struct tcf_ematch_tree	ematches;
  };
dc7f9f6e8   Eric Dumazet   net: sched: const...
99
  static int cls_cgroup_classify(struct sk_buff *skb, const struct tcf_proto *tp,
f40092373   Thomas Graf   pkt_sched: Contro...
100
101
102
  			       struct tcf_result *res)
  {
  	struct cls_cgroup_head *head = tp->root;
e65fcfd63   Paul Menage   cls_cgroup: read ...
103
  	u32 classid;
f40092373   Thomas Graf   pkt_sched: Contro...
104

f84517253   Herbert Xu   cls_cgroup: Store...
105
106
107
  	rcu_read_lock();
  	classid = task_cls_state(current)->classid;
  	rcu_read_unlock();
f40092373   Thomas Graf   pkt_sched: Contro...
108
109
110
111
112
113
114
115
116
117
  	/*
  	 * Due to the nature of the classifier it is required to ignore all
  	 * packets originating from softirq context as accessing `current'
  	 * would lead to false results.
  	 *
  	 * This test assumes that all callers of dev_queue_xmit() explicitely
  	 * disable bh. Knowing this, it is possible to detect softirq based
  	 * calls by looking at the number of nested bh disable calls because
  	 * softirqs always disables bh.
  	 */
75e1056f5   Venkatesh Pallipadi   sched: Fix softir...
118
  	if (in_serving_softirq()) {
f84517253   Herbert Xu   cls_cgroup: Store...
119
120
121
122
123
  		/* If there is an sk_classid we'll use that. */
  		if (!skb->sk)
  			return -1;
  		classid = skb->sk->sk_classid;
  	}
f40092373   Thomas Graf   pkt_sched: Contro...
124

e65fcfd63   Paul Menage   cls_cgroup: read ...
125
126
127
128
129
130
131
132
133
  	if (!classid)
  		return -1;
  
  	if (!tcf_em_tree_match(skb, &head->ematches, NULL))
  		return -1;
  
  	res->classid = classid;
  	res->class = 0;
  	return tcf_exts_exec(skb, &head->exts, res);
f40092373   Thomas Graf   pkt_sched: Contro...
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
  }
  
  /*
   * .get operation: no lookup by handle is performed; always returns 0UL.
   */
  static unsigned long cls_cgroup_get(struct tcf_proto *tp, u32 handle)
  {
  	return 0UL;
  }
  
  /*
   * .put operation: intentionally empty, as cls_cgroup_get() never hands
   * out anything that would need releasing.
   */
  static void cls_cgroup_put(struct tcf_proto *tp, unsigned long f)
  {
  }
  
  /*
   * .init operation: nothing to set up here; the head is allocated lazily
   * by cls_cgroup_change(). Always returns 0.
   */
  static int cls_cgroup_init(struct tcf_proto *tp)
  {
  	return 0;
  }
  
  /*
   * Attribute types used for the action and police extensions of this
   * classifier; passed to tcf_exts_validate(), tcf_exts_dump() and
   * tcf_exts_dump_stats().
   */
  static const struct tcf_ext_map cgroup_ext_map = {
  	.action = TCA_CGROUP_ACT,
  	.police = TCA_CGROUP_POLICE,
  };
  
  /*
   * Netlink policy applied by cls_cgroup_change() when parsing the nested
   * TCA_OPTIONS attribute: TCA_CGROUP_EMATCHES must itself be nested.
   */
  static const struct nla_policy cgroup_policy[TCA_CGROUP_MAX + 1] = {
  	[TCA_CGROUP_EMATCHES]	= { .type = NLA_NESTED },
  };
  
  /*
   * .change operation: create the classifier head on first use and replace
   * its extensions and ematch tree with the ones supplied via netlink.
   *
   * Returns 0 on success, or:
   *   -EINVAL   if TCA_OPTIONS is missing, or no handle was given when the
   *             head has to be created,
   *   -ENOBUFS  if the head cannot be allocated,
   *   -ENOENT   if @handle does not match the existing head,
   *   or the error returned by attribute parsing / validation.
   *
   * Note that a freshly allocated head is published in tp->root before the
   * attributes are validated; if validation fails it stays there and is
   * released later by cls_cgroup_destroy().
   */
  static int cls_cgroup_change(struct tcf_proto *tp, unsigned long base,
  			     u32 handle, struct nlattr **tca,
  			     unsigned long *arg)
  {
  	struct nlattr *tb[TCA_CGROUP_MAX + 1];
  	struct cls_cgroup_head *head = tp->root;
  	struct tcf_ematch_tree t;
  	struct tcf_exts e;
  	int err;
  
  	if (!tca[TCA_OPTIONS])
  		return -EINVAL;
  
  	if (head == NULL) {
  		if (!handle)
  			return -EINVAL;
  
  		head = kzalloc(sizeof(*head), GFP_KERNEL);
  		if (head == NULL)
  			return -ENOBUFS;
  
  		head->handle = handle;
  
  		tcf_tree_lock(tp);
  		tp->root = head;
  		tcf_tree_unlock(tp);
  	}
  
  	if (handle != head->handle)
  		return -ENOENT;
  
  	err = nla_parse_nested(tb, TCA_CGROUP_MAX, tca[TCA_OPTIONS],
  			       cgroup_policy);
  	if (err < 0)
  		return err;
  
  	err = tcf_exts_validate(tp, tb, tca[TCA_RATE], &e, &cgroup_ext_map);
  	if (err < 0)
  		return err;
  
  	err = tcf_em_tree_validate(tp, tb[TCA_CGROUP_EMATCHES], &t);
  	if (err < 0) {
  		/*
  		 * The extensions in 'e' were validated successfully but will
  		 * never be handed over to the head; release them here so
  		 * they are not leaked.
  		 */
  		tcf_exts_destroy(tp, &e);
  		return err;
  	}
  
  	/* Both parts validated: swap them into the live head. */
  	tcf_exts_change(tp, &head->exts, &e);
  	tcf_em_tree_change(tp, &head->ematches, &t);
  
  	return 0;
  }
  
  static void cls_cgroup_destroy(struct tcf_proto *tp)
  {
47a1a1d4b   Patrick McHardy   pkt_sched: remove...
209
  	struct cls_cgroup_head *head = tp->root;
f40092373   Thomas Graf   pkt_sched: Contro...
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
  
  	if (head) {
  		tcf_exts_destroy(tp, &head->exts);
  		tcf_em_tree_destroy(tp, &head->ematches);
  		kfree(head);
  	}
  }
  
  /*
   * .delete operation: not supported by this classifier; always returns
   * -EOPNOTSUPP.
   */
  static int cls_cgroup_delete(struct tcf_proto *tp, unsigned long arg)
  {
  	return -EOPNOTSUPP;
  }
  
  /*
   * .walk operation: visit the single head of this classifier.
   *
   * The callback is invoked only once arg->count has reached arg->skip.
   * If it returns a negative value the walk is stopped (arg->stop = 1) and
   * the counter is left untouched; in every other case arg->count is
   * incremented.
   */
  static void cls_cgroup_walk(struct tcf_proto *tp, struct tcf_walker *arg)
  {
  	struct cls_cgroup_head *filter = tp->root;
  
  	if (arg->count >= arg->skip &&
  	    arg->fn(tp, (unsigned long) filter, arg) < 0) {
  		arg->stop = 1;
  		return;
  	}
  
  	arg->count++;
  }
  
  /*
   * .dump operation: write the classifier configuration into a netlink
   * message.
   *
   * Stores the head's handle in t->tcm_handle, emits the extensions and the
   * ematch tree inside a TCA_OPTIONS nest, then appends the extension
   * statistics. Returns skb->len on success. On any failure the message is
   * trimmed back to where this function started writing and -1 is returned.
   */
  static int cls_cgroup_dump(struct tcf_proto *tp, unsigned long fh,
  			   struct sk_buff *skb, struct tcmsg *t)
  {
  	struct cls_cgroup_head *filter = tp->root;
  	unsigned char *start = skb_tail_pointer(skb);
  	struct nlattr *opts;
  
  	t->tcm_handle = filter->handle;
  
  	opts = nla_nest_start(skb, TCA_OPTIONS);
  	if (!opts)
  		goto rollback;
  
  	if (tcf_exts_dump(skb, &filter->exts, &cgroup_ext_map) < 0)
  		goto rollback;
  
  	if (tcf_em_tree_dump(skb, &filter->ematches, TCA_CGROUP_EMATCHES) < 0)
  		goto rollback;
  
  	nla_nest_end(skb, opts);
  
  	if (tcf_exts_dump_stats(skb, &filter->exts, &cgroup_ext_map) < 0)
  		goto rollback;
  
  	return skb->len;
  
  rollback:
  	nlmsg_trim(skb, start);
  	return -1;
  }
  
  /*
   * Operations table of the "cgroup" classifier, registered by
   * init_cgroup_cls() and unregistered by exit_cgroup_cls(). Note that
   * .get/.put/.init are stubs and .delete always fails with -EOPNOTSUPP.
   */
  static struct tcf_proto_ops cls_cgroup_ops __read_mostly = {
  	.kind		=	"cgroup",
  	.init		=	cls_cgroup_init,
  	.change		=	cls_cgroup_change,
  	.classify	=	cls_cgroup_classify,
  	.destroy	=	cls_cgroup_destroy,
  	.get		=	cls_cgroup_get,
  	.put		=	cls_cgroup_put,
  	.delete		=	cls_cgroup_delete,
  	.walk		=	cls_cgroup_walk,
  	.dump		=	cls_cgroup_dump,
  	.owner		=	THIS_MODULE,
  };
  
  /*
   * Module init: load the net_cls cgroup subsystem, publish its id when it
   * is not fixed at build time, and register the "cgroup" classifier.
   *
   * Returns 0 on success or the error from cgroup_load_subsys() /
   * register_tcf_proto_ops(). If registering the classifier fails, the
   * subsystem is unloaded again.
   */
  static int __init init_cgroup_cls(void)
  {
  	int ret;
  
  	ret = cgroup_load_subsys(&net_cls_subsys);
  	if (ret)
  		goto out;
  
  #ifndef CONFIG_NET_CLS_CGROUP
  	/* We can't use rcu_assign_pointer because this is an int. */
  	smp_wmb();
  	net_cls_subsys_id = net_cls_subsys.subsys_id;
  #endif
  
  	ret = register_tcf_proto_ops(&cls_cgroup_ops);
  	if (ret) {
  #ifndef CONFIG_NET_CLS_CGROUP
  		/*
  		 * Withdraw the id published above before the subsystem goes
  		 * away, exactly as exit_cgroup_cls() does; otherwise
  		 * net_cls_subsys_id would keep naming an unloaded subsystem.
  		 * NOTE(review): presumably readers outside this file sample
  		 * net_cls_subsys_id under rcu_read_lock() - confirm.
  		 */
  		net_cls_subsys_id = -1;
  		synchronize_rcu();
  #endif
  		cgroup_unload_subsys(&net_cls_subsys);
  	}
  
  out:
  	return ret;
  }
  
  /*
   * Module exit: undo init_cgroup_cls() in reverse order.
   *
   * The classifier is unregistered first. When the subsystem id is not
   * fixed at build time, net_cls_subsys_id is reset to -1 and an RCU grace
   * period is waited for before the subsystem itself is unloaded.
   */
  static void __exit exit_cgroup_cls(void)
  {
  	unregister_tcf_proto_ops(&cls_cgroup_ops);
  
  #ifndef CONFIG_NET_CLS_CGROUP
  	/* Withdraw the published id, then wait out an RCU grace period. */
  	net_cls_subsys_id = -1;
  	synchronize_rcu();
  #endif
  
  	cgroup_unload_subsys(&net_cls_subsys);
  }
  
  /* Module entry/exit points and license declaration. */
  module_init(init_cgroup_cls);
  module_exit(exit_cgroup_cls);
  MODULE_LICENSE("GPL");