Commit | Line | Data |
---|---|---|
e5dfb815 PM |
1 | /* |
2 | * net/sched/cls_flow.c Generic flow classifier | |
3 | * | |
4 | * Copyright (c) 2007, 2008 Patrick McHardy <kaber@trash.net> | |
5 | * | |
6 | * This program is free software; you can redistribute it and/or | |
7 | * modify it under the terms of the GNU General Public License | |
8 | * as published by the Free Software Foundation; either version 2 | |
9 | * of the License, or (at your option) any later version. | |
10 | */ | |
11 | ||
12 | #include <linux/kernel.h> | |
13 | #include <linux/init.h> | |
14 | #include <linux/list.h> | |
15 | #include <linux/jhash.h> | |
16 | #include <linux/random.h> | |
17 | #include <linux/pkt_cls.h> | |
18 | #include <linux/skbuff.h> | |
19 | #include <linux/in.h> | |
20 | #include <linux/ip.h> | |
21 | #include <linux/ipv6.h> | |
9ec13810 | 22 | #include <linux/if_vlan.h> |
5a0e3ad6 | 23 | #include <linux/slab.h> |
3a9a231d | 24 | #include <linux/module.h> |
743b2a66 | 25 | #include <net/inet_sock.h> |
e5dfb815 PM |
26 | |
27 | #include <net/pkt_cls.h> | |
28 | #include <net/ip.h> | |
29 | #include <net/route.h> | |
1bd758eb | 30 | #include <net/flow_dissector.h> |
6bd2a9af | 31 | |
0013de38 | 32 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
e5dfb815 PM |
33 | #include <net/netfilter/nf_conntrack.h> |
34 | #endif | |
35 | ||
36 | struct flow_head { | |
37 | struct list_head filters; | |
70da9f0b | 38 | struct rcu_head rcu; |
e5dfb815 PM |
39 | }; |
40 | ||
41 | struct flow_filter { | |
42 | struct list_head list; | |
43 | struct tcf_exts exts; | |
44 | struct tcf_ematch_tree ematches; | |
70da9f0b | 45 | struct tcf_proto *tp; |
72d9794f PM |
46 | struct timer_list perturb_timer; |
47 | u32 perturb_period; | |
e5dfb815 PM |
48 | u32 handle; |
49 | ||
50 | u32 nkeys; | |
51 | u32 keymask; | |
52 | u32 mode; | |
53 | u32 mask; | |
54 | u32 xor; | |
55 | u32 rshift; | |
56 | u32 addend; | |
57 | u32 divisor; | |
58 | u32 baseclass; | |
72d9794f | 59 | u32 hashrnd; |
70da9f0b | 60 | struct rcu_head rcu; |
e5dfb815 PM |
61 | }; |
62 | ||
e5dfb815 PM |
63 | static inline u32 addr_fold(void *addr) |
64 | { | |
65 | unsigned long a = (unsigned long)addr; | |
66 | ||
67 | return (a & 0xFFFFFFFF) ^ (BITS_PER_LONG > 32 ? a >> 32 : 0); | |
68 | } | |
69 | ||
6bd2a9af | 70 | static u32 flow_get_src(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 71 | { |
c3f83241 TH |
72 | __be32 src = flow_get_u32_src(flow); |
73 | ||
74 | if (src) | |
75 | return ntohl(src); | |
76 | ||
4b95c3d4 | 77 | return addr_fold(skb->sk); |
e5dfb815 PM |
78 | } |
79 | ||
6bd2a9af | 80 | static u32 flow_get_dst(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 81 | { |
c3f83241 TH |
82 | __be32 dst = flow_get_u32_dst(flow); |
83 | ||
84 | if (dst) | |
85 | return ntohl(dst); | |
86 | ||
d8b9605d | 87 | return addr_fold(skb_dst(skb)) ^ (__force u16) tc_skb_protocol(skb); |
e5dfb815 PM |
88 | } |
89 | ||
6bd2a9af | 90 | static u32 flow_get_proto(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 91 | { |
06635a35 | 92 | return flow->basic.ip_proto; |
e5dfb815 PM |
93 | } |
94 | ||
6bd2a9af | 95 | static u32 flow_get_proto_src(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 96 | { |
06635a35 | 97 | if (flow->ports.ports) |
59346afe | 98 | return ntohs(flow->ports.src); |
e5dfb815 | 99 | |
859c2012 ED |
100 | return addr_fold(skb->sk); |
101 | } | |
102 | ||
6bd2a9af | 103 | static u32 flow_get_proto_dst(const struct sk_buff *skb, const struct flow_keys *flow) |
859c2012 | 104 | { |
06635a35 | 105 | if (flow->ports.ports) |
59346afe | 106 | return ntohs(flow->ports.dst); |
e5dfb815 | 107 | |
d8b9605d | 108 | return addr_fold(skb_dst(skb)) ^ (__force u16) tc_skb_protocol(skb); |
e5dfb815 PM |
109 | } |
110 | ||
111 | static u32 flow_get_iif(const struct sk_buff *skb) | |
112 | { | |
8964be4a | 113 | return skb->skb_iif; |
e5dfb815 PM |
114 | } |
115 | ||
116 | static u32 flow_get_priority(const struct sk_buff *skb) | |
117 | { | |
118 | return skb->priority; | |
119 | } | |
120 | ||
121 | static u32 flow_get_mark(const struct sk_buff *skb) | |
122 | { | |
123 | return skb->mark; | |
124 | } | |
125 | ||
126 | static u32 flow_get_nfct(const struct sk_buff *skb) | |
127 | { | |
0013de38 | 128 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
e5dfb815 PM |
129 | return addr_fold(skb->nfct); |
130 | #else | |
131 | return 0; | |
132 | #endif | |
133 | } | |
134 | ||
0013de38 | 135 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
e5dfb815 PM |
136 | #define CTTUPLE(skb, member) \ |
137 | ({ \ | |
138 | enum ip_conntrack_info ctinfo; \ | |
859c2012 | 139 | const struct nf_conn *ct = nf_ct_get(skb, &ctinfo); \ |
e5dfb815 PM |
140 | if (ct == NULL) \ |
141 | goto fallback; \ | |
142 | ct->tuplehash[CTINFO2DIR(ctinfo)].tuple.member; \ | |
143 | }) | |
144 | #else | |
145 | #define CTTUPLE(skb, member) \ | |
146 | ({ \ | |
147 | goto fallback; \ | |
148 | 0; \ | |
149 | }) | |
150 | #endif | |
151 | ||
6bd2a9af | 152 | static u32 flow_get_nfct_src(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 153 | { |
d8b9605d | 154 | switch (tc_skb_protocol(skb)) { |
60678040 | 155 | case htons(ETH_P_IP): |
e5dfb815 | 156 | return ntohl(CTTUPLE(skb, src.u3.ip)); |
60678040 | 157 | case htons(ETH_P_IPV6): |
e5dfb815 PM |
158 | return ntohl(CTTUPLE(skb, src.u3.ip6[3])); |
159 | } | |
160 | fallback: | |
6bd2a9af | 161 | return flow_get_src(skb, flow); |
e5dfb815 PM |
162 | } |
163 | ||
6bd2a9af | 164 | static u32 flow_get_nfct_dst(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 165 | { |
d8b9605d | 166 | switch (tc_skb_protocol(skb)) { |
60678040 | 167 | case htons(ETH_P_IP): |
e5dfb815 | 168 | return ntohl(CTTUPLE(skb, dst.u3.ip)); |
60678040 | 169 | case htons(ETH_P_IPV6): |
e5dfb815 PM |
170 | return ntohl(CTTUPLE(skb, dst.u3.ip6[3])); |
171 | } | |
172 | fallback: | |
6bd2a9af | 173 | return flow_get_dst(skb, flow); |
e5dfb815 PM |
174 | } |
175 | ||
6bd2a9af | 176 | static u32 flow_get_nfct_proto_src(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 PM |
177 | { |
178 | return ntohs(CTTUPLE(skb, src.u.all)); | |
179 | fallback: | |
6bd2a9af | 180 | return flow_get_proto_src(skb, flow); |
e5dfb815 PM |
181 | } |
182 | ||
6bd2a9af | 183 | static u32 flow_get_nfct_proto_dst(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 PM |
184 | { |
185 | return ntohs(CTTUPLE(skb, dst.u.all)); | |
186 | fallback: | |
6bd2a9af | 187 | return flow_get_proto_dst(skb, flow); |
e5dfb815 PM |
188 | } |
189 | ||
190 | static u32 flow_get_rtclassid(const struct sk_buff *skb) | |
191 | { | |
c7066f70 | 192 | #ifdef CONFIG_IP_ROUTE_CLASSID |
adf30907 ED |
193 | if (skb_dst(skb)) |
194 | return skb_dst(skb)->tclassid; | |
e5dfb815 PM |
195 | #endif |
196 | return 0; | |
197 | } | |
198 | ||
199 | static u32 flow_get_skuid(const struct sk_buff *skb) | |
200 | { | |
743b2a66 ED |
201 | struct sock *sk = skb_to_full_sk(skb); |
202 | ||
203 | if (sk && sk->sk_socket && sk->sk_socket->file) { | |
204 | kuid_t skuid = sk->sk_socket->file->f_cred->fsuid; | |
205 | ||
a6c6796c EB |
206 | return from_kuid(&init_user_ns, skuid); |
207 | } | |
e5dfb815 PM |
208 | return 0; |
209 | } | |
210 | ||
211 | static u32 flow_get_skgid(const struct sk_buff *skb) | |
212 | { | |
743b2a66 ED |
213 | struct sock *sk = skb_to_full_sk(skb); |
214 | ||
215 | if (sk && sk->sk_socket && sk->sk_socket->file) { | |
216 | kgid_t skgid = sk->sk_socket->file->f_cred->fsgid; | |
217 | ||
a6c6796c EB |
218 | return from_kgid(&init_user_ns, skgid); |
219 | } | |
e5dfb815 PM |
220 | return 0; |
221 | } | |
222 | ||
9ec13810 PM |
223 | static u32 flow_get_vlan_tag(const struct sk_buff *skb) |
224 | { | |
225 | u16 uninitialized_var(tag); | |
226 | ||
227 | if (vlan_get_tag(skb, &tag) < 0) | |
228 | return 0; | |
229 | return tag & VLAN_VID_MASK; | |
230 | } | |
231 | ||
739a91ef CG |
232 | static u32 flow_get_rxhash(struct sk_buff *skb) |
233 | { | |
3958afa1 | 234 | return skb_get_hash(skb); |
739a91ef CG |
235 | } |
236 | ||
6bd2a9af | 237 | static u32 flow_key_get(struct sk_buff *skb, int key, struct flow_keys *flow) |
e5dfb815 PM |
238 | { |
239 | switch (key) { | |
240 | case FLOW_KEY_SRC: | |
6bd2a9af | 241 | return flow_get_src(skb, flow); |
e5dfb815 | 242 | case FLOW_KEY_DST: |
6bd2a9af | 243 | return flow_get_dst(skb, flow); |
e5dfb815 | 244 | case FLOW_KEY_PROTO: |
6bd2a9af | 245 | return flow_get_proto(skb, flow); |
e5dfb815 | 246 | case FLOW_KEY_PROTO_SRC: |
6bd2a9af | 247 | return flow_get_proto_src(skb, flow); |
e5dfb815 | 248 | case FLOW_KEY_PROTO_DST: |
6bd2a9af | 249 | return flow_get_proto_dst(skb, flow); |
e5dfb815 PM |
250 | case FLOW_KEY_IIF: |
251 | return flow_get_iif(skb); | |
252 | case FLOW_KEY_PRIORITY: | |
253 | return flow_get_priority(skb); | |
254 | case FLOW_KEY_MARK: | |
255 | return flow_get_mark(skb); | |
256 | case FLOW_KEY_NFCT: | |
257 | return flow_get_nfct(skb); | |
258 | case FLOW_KEY_NFCT_SRC: | |
6bd2a9af | 259 | return flow_get_nfct_src(skb, flow); |
e5dfb815 | 260 | case FLOW_KEY_NFCT_DST: |
6bd2a9af | 261 | return flow_get_nfct_dst(skb, flow); |
e5dfb815 | 262 | case FLOW_KEY_NFCT_PROTO_SRC: |
6bd2a9af | 263 | return flow_get_nfct_proto_src(skb, flow); |
e5dfb815 | 264 | case FLOW_KEY_NFCT_PROTO_DST: |
6bd2a9af | 265 | return flow_get_nfct_proto_dst(skb, flow); |
e5dfb815 PM |
266 | case FLOW_KEY_RTCLASSID: |
267 | return flow_get_rtclassid(skb); | |
268 | case FLOW_KEY_SKUID: | |
269 | return flow_get_skuid(skb); | |
270 | case FLOW_KEY_SKGID: | |
271 | return flow_get_skgid(skb); | |
9ec13810 PM |
272 | case FLOW_KEY_VLAN_TAG: |
273 | return flow_get_vlan_tag(skb); | |
739a91ef CG |
274 | case FLOW_KEY_RXHASH: |
275 | return flow_get_rxhash(skb); | |
e5dfb815 PM |
276 | default: |
277 | WARN_ON(1); | |
278 | return 0; | |
279 | } | |
280 | } | |
281 | ||
6bd2a9af ED |
/*
 * Keys whose extraction reads the dissected struct flow_keys.  When a
 * filter's keymask intersects this set, flow_classify() runs the flow
 * dissector before extracting key values.
 */
#define FLOW_KEYS_NEEDED	((1 << FLOW_KEY_SRC) |			\
				 (1 << FLOW_KEY_DST) |			\
				 (1 << FLOW_KEY_PROTO) |		\
				 (1 << FLOW_KEY_PROTO_SRC) |		\
				 (1 << FLOW_KEY_PROTO_DST) |		\
				 (1 << FLOW_KEY_NFCT_SRC) |		\
				 (1 << FLOW_KEY_NFCT_DST) |		\
				 (1 << FLOW_KEY_NFCT_PROTO_SRC) |	\
				 (1 << FLOW_KEY_NFCT_PROTO_DST))
291 | ||
dc7f9f6e | 292 | static int flow_classify(struct sk_buff *skb, const struct tcf_proto *tp, |
e5dfb815 PM |
293 | struct tcf_result *res) |
294 | { | |
70da9f0b | 295 | struct flow_head *head = rcu_dereference_bh(tp->root); |
e5dfb815 PM |
296 | struct flow_filter *f; |
297 | u32 keymask; | |
298 | u32 classid; | |
299 | unsigned int n, key; | |
300 | int r; | |
301 | ||
70da9f0b | 302 | list_for_each_entry_rcu(f, &head->filters, list) { |
3a53943b | 303 | u32 keys[FLOW_KEY_MAX + 1]; |
6bd2a9af | 304 | struct flow_keys flow_keys; |
e5dfb815 PM |
305 | |
306 | if (!tcf_em_tree_match(skb, &f->ematches, NULL)) | |
307 | continue; | |
308 | ||
309 | keymask = f->keymask; | |
6bd2a9af | 310 | if (keymask & FLOW_KEYS_NEEDED) |
cd79a238 | 311 | skb_flow_dissect_flow_keys(skb, &flow_keys, 0); |
e5dfb815 PM |
312 | |
313 | for (n = 0; n < f->nkeys; n++) { | |
314 | key = ffs(keymask) - 1; | |
315 | keymask &= ~(1 << key); | |
6bd2a9af | 316 | keys[n] = flow_key_get(skb, key, &flow_keys); |
e5dfb815 PM |
317 | } |
318 | ||
319 | if (f->mode == FLOW_MODE_HASH) | |
72d9794f | 320 | classid = jhash2(keys, f->nkeys, f->hashrnd); |
e5dfb815 PM |
321 | else { |
322 | classid = keys[0]; | |
323 | classid = (classid & f->mask) ^ f->xor; | |
324 | classid = (classid >> f->rshift) + f->addend; | |
325 | } | |
326 | ||
327 | if (f->divisor) | |
328 | classid %= f->divisor; | |
329 | ||
330 | res->class = 0; | |
331 | res->classid = TC_H_MAKE(f->baseclass, f->baseclass + classid); | |
332 | ||
333 | r = tcf_exts_exec(skb, &f->exts, res); | |
334 | if (r < 0) | |
335 | continue; | |
336 | return r; | |
337 | } | |
338 | return -1; | |
339 | } | |
340 | ||
72d9794f PM |
341 | static void flow_perturbation(unsigned long arg) |
342 | { | |
343 | struct flow_filter *f = (struct flow_filter *)arg; | |
344 | ||
345 | get_random_bytes(&f->hashrnd, 4); | |
346 | if (f->perturb_period) | |
347 | mod_timer(&f->perturb_timer, jiffies + f->perturb_period); | |
348 | } | |
349 | ||
e5dfb815 PM |
350 | static const struct nla_policy flow_policy[TCA_FLOW_MAX + 1] = { |
351 | [TCA_FLOW_KEYS] = { .type = NLA_U32 }, | |
352 | [TCA_FLOW_MODE] = { .type = NLA_U32 }, | |
353 | [TCA_FLOW_BASECLASS] = { .type = NLA_U32 }, | |
354 | [TCA_FLOW_RSHIFT] = { .type = NLA_U32 }, | |
355 | [TCA_FLOW_ADDEND] = { .type = NLA_U32 }, | |
356 | [TCA_FLOW_MASK] = { .type = NLA_U32 }, | |
357 | [TCA_FLOW_XOR] = { .type = NLA_U32 }, | |
358 | [TCA_FLOW_DIVISOR] = { .type = NLA_U32 }, | |
359 | [TCA_FLOW_ACT] = { .type = NLA_NESTED }, | |
360 | [TCA_FLOW_POLICE] = { .type = NLA_NESTED }, | |
361 | [TCA_FLOW_EMATCHES] = { .type = NLA_NESTED }, | |
72d9794f | 362 | [TCA_FLOW_PERTURB] = { .type = NLA_U32 }, |
e5dfb815 PM |
363 | }; |
364 | ||
70da9f0b JF |
365 | static void flow_destroy_filter(struct rcu_head *head) |
366 | { | |
367 | struct flow_filter *f = container_of(head, struct flow_filter, rcu); | |
368 | ||
369 | del_timer_sync(&f->perturb_timer); | |
18d0264f | 370 | tcf_exts_destroy(&f->exts); |
82a470f1 | 371 | tcf_em_tree_destroy(&f->ematches); |
70da9f0b JF |
372 | kfree(f); |
373 | } | |
374 | ||
c1b52739 | 375 | static int flow_change(struct net *net, struct sk_buff *in_skb, |
af4c6641 | 376 | struct tcf_proto *tp, unsigned long base, |
e5dfb815 | 377 | u32 handle, struct nlattr **tca, |
2f7ef2f8 | 378 | unsigned long *arg, bool ovr) |
e5dfb815 | 379 | { |
70da9f0b JF |
380 | struct flow_head *head = rtnl_dereference(tp->root); |
381 | struct flow_filter *fold, *fnew; | |
e5dfb815 PM |
382 | struct nlattr *opt = tca[TCA_OPTIONS]; |
383 | struct nlattr *tb[TCA_FLOW_MAX + 1]; | |
384 | struct tcf_exts e; | |
385 | struct tcf_ematch_tree t; | |
386 | unsigned int nkeys = 0; | |
72d9794f | 387 | unsigned int perturb_period = 0; |
e5dfb815 PM |
388 | u32 baseclass = 0; |
389 | u32 keymask = 0; | |
390 | u32 mode; | |
391 | int err; | |
392 | ||
393 | if (opt == NULL) | |
394 | return -EINVAL; | |
395 | ||
396 | err = nla_parse_nested(tb, TCA_FLOW_MAX, opt, flow_policy); | |
397 | if (err < 0) | |
398 | return err; | |
399 | ||
400 | if (tb[TCA_FLOW_BASECLASS]) { | |
401 | baseclass = nla_get_u32(tb[TCA_FLOW_BASECLASS]); | |
402 | if (TC_H_MIN(baseclass) == 0) | |
403 | return -EINVAL; | |
404 | } | |
405 | ||
406 | if (tb[TCA_FLOW_KEYS]) { | |
407 | keymask = nla_get_u32(tb[TCA_FLOW_KEYS]); | |
e5dfb815 PM |
408 | |
409 | nkeys = hweight32(keymask); | |
410 | if (nkeys == 0) | |
411 | return -EINVAL; | |
4f250491 PM |
412 | |
413 | if (fls(keymask) - 1 > FLOW_KEY_MAX) | |
414 | return -EOPNOTSUPP; | |
a6c6796c EB |
415 | |
416 | if ((keymask & (FLOW_KEY_SKUID|FLOW_KEY_SKGID)) && | |
e32123e5 | 417 | sk_user_ns(NETLINK_CB(in_skb).sk) != &init_user_ns) |
a6c6796c | 418 | return -EOPNOTSUPP; |
e5dfb815 PM |
419 | } |
420 | ||
b9a24bb7 WC |
421 | err = tcf_exts_init(&e, TCA_FLOW_ACT, TCA_FLOW_POLICE); |
422 | if (err < 0) | |
423 | goto err1; | |
2f7ef2f8 | 424 | err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr); |
e5dfb815 | 425 | if (err < 0) |
b9a24bb7 | 426 | goto err1; |
e5dfb815 PM |
427 | |
428 | err = tcf_em_tree_validate(tp, tb[TCA_FLOW_EMATCHES], &t); | |
429 | if (err < 0) | |
430 | goto err1; | |
431 | ||
70da9f0b JF |
432 | err = -ENOBUFS; |
433 | fnew = kzalloc(sizeof(*fnew), GFP_KERNEL); | |
434 | if (!fnew) | |
435 | goto err2; | |
436 | ||
b9a24bb7 WC |
437 | err = tcf_exts_init(&fnew->exts, TCA_FLOW_ACT, TCA_FLOW_POLICE); |
438 | if (err < 0) | |
439 | goto err3; | |
32b2f4b1 | 440 | |
70da9f0b JF |
441 | fold = (struct flow_filter *)*arg; |
442 | if (fold) { | |
e5dfb815 | 443 | err = -EINVAL; |
70da9f0b | 444 | if (fold->handle != handle && handle) |
b9a24bb7 | 445 | goto err3; |
e5dfb815 | 446 | |
70da9f0b | 447 | /* Copy fold into fnew */ |
70da9f0b | 448 | fnew->tp = fold->tp; |
70da9f0b JF |
449 | fnew->handle = fold->handle; |
450 | fnew->nkeys = fold->nkeys; | |
451 | fnew->keymask = fold->keymask; | |
452 | fnew->mode = fold->mode; | |
453 | fnew->mask = fold->mask; | |
454 | fnew->xor = fold->xor; | |
455 | fnew->rshift = fold->rshift; | |
456 | fnew->addend = fold->addend; | |
457 | fnew->divisor = fold->divisor; | |
458 | fnew->baseclass = fold->baseclass; | |
459 | fnew->hashrnd = fold->hashrnd; | |
460 | ||
461 | mode = fold->mode; | |
e5dfb815 PM |
462 | if (tb[TCA_FLOW_MODE]) |
463 | mode = nla_get_u32(tb[TCA_FLOW_MODE]); | |
464 | if (mode != FLOW_MODE_HASH && nkeys > 1) | |
b9a24bb7 | 465 | goto err3; |
72d9794f PM |
466 | |
467 | if (mode == FLOW_MODE_HASH) | |
70da9f0b | 468 | perturb_period = fold->perturb_period; |
72d9794f PM |
469 | if (tb[TCA_FLOW_PERTURB]) { |
470 | if (mode != FLOW_MODE_HASH) | |
b9a24bb7 | 471 | goto err3; |
72d9794f PM |
472 | perturb_period = nla_get_u32(tb[TCA_FLOW_PERTURB]) * HZ; |
473 | } | |
e5dfb815 PM |
474 | } else { |
475 | err = -EINVAL; | |
476 | if (!handle) | |
b9a24bb7 | 477 | goto err3; |
e5dfb815 | 478 | if (!tb[TCA_FLOW_KEYS]) |
b9a24bb7 | 479 | goto err3; |
e5dfb815 PM |
480 | |
481 | mode = FLOW_MODE_MAP; | |
482 | if (tb[TCA_FLOW_MODE]) | |
483 | mode = nla_get_u32(tb[TCA_FLOW_MODE]); | |
484 | if (mode != FLOW_MODE_HASH && nkeys > 1) | |
b9a24bb7 | 485 | goto err3; |
e5dfb815 | 486 | |
72d9794f PM |
487 | if (tb[TCA_FLOW_PERTURB]) { |
488 | if (mode != FLOW_MODE_HASH) | |
b9a24bb7 | 489 | goto err3; |
72d9794f PM |
490 | perturb_period = nla_get_u32(tb[TCA_FLOW_PERTURB]) * HZ; |
491 | } | |
492 | ||
e5dfb815 PM |
493 | if (TC_H_MAJ(baseclass) == 0) |
494 | baseclass = TC_H_MAKE(tp->q->handle, baseclass); | |
495 | if (TC_H_MIN(baseclass) == 0) | |
496 | baseclass = TC_H_MAKE(baseclass, 1); | |
497 | ||
70da9f0b JF |
498 | fnew->handle = handle; |
499 | fnew->mask = ~0U; | |
500 | fnew->tp = tp; | |
501 | get_random_bytes(&fnew->hashrnd, 4); | |
e5dfb815 PM |
502 | } |
503 | ||
70da9f0b JF |
504 | fnew->perturb_timer.function = flow_perturbation; |
505 | fnew->perturb_timer.data = (unsigned long)fnew; | |
506 | init_timer_deferrable(&fnew->perturb_timer); | |
e5dfb815 | 507 | |
70da9f0b JF |
508 | tcf_exts_change(tp, &fnew->exts, &e); |
509 | tcf_em_tree_change(tp, &fnew->ematches, &t); | |
e5dfb815 | 510 | |
02875878 ED |
511 | netif_keep_dst(qdisc_dev(tp->q)); |
512 | ||
e5dfb815 | 513 | if (tb[TCA_FLOW_KEYS]) { |
70da9f0b JF |
514 | fnew->keymask = keymask; |
515 | fnew->nkeys = nkeys; | |
e5dfb815 PM |
516 | } |
517 | ||
70da9f0b | 518 | fnew->mode = mode; |
e5dfb815 PM |
519 | |
520 | if (tb[TCA_FLOW_MASK]) | |
70da9f0b | 521 | fnew->mask = nla_get_u32(tb[TCA_FLOW_MASK]); |
e5dfb815 | 522 | if (tb[TCA_FLOW_XOR]) |
70da9f0b | 523 | fnew->xor = nla_get_u32(tb[TCA_FLOW_XOR]); |
e5dfb815 | 524 | if (tb[TCA_FLOW_RSHIFT]) |
70da9f0b | 525 | fnew->rshift = nla_get_u32(tb[TCA_FLOW_RSHIFT]); |
e5dfb815 | 526 | if (tb[TCA_FLOW_ADDEND]) |
70da9f0b | 527 | fnew->addend = nla_get_u32(tb[TCA_FLOW_ADDEND]); |
e5dfb815 PM |
528 | |
529 | if (tb[TCA_FLOW_DIVISOR]) | |
70da9f0b | 530 | fnew->divisor = nla_get_u32(tb[TCA_FLOW_DIVISOR]); |
e5dfb815 | 531 | if (baseclass) |
70da9f0b | 532 | fnew->baseclass = baseclass; |
e5dfb815 | 533 | |
70da9f0b | 534 | fnew->perturb_period = perturb_period; |
72d9794f | 535 | if (perturb_period) |
70da9f0b | 536 | mod_timer(&fnew->perturb_timer, jiffies + perturb_period); |
72d9794f | 537 | |
e5dfb815 | 538 | if (*arg == 0) |
70da9f0b JF |
539 | list_add_tail_rcu(&fnew->list, &head->filters); |
540 | else | |
32b2f4b1 | 541 | list_replace_rcu(&fold->list, &fnew->list); |
e5dfb815 | 542 | |
70da9f0b | 543 | *arg = (unsigned long)fnew; |
e5dfb815 | 544 | |
70da9f0b JF |
545 | if (fold) |
546 | call_rcu(&fold->rcu, flow_destroy_filter); | |
e5dfb815 PM |
547 | return 0; |
548 | ||
b9a24bb7 WC |
549 | err3: |
550 | tcf_exts_destroy(&fnew->exts); | |
e5dfb815 | 551 | err2: |
82a470f1 | 552 | tcf_em_tree_destroy(&t); |
70da9f0b | 553 | kfree(fnew); |
e5dfb815 | 554 | err1: |
18d0264f | 555 | tcf_exts_destroy(&e); |
e5dfb815 PM |
556 | return err; |
557 | } | |
558 | ||
e5dfb815 PM |
559 | static int flow_delete(struct tcf_proto *tp, unsigned long arg) |
560 | { | |
561 | struct flow_filter *f = (struct flow_filter *)arg; | |
562 | ||
70da9f0b JF |
563 | list_del_rcu(&f->list); |
564 | call_rcu(&f->rcu, flow_destroy_filter); | |
e5dfb815 PM |
565 | return 0; |
566 | } | |
567 | ||
568 | static int flow_init(struct tcf_proto *tp) | |
569 | { | |
570 | struct flow_head *head; | |
571 | ||
e5dfb815 PM |
572 | head = kzalloc(sizeof(*head), GFP_KERNEL); |
573 | if (head == NULL) | |
574 | return -ENOBUFS; | |
575 | INIT_LIST_HEAD(&head->filters); | |
70da9f0b | 576 | rcu_assign_pointer(tp->root, head); |
e5dfb815 PM |
577 | return 0; |
578 | } | |
579 | ||
1e052be6 | 580 | static bool flow_destroy(struct tcf_proto *tp, bool force) |
e5dfb815 | 581 | { |
70da9f0b | 582 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
583 | struct flow_filter *f, *next; |
584 | ||
1e052be6 CW |
585 | if (!force && !list_empty(&head->filters)) |
586 | return false; | |
587 | ||
e5dfb815 | 588 | list_for_each_entry_safe(f, next, &head->filters, list) { |
70da9f0b JF |
589 | list_del_rcu(&f->list); |
590 | call_rcu(&f->rcu, flow_destroy_filter); | |
e5dfb815 | 591 | } |
70da9f0b JF |
592 | RCU_INIT_POINTER(tp->root, NULL); |
593 | kfree_rcu(head, rcu); | |
1e052be6 | 594 | return true; |
e5dfb815 PM |
595 | } |
596 | ||
597 | static unsigned long flow_get(struct tcf_proto *tp, u32 handle) | |
598 | { | |
70da9f0b | 599 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
600 | struct flow_filter *f; |
601 | ||
6a659cd0 | 602 | list_for_each_entry(f, &head->filters, list) |
e5dfb815 PM |
603 | if (f->handle == handle) |
604 | return (unsigned long)f; | |
605 | return 0; | |
606 | } | |
607 | ||
832d1d5b | 608 | static int flow_dump(struct net *net, struct tcf_proto *tp, unsigned long fh, |
e5dfb815 PM |
609 | struct sk_buff *skb, struct tcmsg *t) |
610 | { | |
611 | struct flow_filter *f = (struct flow_filter *)fh; | |
612 | struct nlattr *nest; | |
613 | ||
614 | if (f == NULL) | |
615 | return skb->len; | |
616 | ||
617 | t->tcm_handle = f->handle; | |
618 | ||
619 | nest = nla_nest_start(skb, TCA_OPTIONS); | |
620 | if (nest == NULL) | |
621 | goto nla_put_failure; | |
622 | ||
1b34ec43 DM |
623 | if (nla_put_u32(skb, TCA_FLOW_KEYS, f->keymask) || |
624 | nla_put_u32(skb, TCA_FLOW_MODE, f->mode)) | |
625 | goto nla_put_failure; | |
e5dfb815 PM |
626 | |
627 | if (f->mask != ~0 || f->xor != 0) { | |
1b34ec43 DM |
628 | if (nla_put_u32(skb, TCA_FLOW_MASK, f->mask) || |
629 | nla_put_u32(skb, TCA_FLOW_XOR, f->xor)) | |
630 | goto nla_put_failure; | |
e5dfb815 | 631 | } |
1b34ec43 DM |
632 | if (f->rshift && |
633 | nla_put_u32(skb, TCA_FLOW_RSHIFT, f->rshift)) | |
634 | goto nla_put_failure; | |
635 | if (f->addend && | |
636 | nla_put_u32(skb, TCA_FLOW_ADDEND, f->addend)) | |
637 | goto nla_put_failure; | |
e5dfb815 | 638 | |
1b34ec43 DM |
639 | if (f->divisor && |
640 | nla_put_u32(skb, TCA_FLOW_DIVISOR, f->divisor)) | |
641 | goto nla_put_failure; | |
642 | if (f->baseclass && | |
643 | nla_put_u32(skb, TCA_FLOW_BASECLASS, f->baseclass)) | |
644 | goto nla_put_failure; | |
e5dfb815 | 645 | |
1b34ec43 DM |
646 | if (f->perturb_period && |
647 | nla_put_u32(skb, TCA_FLOW_PERTURB, f->perturb_period / HZ)) | |
648 | goto nla_put_failure; | |
72d9794f | 649 | |
5da57f42 | 650 | if (tcf_exts_dump(skb, &f->exts) < 0) |
e5dfb815 | 651 | goto nla_put_failure; |
0aead543 | 652 | #ifdef CONFIG_NET_EMATCH |
e5dfb815 PM |
653 | if (f->ematches.hdr.nmatches && |
654 | tcf_em_tree_dump(skb, &f->ematches, TCA_FLOW_EMATCHES) < 0) | |
655 | goto nla_put_failure; | |
0aead543 | 656 | #endif |
e5dfb815 PM |
657 | nla_nest_end(skb, nest); |
658 | ||
5da57f42 | 659 | if (tcf_exts_dump_stats(skb, &f->exts) < 0) |
e5dfb815 PM |
660 | goto nla_put_failure; |
661 | ||
662 | return skb->len; | |
663 | ||
664 | nla_put_failure: | |
6ea3b446 | 665 | nla_nest_cancel(skb, nest); |
e5dfb815 PM |
666 | return -1; |
667 | } | |
668 | ||
669 | static void flow_walk(struct tcf_proto *tp, struct tcf_walker *arg) | |
670 | { | |
70da9f0b | 671 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
672 | struct flow_filter *f; |
673 | ||
6a659cd0 | 674 | list_for_each_entry(f, &head->filters, list) { |
e5dfb815 PM |
675 | if (arg->count < arg->skip) |
676 | goto skip; | |
677 | if (arg->fn(tp, (unsigned long)f, arg) < 0) { | |
678 | arg->stop = 1; | |
679 | break; | |
680 | } | |
681 | skip: | |
682 | arg->count++; | |
683 | } | |
684 | } | |
685 | ||
686 | static struct tcf_proto_ops cls_flow_ops __read_mostly = { | |
687 | .kind = "flow", | |
688 | .classify = flow_classify, | |
689 | .init = flow_init, | |
690 | .destroy = flow_destroy, | |
691 | .change = flow_change, | |
692 | .delete = flow_delete, | |
693 | .get = flow_get, | |
e5dfb815 PM |
694 | .dump = flow_dump, |
695 | .walk = flow_walk, | |
696 | .owner = THIS_MODULE, | |
697 | }; | |
698 | ||
699 | static int __init cls_flow_init(void) | |
700 | { | |
701 | return register_tcf_proto_ops(&cls_flow_ops); | |
702 | } | |
703 | ||
704 | static void __exit cls_flow_exit(void) | |
705 | { | |
706 | unregister_tcf_proto_ops(&cls_flow_ops); | |
707 | } | |
708 | ||
709 | module_init(cls_flow_init); | |
710 | module_exit(cls_flow_exit); | |
711 | ||
712 | MODULE_LICENSE("GPL"); | |
713 | MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>"); | |
714 | MODULE_DESCRIPTION("TC flow classifier"); |