Commit | Line | Data |
---|---|---|
2874c5fd | 1 | // SPDX-License-Identifier: GPL-2.0-or-later |
e5dfb815 PM |
2 | /* |
3 | * net/sched/cls_flow.c Generic flow classifier | |
4 | * | |
5 | * Copyright (c) 2007, 2008 Patrick McHardy <kaber@trash.net> | |
e5dfb815 PM |
6 | */ |
7 | ||
8 | #include <linux/kernel.h> | |
9 | #include <linux/init.h> | |
10 | #include <linux/list.h> | |
11 | #include <linux/jhash.h> | |
12 | #include <linux/random.h> | |
13 | #include <linux/pkt_cls.h> | |
14 | #include <linux/skbuff.h> | |
15 | #include <linux/in.h> | |
16 | #include <linux/ip.h> | |
17 | #include <linux/ipv6.h> | |
9ec13810 | 18 | #include <linux/if_vlan.h> |
5a0e3ad6 | 19 | #include <linux/slab.h> |
3a9a231d | 20 | #include <linux/module.h> |
743b2a66 | 21 | #include <net/inet_sock.h> |
e5dfb815 PM |
22 | |
23 | #include <net/pkt_cls.h> | |
24 | #include <net/ip.h> | |
25 | #include <net/route.h> | |
1bd758eb | 26 | #include <net/flow_dissector.h> |
6bd2a9af | 27 | |
0013de38 | 28 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
e5dfb815 PM |
29 | #include <net/netfilter/nf_conntrack.h> |
30 | #endif | |
31 | ||
32 | struct flow_head { | |
33 | struct list_head filters; | |
70da9f0b | 34 | struct rcu_head rcu; |
e5dfb815 PM |
35 | }; |
36 | ||
37 | struct flow_filter { | |
38 | struct list_head list; | |
39 | struct tcf_exts exts; | |
40 | struct tcf_ematch_tree ematches; | |
70da9f0b | 41 | struct tcf_proto *tp; |
72d9794f PM |
42 | struct timer_list perturb_timer; |
43 | u32 perturb_period; | |
e5dfb815 PM |
44 | u32 handle; |
45 | ||
46 | u32 nkeys; | |
47 | u32 keymask; | |
48 | u32 mode; | |
49 | u32 mask; | |
50 | u32 xor; | |
51 | u32 rshift; | |
52 | u32 addend; | |
53 | u32 divisor; | |
54 | u32 baseclass; | |
72d9794f | 55 | u32 hashrnd; |
aaa908ff | 56 | struct rcu_work rwork; |
e5dfb815 PM |
57 | }; |
58 | ||
e5dfb815 PM |
59 | static inline u32 addr_fold(void *addr) |
60 | { | |
61 | unsigned long a = (unsigned long)addr; | |
62 | ||
63 | return (a & 0xFFFFFFFF) ^ (BITS_PER_LONG > 32 ? a >> 32 : 0); | |
64 | } | |
65 | ||
6bd2a9af | 66 | static u32 flow_get_src(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 67 | { |
c3f83241 TH |
68 | __be32 src = flow_get_u32_src(flow); |
69 | ||
70 | if (src) | |
71 | return ntohl(src); | |
72 | ||
4b95c3d4 | 73 | return addr_fold(skb->sk); |
e5dfb815 PM |
74 | } |
75 | ||
6bd2a9af | 76 | static u32 flow_get_dst(const struct sk_buff *skb, const struct flow_keys *flow) |
e5dfb815 | 77 | { |
c3f83241 TH |
78 | __be32 dst = flow_get_u32_dst(flow); |
79 | ||
80 | if (dst) | |
81 | return ntohl(dst); | |
82 | ||
d7bf2ebe | 83 | return addr_fold(skb_dst(skb)) ^ (__force u16)skb_protocol(skb, true); |
e5dfb815 PM |
84 | } |
85 | ||
5a7a5555 JHS |
86 | static u32 flow_get_proto(const struct sk_buff *skb, |
87 | const struct flow_keys *flow) | |
e5dfb815 | 88 | { |
06635a35 | 89 | return flow->basic.ip_proto; |
e5dfb815 PM |
90 | } |
91 | ||
5a7a5555 JHS |
92 | static u32 flow_get_proto_src(const struct sk_buff *skb, |
93 | const struct flow_keys *flow) | |
e5dfb815 | 94 | { |
06635a35 | 95 | if (flow->ports.ports) |
59346afe | 96 | return ntohs(flow->ports.src); |
e5dfb815 | 97 | |
859c2012 ED |
98 | return addr_fold(skb->sk); |
99 | } | |
100 | ||
5a7a5555 JHS |
101 | static u32 flow_get_proto_dst(const struct sk_buff *skb, |
102 | const struct flow_keys *flow) | |
859c2012 | 103 | { |
06635a35 | 104 | if (flow->ports.ports) |
59346afe | 105 | return ntohs(flow->ports.dst); |
e5dfb815 | 106 | |
d7bf2ebe | 107 | return addr_fold(skb_dst(skb)) ^ (__force u16)skb_protocol(skb, true); |
e5dfb815 PM |
108 | } |
109 | ||
110 | static u32 flow_get_iif(const struct sk_buff *skb) | |
111 | { | |
8964be4a | 112 | return skb->skb_iif; |
e5dfb815 PM |
113 | } |
114 | ||
115 | static u32 flow_get_priority(const struct sk_buff *skb) | |
116 | { | |
117 | return skb->priority; | |
118 | } | |
119 | ||
120 | static u32 flow_get_mark(const struct sk_buff *skb) | |
121 | { | |
122 | return skb->mark; | |
123 | } | |
124 | ||
125 | static u32 flow_get_nfct(const struct sk_buff *skb) | |
126 | { | |
0013de38 | 127 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
cb9c6836 | 128 | return addr_fold(skb_nfct(skb)); |
e5dfb815 PM |
129 | #else |
130 | return 0; | |
131 | #endif | |
132 | } | |
133 | ||
0013de38 | 134 | #if IS_ENABLED(CONFIG_NF_CONNTRACK) |
e5dfb815 PM |
135 | #define CTTUPLE(skb, member) \ |
136 | ({ \ | |
137 | enum ip_conntrack_info ctinfo; \ | |
859c2012 | 138 | const struct nf_conn *ct = nf_ct_get(skb, &ctinfo); \ |
e5dfb815 PM |
139 | if (ct == NULL) \ |
140 | goto fallback; \ | |
141 | ct->tuplehash[CTINFO2DIR(ctinfo)].tuple.member; \ | |
142 | }) | |
143 | #else | |
144 | #define CTTUPLE(skb, member) \ | |
145 | ({ \ | |
146 | goto fallback; \ | |
147 | 0; \ | |
148 | }) | |
149 | #endif | |
150 | ||
5a7a5555 JHS |
151 | static u32 flow_get_nfct_src(const struct sk_buff *skb, |
152 | const struct flow_keys *flow) | |
e5dfb815 | 153 | { |
d7bf2ebe | 154 | switch (skb_protocol(skb, true)) { |
60678040 | 155 | case htons(ETH_P_IP): |
e5dfb815 | 156 | return ntohl(CTTUPLE(skb, src.u3.ip)); |
60678040 | 157 | case htons(ETH_P_IPV6): |
e5dfb815 PM |
158 | return ntohl(CTTUPLE(skb, src.u3.ip6[3])); |
159 | } | |
160 | fallback: | |
6bd2a9af | 161 | return flow_get_src(skb, flow); |
e5dfb815 PM |
162 | } |
163 | ||
5a7a5555 JHS |
164 | static u32 flow_get_nfct_dst(const struct sk_buff *skb, |
165 | const struct flow_keys *flow) | |
e5dfb815 | 166 | { |
d7bf2ebe | 167 | switch (skb_protocol(skb, true)) { |
60678040 | 168 | case htons(ETH_P_IP): |
e5dfb815 | 169 | return ntohl(CTTUPLE(skb, dst.u3.ip)); |
60678040 | 170 | case htons(ETH_P_IPV6): |
e5dfb815 PM |
171 | return ntohl(CTTUPLE(skb, dst.u3.ip6[3])); |
172 | } | |
173 | fallback: | |
6bd2a9af | 174 | return flow_get_dst(skb, flow); |
e5dfb815 PM |
175 | } |
176 | ||
5a7a5555 JHS |
177 | static u32 flow_get_nfct_proto_src(const struct sk_buff *skb, |
178 | const struct flow_keys *flow) | |
e5dfb815 PM |
179 | { |
180 | return ntohs(CTTUPLE(skb, src.u.all)); | |
181 | fallback: | |
6bd2a9af | 182 | return flow_get_proto_src(skb, flow); |
e5dfb815 PM |
183 | } |
184 | ||
5a7a5555 JHS |
185 | static u32 flow_get_nfct_proto_dst(const struct sk_buff *skb, |
186 | const struct flow_keys *flow) | |
e5dfb815 PM |
187 | { |
188 | return ntohs(CTTUPLE(skb, dst.u.all)); | |
189 | fallback: | |
6bd2a9af | 190 | return flow_get_proto_dst(skb, flow); |
e5dfb815 PM |
191 | } |
192 | ||
193 | static u32 flow_get_rtclassid(const struct sk_buff *skb) | |
194 | { | |
c7066f70 | 195 | #ifdef CONFIG_IP_ROUTE_CLASSID |
adf30907 ED |
196 | if (skb_dst(skb)) |
197 | return skb_dst(skb)->tclassid; | |
e5dfb815 PM |
198 | #endif |
199 | return 0; | |
200 | } | |
201 | ||
202 | static u32 flow_get_skuid(const struct sk_buff *skb) | |
203 | { | |
743b2a66 ED |
204 | struct sock *sk = skb_to_full_sk(skb); |
205 | ||
206 | if (sk && sk->sk_socket && sk->sk_socket->file) { | |
207 | kuid_t skuid = sk->sk_socket->file->f_cred->fsuid; | |
208 | ||
a6c6796c EB |
209 | return from_kuid(&init_user_ns, skuid); |
210 | } | |
e5dfb815 PM |
211 | return 0; |
212 | } | |
213 | ||
214 | static u32 flow_get_skgid(const struct sk_buff *skb) | |
215 | { | |
743b2a66 ED |
216 | struct sock *sk = skb_to_full_sk(skb); |
217 | ||
218 | if (sk && sk->sk_socket && sk->sk_socket->file) { | |
219 | kgid_t skgid = sk->sk_socket->file->f_cred->fsgid; | |
220 | ||
a6c6796c EB |
221 | return from_kgid(&init_user_ns, skgid); |
222 | } | |
e5dfb815 PM |
223 | return 0; |
224 | } | |
225 | ||
9ec13810 PM |
226 | static u32 flow_get_vlan_tag(const struct sk_buff *skb) |
227 | { | |
3f649ab7 | 228 | u16 tag; |
9ec13810 PM |
229 | |
230 | if (vlan_get_tag(skb, &tag) < 0) | |
231 | return 0; | |
232 | return tag & VLAN_VID_MASK; | |
233 | } | |
234 | ||
739a91ef CG |
235 | static u32 flow_get_rxhash(struct sk_buff *skb) |
236 | { | |
3958afa1 | 237 | return skb_get_hash(skb); |
739a91ef CG |
238 | } |
239 | ||
6bd2a9af | 240 | static u32 flow_key_get(struct sk_buff *skb, int key, struct flow_keys *flow) |
e5dfb815 PM |
241 | { |
242 | switch (key) { | |
243 | case FLOW_KEY_SRC: | |
6bd2a9af | 244 | return flow_get_src(skb, flow); |
e5dfb815 | 245 | case FLOW_KEY_DST: |
6bd2a9af | 246 | return flow_get_dst(skb, flow); |
e5dfb815 | 247 | case FLOW_KEY_PROTO: |
6bd2a9af | 248 | return flow_get_proto(skb, flow); |
e5dfb815 | 249 | case FLOW_KEY_PROTO_SRC: |
6bd2a9af | 250 | return flow_get_proto_src(skb, flow); |
e5dfb815 | 251 | case FLOW_KEY_PROTO_DST: |
6bd2a9af | 252 | return flow_get_proto_dst(skb, flow); |
e5dfb815 PM |
253 | case FLOW_KEY_IIF: |
254 | return flow_get_iif(skb); | |
255 | case FLOW_KEY_PRIORITY: | |
256 | return flow_get_priority(skb); | |
257 | case FLOW_KEY_MARK: | |
258 | return flow_get_mark(skb); | |
259 | case FLOW_KEY_NFCT: | |
260 | return flow_get_nfct(skb); | |
261 | case FLOW_KEY_NFCT_SRC: | |
6bd2a9af | 262 | return flow_get_nfct_src(skb, flow); |
e5dfb815 | 263 | case FLOW_KEY_NFCT_DST: |
6bd2a9af | 264 | return flow_get_nfct_dst(skb, flow); |
e5dfb815 | 265 | case FLOW_KEY_NFCT_PROTO_SRC: |
6bd2a9af | 266 | return flow_get_nfct_proto_src(skb, flow); |
e5dfb815 | 267 | case FLOW_KEY_NFCT_PROTO_DST: |
6bd2a9af | 268 | return flow_get_nfct_proto_dst(skb, flow); |
e5dfb815 PM |
269 | case FLOW_KEY_RTCLASSID: |
270 | return flow_get_rtclassid(skb); | |
271 | case FLOW_KEY_SKUID: | |
272 | return flow_get_skuid(skb); | |
273 | case FLOW_KEY_SKGID: | |
274 | return flow_get_skgid(skb); | |
9ec13810 PM |
275 | case FLOW_KEY_VLAN_TAG: |
276 | return flow_get_vlan_tag(skb); | |
739a91ef CG |
277 | case FLOW_KEY_RXHASH: |
278 | return flow_get_rxhash(skb); | |
e5dfb815 PM |
279 | default: |
280 | WARN_ON(1); | |
281 | return 0; | |
282 | } | |
283 | } | |
284 | ||
6bd2a9af ED |
285 | #define FLOW_KEYS_NEEDED ((1 << FLOW_KEY_SRC) | \ |
286 | (1 << FLOW_KEY_DST) | \ | |
287 | (1 << FLOW_KEY_PROTO) | \ | |
288 | (1 << FLOW_KEY_PROTO_SRC) | \ | |
289 | (1 << FLOW_KEY_PROTO_DST) | \ | |
290 | (1 << FLOW_KEY_NFCT_SRC) | \ | |
291 | (1 << FLOW_KEY_NFCT_DST) | \ | |
292 | (1 << FLOW_KEY_NFCT_PROTO_SRC) | \ | |
293 | (1 << FLOW_KEY_NFCT_PROTO_DST)) | |
294 | ||
dc7f9f6e | 295 | static int flow_classify(struct sk_buff *skb, const struct tcf_proto *tp, |
e5dfb815 PM |
296 | struct tcf_result *res) |
297 | { | |
70da9f0b | 298 | struct flow_head *head = rcu_dereference_bh(tp->root); |
e5dfb815 PM |
299 | struct flow_filter *f; |
300 | u32 keymask; | |
301 | u32 classid; | |
302 | unsigned int n, key; | |
303 | int r; | |
304 | ||
70da9f0b | 305 | list_for_each_entry_rcu(f, &head->filters, list) { |
3a53943b | 306 | u32 keys[FLOW_KEY_MAX + 1]; |
6bd2a9af | 307 | struct flow_keys flow_keys; |
e5dfb815 PM |
308 | |
309 | if (!tcf_em_tree_match(skb, &f->ematches, NULL)) | |
310 | continue; | |
311 | ||
312 | keymask = f->keymask; | |
6bd2a9af | 313 | if (keymask & FLOW_KEYS_NEEDED) |
cd79a238 | 314 | skb_flow_dissect_flow_keys(skb, &flow_keys, 0); |
e5dfb815 PM |
315 | |
316 | for (n = 0; n < f->nkeys; n++) { | |
317 | key = ffs(keymask) - 1; | |
318 | keymask &= ~(1 << key); | |
6bd2a9af | 319 | keys[n] = flow_key_get(skb, key, &flow_keys); |
e5dfb815 PM |
320 | } |
321 | ||
322 | if (f->mode == FLOW_MODE_HASH) | |
72d9794f | 323 | classid = jhash2(keys, f->nkeys, f->hashrnd); |
e5dfb815 PM |
324 | else { |
325 | classid = keys[0]; | |
326 | classid = (classid & f->mask) ^ f->xor; | |
327 | classid = (classid >> f->rshift) + f->addend; | |
328 | } | |
329 | ||
330 | if (f->divisor) | |
331 | classid %= f->divisor; | |
332 | ||
333 | res->class = 0; | |
334 | res->classid = TC_H_MAKE(f->baseclass, f->baseclass + classid); | |
335 | ||
336 | r = tcf_exts_exec(skb, &f->exts, res); | |
337 | if (r < 0) | |
338 | continue; | |
339 | return r; | |
340 | } | |
341 | return -1; | |
342 | } | |
343 | ||
cdeabbb8 | 344 | static void flow_perturbation(struct timer_list *t) |
72d9794f | 345 | { |
cdeabbb8 | 346 | struct flow_filter *f = from_timer(f, t, perturb_timer); |
72d9794f PM |
347 | |
348 | get_random_bytes(&f->hashrnd, 4); | |
349 | if (f->perturb_period) | |
350 | mod_timer(&f->perturb_timer, jiffies + f->perturb_period); | |
351 | } | |
352 | ||
e5dfb815 PM |
353 | static const struct nla_policy flow_policy[TCA_FLOW_MAX + 1] = { |
354 | [TCA_FLOW_KEYS] = { .type = NLA_U32 }, | |
355 | [TCA_FLOW_MODE] = { .type = NLA_U32 }, | |
356 | [TCA_FLOW_BASECLASS] = { .type = NLA_U32 }, | |
357 | [TCA_FLOW_RSHIFT] = { .type = NLA_U32 }, | |
358 | [TCA_FLOW_ADDEND] = { .type = NLA_U32 }, | |
359 | [TCA_FLOW_MASK] = { .type = NLA_U32 }, | |
360 | [TCA_FLOW_XOR] = { .type = NLA_U32 }, | |
361 | [TCA_FLOW_DIVISOR] = { .type = NLA_U32 }, | |
362 | [TCA_FLOW_ACT] = { .type = NLA_NESTED }, | |
363 | [TCA_FLOW_POLICE] = { .type = NLA_NESTED }, | |
364 | [TCA_FLOW_EMATCHES] = { .type = NLA_NESTED }, | |
72d9794f | 365 | [TCA_FLOW_PERTURB] = { .type = NLA_U32 }, |
e5dfb815 PM |
366 | }; |
367 | ||
22f7cec9 | 368 | static void __flow_destroy_filter(struct flow_filter *f) |
70da9f0b | 369 | { |
70da9f0b | 370 | del_timer_sync(&f->perturb_timer); |
18d0264f | 371 | tcf_exts_destroy(&f->exts); |
82a470f1 | 372 | tcf_em_tree_destroy(&f->ematches); |
22f7cec9 | 373 | tcf_exts_put_net(&f->exts); |
70da9f0b | 374 | kfree(f); |
22f7cec9 CW |
375 | } |
376 | ||
377 | static void flow_destroy_filter_work(struct work_struct *work) | |
378 | { | |
aaa908ff CW |
379 | struct flow_filter *f = container_of(to_rcu_work(work), |
380 | struct flow_filter, | |
381 | rwork); | |
22f7cec9 CW |
382 | rtnl_lock(); |
383 | __flow_destroy_filter(f); | |
94cdb475 CW |
384 | rtnl_unlock(); |
385 | } | |
386 | ||
c1b52739 | 387 | static int flow_change(struct net *net, struct sk_buff *in_skb, |
af4c6641 | 388 | struct tcf_proto *tp, unsigned long base, |
e5dfb815 | 389 | u32 handle, struct nlattr **tca, |
695176bf | 390 | void **arg, u32 flags, |
12db03b6 | 391 | struct netlink_ext_ack *extack) |
e5dfb815 | 392 | { |
70da9f0b JF |
393 | struct flow_head *head = rtnl_dereference(tp->root); |
394 | struct flow_filter *fold, *fnew; | |
e5dfb815 PM |
395 | struct nlattr *opt = tca[TCA_OPTIONS]; |
396 | struct nlattr *tb[TCA_FLOW_MAX + 1]; | |
e5dfb815 | 397 | unsigned int nkeys = 0; |
72d9794f | 398 | unsigned int perturb_period = 0; |
e5dfb815 PM |
399 | u32 baseclass = 0; |
400 | u32 keymask = 0; | |
401 | u32 mode; | |
402 | int err; | |
403 | ||
404 | if (opt == NULL) | |
405 | return -EINVAL; | |
406 | ||
8cb08174 JB |
407 | err = nla_parse_nested_deprecated(tb, TCA_FLOW_MAX, opt, flow_policy, |
408 | NULL); | |
e5dfb815 PM |
409 | if (err < 0) |
410 | return err; | |
411 | ||
412 | if (tb[TCA_FLOW_BASECLASS]) { | |
413 | baseclass = nla_get_u32(tb[TCA_FLOW_BASECLASS]); | |
414 | if (TC_H_MIN(baseclass) == 0) | |
415 | return -EINVAL; | |
416 | } | |
417 | ||
418 | if (tb[TCA_FLOW_KEYS]) { | |
419 | keymask = nla_get_u32(tb[TCA_FLOW_KEYS]); | |
e5dfb815 PM |
420 | |
421 | nkeys = hweight32(keymask); | |
422 | if (nkeys == 0) | |
423 | return -EINVAL; | |
4f250491 PM |
424 | |
425 | if (fls(keymask) - 1 > FLOW_KEY_MAX) | |
426 | return -EOPNOTSUPP; | |
a6c6796c EB |
427 | |
428 | if ((keymask & (FLOW_KEY_SKUID|FLOW_KEY_SKGID)) && | |
e32123e5 | 429 | sk_user_ns(NETLINK_CB(in_skb).sk) != &init_user_ns) |
a6c6796c | 430 | return -EOPNOTSUPP; |
e5dfb815 PM |
431 | } |
432 | ||
70da9f0b JF |
433 | fnew = kzalloc(sizeof(*fnew), GFP_KERNEL); |
434 | if (!fnew) | |
c09fc2e1 | 435 | return -ENOBUFS; |
4ebc1e3c JP |
436 | |
437 | err = tcf_em_tree_validate(tp, tb[TCA_FLOW_EMATCHES], &fnew->ematches); | |
438 | if (err < 0) | |
c09fc2e1 | 439 | goto err1; |
70da9f0b | 440 | |
14215108 | 441 | err = tcf_exts_init(&fnew->exts, net, TCA_FLOW_ACT, TCA_FLOW_POLICE); |
b9a24bb7 | 442 | if (err < 0) |
c09fc2e1 JP |
443 | goto err2; |
444 | ||
695176bf CW |
445 | err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &fnew->exts, flags, |
446 | extack); | |
c09fc2e1 JP |
447 | if (err < 0) |
448 | goto err2; | |
32b2f4b1 | 449 | |
8113c095 | 450 | fold = *arg; |
70da9f0b | 451 | if (fold) { |
e5dfb815 | 452 | err = -EINVAL; |
70da9f0b | 453 | if (fold->handle != handle && handle) |
c09fc2e1 | 454 | goto err2; |
e5dfb815 | 455 | |
70da9f0b | 456 | /* Copy fold into fnew */ |
70da9f0b | 457 | fnew->tp = fold->tp; |
70da9f0b JF |
458 | fnew->handle = fold->handle; |
459 | fnew->nkeys = fold->nkeys; | |
460 | fnew->keymask = fold->keymask; | |
461 | fnew->mode = fold->mode; | |
462 | fnew->mask = fold->mask; | |
463 | fnew->xor = fold->xor; | |
464 | fnew->rshift = fold->rshift; | |
465 | fnew->addend = fold->addend; | |
466 | fnew->divisor = fold->divisor; | |
467 | fnew->baseclass = fold->baseclass; | |
468 | fnew->hashrnd = fold->hashrnd; | |
469 | ||
470 | mode = fold->mode; | |
e5dfb815 PM |
471 | if (tb[TCA_FLOW_MODE]) |
472 | mode = nla_get_u32(tb[TCA_FLOW_MODE]); | |
473 | if (mode != FLOW_MODE_HASH && nkeys > 1) | |
c09fc2e1 | 474 | goto err2; |
72d9794f PM |
475 | |
476 | if (mode == FLOW_MODE_HASH) | |
70da9f0b | 477 | perturb_period = fold->perturb_period; |
72d9794f PM |
478 | if (tb[TCA_FLOW_PERTURB]) { |
479 | if (mode != FLOW_MODE_HASH) | |
c09fc2e1 | 480 | goto err2; |
72d9794f PM |
481 | perturb_period = nla_get_u32(tb[TCA_FLOW_PERTURB]) * HZ; |
482 | } | |
e5dfb815 PM |
483 | } else { |
484 | err = -EINVAL; | |
485 | if (!handle) | |
c09fc2e1 | 486 | goto err2; |
e5dfb815 | 487 | if (!tb[TCA_FLOW_KEYS]) |
c09fc2e1 | 488 | goto err2; |
e5dfb815 PM |
489 | |
490 | mode = FLOW_MODE_MAP; | |
491 | if (tb[TCA_FLOW_MODE]) | |
492 | mode = nla_get_u32(tb[TCA_FLOW_MODE]); | |
493 | if (mode != FLOW_MODE_HASH && nkeys > 1) | |
c09fc2e1 | 494 | goto err2; |
e5dfb815 | 495 | |
72d9794f PM |
496 | if (tb[TCA_FLOW_PERTURB]) { |
497 | if (mode != FLOW_MODE_HASH) | |
c09fc2e1 | 498 | goto err2; |
72d9794f PM |
499 | perturb_period = nla_get_u32(tb[TCA_FLOW_PERTURB]) * HZ; |
500 | } | |
501 | ||
1abf2720 JP |
502 | if (TC_H_MAJ(baseclass) == 0) { |
503 | struct Qdisc *q = tcf_block_q(tp->chain->block); | |
504 | ||
505 | baseclass = TC_H_MAKE(q->handle, baseclass); | |
506 | } | |
e5dfb815 PM |
507 | if (TC_H_MIN(baseclass) == 0) |
508 | baseclass = TC_H_MAKE(baseclass, 1); | |
509 | ||
70da9f0b JF |
510 | fnew->handle = handle; |
511 | fnew->mask = ~0U; | |
512 | fnew->tp = tp; | |
513 | get_random_bytes(&fnew->hashrnd, 4); | |
e5dfb815 PM |
514 | } |
515 | ||
cdeabbb8 | 516 | timer_setup(&fnew->perturb_timer, flow_perturbation, TIMER_DEFERRABLE); |
e5dfb815 | 517 | |
f36fe1c4 | 518 | tcf_block_netif_keep_dst(tp->chain->block); |
02875878 | 519 | |
e5dfb815 | 520 | if (tb[TCA_FLOW_KEYS]) { |
70da9f0b JF |
521 | fnew->keymask = keymask; |
522 | fnew->nkeys = nkeys; | |
e5dfb815 PM |
523 | } |
524 | ||
70da9f0b | 525 | fnew->mode = mode; |
e5dfb815 PM |
526 | |
527 | if (tb[TCA_FLOW_MASK]) | |
70da9f0b | 528 | fnew->mask = nla_get_u32(tb[TCA_FLOW_MASK]); |
e5dfb815 | 529 | if (tb[TCA_FLOW_XOR]) |
70da9f0b | 530 | fnew->xor = nla_get_u32(tb[TCA_FLOW_XOR]); |
e5dfb815 | 531 | if (tb[TCA_FLOW_RSHIFT]) |
70da9f0b | 532 | fnew->rshift = nla_get_u32(tb[TCA_FLOW_RSHIFT]); |
e5dfb815 | 533 | if (tb[TCA_FLOW_ADDEND]) |
70da9f0b | 534 | fnew->addend = nla_get_u32(tb[TCA_FLOW_ADDEND]); |
e5dfb815 PM |
535 | |
536 | if (tb[TCA_FLOW_DIVISOR]) | |
70da9f0b | 537 | fnew->divisor = nla_get_u32(tb[TCA_FLOW_DIVISOR]); |
e5dfb815 | 538 | if (baseclass) |
70da9f0b | 539 | fnew->baseclass = baseclass; |
e5dfb815 | 540 | |
70da9f0b | 541 | fnew->perturb_period = perturb_period; |
72d9794f | 542 | if (perturb_period) |
70da9f0b | 543 | mod_timer(&fnew->perturb_timer, jiffies + perturb_period); |
72d9794f | 544 | |
8113c095 | 545 | if (!*arg) |
70da9f0b JF |
546 | list_add_tail_rcu(&fnew->list, &head->filters); |
547 | else | |
32b2f4b1 | 548 | list_replace_rcu(&fold->list, &fnew->list); |
e5dfb815 | 549 | |
8113c095 | 550 | *arg = fnew; |
e5dfb815 | 551 | |
22f7cec9 CW |
552 | if (fold) { |
553 | tcf_exts_get_net(&fold->exts); | |
aaa908ff | 554 | tcf_queue_work(&fold->rwork, flow_destroy_filter_work); |
22f7cec9 | 555 | } |
e5dfb815 PM |
556 | return 0; |
557 | ||
c09fc2e1 | 558 | err2: |
b9a24bb7 | 559 | tcf_exts_destroy(&fnew->exts); |
4ebc1e3c | 560 | tcf_em_tree_destroy(&fnew->ematches); |
e5dfb815 | 561 | err1: |
c09fc2e1 | 562 | kfree(fnew); |
e5dfb815 PM |
563 | return err; |
564 | } | |
565 | ||
571acf21 | 566 | static int flow_delete(struct tcf_proto *tp, void *arg, bool *last, |
12db03b6 | 567 | bool rtnl_held, struct netlink_ext_ack *extack) |
e5dfb815 | 568 | { |
763dbf63 | 569 | struct flow_head *head = rtnl_dereference(tp->root); |
8113c095 | 570 | struct flow_filter *f = arg; |
e5dfb815 | 571 | |
70da9f0b | 572 | list_del_rcu(&f->list); |
22f7cec9 | 573 | tcf_exts_get_net(&f->exts); |
aaa908ff | 574 | tcf_queue_work(&f->rwork, flow_destroy_filter_work); |
763dbf63 | 575 | *last = list_empty(&head->filters); |
e5dfb815 PM |
576 | return 0; |
577 | } | |
578 | ||
579 | static int flow_init(struct tcf_proto *tp) | |
580 | { | |
581 | struct flow_head *head; | |
582 | ||
e5dfb815 PM |
583 | head = kzalloc(sizeof(*head), GFP_KERNEL); |
584 | if (head == NULL) | |
585 | return -ENOBUFS; | |
586 | INIT_LIST_HEAD(&head->filters); | |
70da9f0b | 587 | rcu_assign_pointer(tp->root, head); |
e5dfb815 PM |
588 | return 0; |
589 | } | |
590 | ||
12db03b6 VB |
591 | static void flow_destroy(struct tcf_proto *tp, bool rtnl_held, |
592 | struct netlink_ext_ack *extack) | |
e5dfb815 | 593 | { |
70da9f0b | 594 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
595 | struct flow_filter *f, *next; |
596 | ||
597 | list_for_each_entry_safe(f, next, &head->filters, list) { | |
70da9f0b | 598 | list_del_rcu(&f->list); |
22f7cec9 | 599 | if (tcf_exts_get_net(&f->exts)) |
aaa908ff | 600 | tcf_queue_work(&f->rwork, flow_destroy_filter_work); |
22f7cec9 CW |
601 | else |
602 | __flow_destroy_filter(f); | |
e5dfb815 | 603 | } |
70da9f0b | 604 | kfree_rcu(head, rcu); |
e5dfb815 PM |
605 | } |
606 | ||
8113c095 | 607 | static void *flow_get(struct tcf_proto *tp, u32 handle) |
e5dfb815 | 608 | { |
70da9f0b | 609 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
610 | struct flow_filter *f; |
611 | ||
6a659cd0 | 612 | list_for_each_entry(f, &head->filters, list) |
e5dfb815 | 613 | if (f->handle == handle) |
8113c095 WC |
614 | return f; |
615 | return NULL; | |
e5dfb815 PM |
616 | } |
617 | ||
8113c095 | 618 | static int flow_dump(struct net *net, struct tcf_proto *tp, void *fh, |
12db03b6 | 619 | struct sk_buff *skb, struct tcmsg *t, bool rtnl_held) |
e5dfb815 | 620 | { |
8113c095 | 621 | struct flow_filter *f = fh; |
e5dfb815 PM |
622 | struct nlattr *nest; |
623 | ||
624 | if (f == NULL) | |
625 | return skb->len; | |
626 | ||
627 | t->tcm_handle = f->handle; | |
628 | ||
ae0be8de | 629 | nest = nla_nest_start_noflag(skb, TCA_OPTIONS); |
e5dfb815 PM |
630 | if (nest == NULL) |
631 | goto nla_put_failure; | |
632 | ||
1b34ec43 DM |
633 | if (nla_put_u32(skb, TCA_FLOW_KEYS, f->keymask) || |
634 | nla_put_u32(skb, TCA_FLOW_MODE, f->mode)) | |
635 | goto nla_put_failure; | |
e5dfb815 PM |
636 | |
637 | if (f->mask != ~0 || f->xor != 0) { | |
1b34ec43 DM |
638 | if (nla_put_u32(skb, TCA_FLOW_MASK, f->mask) || |
639 | nla_put_u32(skb, TCA_FLOW_XOR, f->xor)) | |
640 | goto nla_put_failure; | |
e5dfb815 | 641 | } |
1b34ec43 DM |
642 | if (f->rshift && |
643 | nla_put_u32(skb, TCA_FLOW_RSHIFT, f->rshift)) | |
644 | goto nla_put_failure; | |
645 | if (f->addend && | |
646 | nla_put_u32(skb, TCA_FLOW_ADDEND, f->addend)) | |
647 | goto nla_put_failure; | |
e5dfb815 | 648 | |
1b34ec43 DM |
649 | if (f->divisor && |
650 | nla_put_u32(skb, TCA_FLOW_DIVISOR, f->divisor)) | |
651 | goto nla_put_failure; | |
652 | if (f->baseclass && | |
653 | nla_put_u32(skb, TCA_FLOW_BASECLASS, f->baseclass)) | |
654 | goto nla_put_failure; | |
e5dfb815 | 655 | |
1b34ec43 DM |
656 | if (f->perturb_period && |
657 | nla_put_u32(skb, TCA_FLOW_PERTURB, f->perturb_period / HZ)) | |
658 | goto nla_put_failure; | |
72d9794f | 659 | |
5da57f42 | 660 | if (tcf_exts_dump(skb, &f->exts) < 0) |
e5dfb815 | 661 | goto nla_put_failure; |
0aead543 | 662 | #ifdef CONFIG_NET_EMATCH |
e5dfb815 PM |
663 | if (f->ematches.hdr.nmatches && |
664 | tcf_em_tree_dump(skb, &f->ematches, TCA_FLOW_EMATCHES) < 0) | |
665 | goto nla_put_failure; | |
0aead543 | 666 | #endif |
e5dfb815 PM |
667 | nla_nest_end(skb, nest); |
668 | ||
5da57f42 | 669 | if (tcf_exts_dump_stats(skb, &f->exts) < 0) |
e5dfb815 PM |
670 | goto nla_put_failure; |
671 | ||
672 | return skb->len; | |
673 | ||
674 | nla_put_failure: | |
6ea3b446 | 675 | nla_nest_cancel(skb, nest); |
e5dfb815 PM |
676 | return -1; |
677 | } | |
678 | ||
12db03b6 VB |
679 | static void flow_walk(struct tcf_proto *tp, struct tcf_walker *arg, |
680 | bool rtnl_held) | |
e5dfb815 | 681 | { |
70da9f0b | 682 | struct flow_head *head = rtnl_dereference(tp->root); |
e5dfb815 PM |
683 | struct flow_filter *f; |
684 | ||
6a659cd0 | 685 | list_for_each_entry(f, &head->filters, list) { |
e5dfb815 PM |
686 | if (arg->count < arg->skip) |
687 | goto skip; | |
8113c095 | 688 | if (arg->fn(tp, f, arg) < 0) { |
e5dfb815 PM |
689 | arg->stop = 1; |
690 | break; | |
691 | } | |
692 | skip: | |
693 | arg->count++; | |
694 | } | |
695 | } | |
696 | ||
697 | static struct tcf_proto_ops cls_flow_ops __read_mostly = { | |
698 | .kind = "flow", | |
699 | .classify = flow_classify, | |
700 | .init = flow_init, | |
701 | .destroy = flow_destroy, | |
702 | .change = flow_change, | |
703 | .delete = flow_delete, | |
704 | .get = flow_get, | |
e5dfb815 PM |
705 | .dump = flow_dump, |
706 | .walk = flow_walk, | |
707 | .owner = THIS_MODULE, | |
708 | }; | |
709 | ||
710 | static int __init cls_flow_init(void) | |
711 | { | |
712 | return register_tcf_proto_ops(&cls_flow_ops); | |
713 | } | |
714 | ||
715 | static void __exit cls_flow_exit(void) | |
716 | { | |
717 | unregister_tcf_proto_ops(&cls_flow_ops); | |
718 | } | |
719 | ||
720 | module_init(cls_flow_init); | |
721 | module_exit(cls_flow_exit); | |
722 | ||
723 | MODULE_LICENSE("GPL"); | |
724 | MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>"); | |
725 | MODULE_DESCRIPTION("TC flow classifier"); |