]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - net/sched/act_police.c
net sched actions police: peg drop stats for conforming traffic
[mirror_ubuntu-artful-kernel.git] / net / sched / act_police.c
CommitLineData
1da177e4 1/*
0c6965dd 2 * net/sched/act_police.c Input police filter
1da177e4
LT
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 * J Hadi Salim (action changes)
11 */
12
1da177e4
LT
13#include <linux/module.h>
14#include <linux/types.h>
15#include <linux/kernel.h>
1da177e4 16#include <linux/string.h>
1da177e4 17#include <linux/errno.h>
1da177e4 18#include <linux/skbuff.h>
1da177e4
LT
19#include <linux/rtnetlink.h>
20#include <linux/init.h>
5a0e3ad6 21#include <linux/slab.h>
1da177e4 22#include <net/act_api.h>
dc5fc579 23#include <net/netlink.h>
1da177e4 24
0e243218 25struct tcf_police {
ec0595cc 26 struct tc_action common;
0e243218
JP
27 int tcfp_result;
28 u32 tcfp_ewma_rate;
c6d14ff1 29 s64 tcfp_burst;
0e243218 30 u32 tcfp_mtu;
c6d14ff1
JP
31 s64 tcfp_toks;
32 s64 tcfp_ptoks;
33 s64 tcfp_mtu_ptoks;
34 s64 tcfp_t_c;
35 struct psched_ratecfg rate;
36 bool rate_present;
37 struct psched_ratecfg peak;
38 bool peak_present;
0e243218 39};
a85a970a
WC
40
/*
 * Cast a struct tc_action pointer to the struct tcf_police that embeds it
 * as its first member.  The argument is parenthesized so that an expression
 * argument (e.g. "p + n") is cast as a whole rather than only its first
 * operand.
 */
#define to_police(pc) ((struct tcf_police *)(pc))
0e243218 42
/* Mask argument handed to tc_action_net_init() in police_init_net(). */
#define POL_TAB_MASK	15
1da177e4 44
1e9b3d53 45/* old policer structure from before tc actions */
cc7ec456 46struct tc_police_compat {
1e9b3d53
PM
47 u32 index;
48 int action;
49 u32 limit;
50 u32 burst;
51 u32 mtu;
52 struct tc_ratespec rate;
53 struct tc_ratespec peakrate;
54};
55
e9ce1cd3 56/* Each policer is serialized by its individual spinlock */
1da177e4 57
ddf97ccd 58static int police_net_id;
a85a970a 59static struct tc_action_ops act_police_ops;
ddf97ccd
WC
60
61static int tcf_act_police_walker(struct net *net, struct sk_buff *skb,
62 struct netlink_callback *cb, int type,
a85a970a 63 const struct tc_action_ops *ops)
1da177e4 64{
ddf97ccd 65 struct tc_action_net *tn = net_generic(net, police_net_id);
1da177e4 66
b5ac8518 67 return tcf_generic_walker(tn, skb, cb, type, ops);
1da177e4 68}
1da177e4 69
53b2bf3f
PM
70static const struct nla_policy police_policy[TCA_POLICE_MAX + 1] = {
71 [TCA_POLICE_RATE] = { .len = TC_RTAB_SIZE },
72 [TCA_POLICE_PEAKRATE] = { .len = TC_RTAB_SIZE },
73 [TCA_POLICE_AVRATE] = { .type = NLA_U32 },
74 [TCA_POLICE_RESULT] = { .type = NLA_U32 },
75};
76
d9fa17ef 77static int tcf_act_police_init(struct net *net, struct nlattr *nla,
a85a970a 78 struct nlattr *est, struct tc_action **a,
d9fa17ef 79 int ovr, int bind)
1da177e4 80{
1da177e4 81 int ret = 0, err;
7ba699c6 82 struct nlattr *tb[TCA_POLICE_MAX + 1];
1da177e4 83 struct tc_police *parm;
e9ce1cd3 84 struct tcf_police *police;
1da177e4 85 struct qdisc_rate_table *R_tab = NULL, *P_tab = NULL;
ddf97ccd 86 struct tc_action_net *tn = net_generic(net, police_net_id);
0852e455 87 bool exists = false;
1e9b3d53 88 int size;
1da177e4 89
cee63723 90 if (nla == NULL)
1da177e4
LT
91 return -EINVAL;
92
53b2bf3f 93 err = nla_parse_nested(tb, TCA_POLICE_MAX, nla, police_policy);
cee63723
PM
94 if (err < 0)
95 return err;
96
7ba699c6 97 if (tb[TCA_POLICE_TBF] == NULL)
1e9b3d53 98 return -EINVAL;
7ba699c6 99 size = nla_len(tb[TCA_POLICE_TBF]);
1e9b3d53 100 if (size != sizeof(*parm) && size != sizeof(struct tc_police_compat))
1da177e4 101 return -EINVAL;
0852e455 102
7ba699c6 103 parm = nla_data(tb[TCA_POLICE_TBF]);
0852e455
WC
104 exists = tcf_hash_check(tn, parm->index, a, bind);
105 if (exists && bind)
106 return 0;
1da177e4 107
0852e455 108 if (!exists) {
a03e6fe5 109 ret = tcf_hash_create(tn, parm->index, NULL, a,
a85a970a 110 &act_police_ops, bind, false);
a03e6fe5
WC
111 if (ret)
112 return ret;
113 ret = ACT_P_CREATED;
0852e455
WC
114 } else {
115 tcf_hash_release(*a, bind);
116 if (!ovr)
117 return -EEXIST;
1da177e4
LT
118 }
119
a85a970a 120 police = to_police(*a);
1da177e4
LT
121 if (parm->rate.rate) {
122 err = -ENOMEM;
7ba699c6 123 R_tab = qdisc_get_rtab(&parm->rate, tb[TCA_POLICE_RATE]);
1da177e4
LT
124 if (R_tab == NULL)
125 goto failure;
c1b56878 126
1da177e4
LT
127 if (parm->peakrate.rate) {
128 P_tab = qdisc_get_rtab(&parm->peakrate,
7ba699c6 129 tb[TCA_POLICE_PEAKRATE]);
71bcb09a 130 if (P_tab == NULL)
1da177e4 131 goto failure;
1da177e4
LT
132 }
133 }
71bcb09a 134
e9ce1cd3 135 spin_lock_bh(&police->tcf_lock);
71bcb09a 136 if (est) {
22e0f8b9 137 err = gen_replace_estimator(&police->tcf_bstats, NULL,
71bcb09a 138 &police->tcf_rate_est,
edb09eb1
ED
139 &police->tcf_lock,
140 NULL, est);
71bcb09a
SH
141 if (err)
142 goto failure_unlock;
a883bf56
JP
143 } else if (tb[TCA_POLICE_AVRATE] &&
144 (ret == ACT_P_CREATED ||
145 !gen_estimator_active(&police->tcf_bstats,
146 &police->tcf_rate_est))) {
147 err = -EINVAL;
148 goto failure_unlock;
71bcb09a
SH
149 }
150
151 /* No failure allowed after this point */
c6d14ff1
JP
152 police->tcfp_mtu = parm->mtu;
153 if (police->tcfp_mtu == 0) {
154 police->tcfp_mtu = ~0;
155 if (R_tab)
156 police->tcfp_mtu = 255 << R_tab->rate.cell_log;
157 }
158 if (R_tab) {
159 police->rate_present = true;
3e1e3aae 160 psched_ratecfg_precompute(&police->rate, &R_tab->rate, 0);
c6d14ff1
JP
161 qdisc_put_rtab(R_tab);
162 } else {
163 police->rate_present = false;
1da177e4 164 }
c6d14ff1
JP
165 if (P_tab) {
166 police->peak_present = true;
3e1e3aae 167 psched_ratecfg_precompute(&police->peak, &P_tab->rate, 0);
c6d14ff1
JP
168 qdisc_put_rtab(P_tab);
169 } else {
170 police->peak_present = false;
1da177e4
LT
171 }
172
7ba699c6 173 if (tb[TCA_POLICE_RESULT])
1587bac4 174 police->tcfp_result = nla_get_u32(tb[TCA_POLICE_RESULT]);
c6d14ff1
JP
175 police->tcfp_burst = PSCHED_TICKS2NS(parm->burst);
176 police->tcfp_toks = police->tcfp_burst;
177 if (police->peak_present) {
178 police->tcfp_mtu_ptoks = (s64) psched_l2t_ns(&police->peak,
179 police->tcfp_mtu);
180 police->tcfp_ptoks = police->tcfp_mtu_ptoks;
1da177e4 181 }
e9ce1cd3 182 police->tcf_action = parm->action;
1da177e4 183
7ba699c6 184 if (tb[TCA_POLICE_AVRATE])
1587bac4 185 police->tcfp_ewma_rate = nla_get_u32(tb[TCA_POLICE_AVRATE]);
1da177e4 186
e9ce1cd3 187 spin_unlock_bh(&police->tcf_lock);
1da177e4
LT
188 if (ret != ACT_P_CREATED)
189 return ret;
190
d2de875c 191 police->tcfp_t_c = ktime_get_ns();
a85a970a 192 tcf_hash_insert(tn, *a);
1da177e4 193
1da177e4
LT
194 return ret;
195
71bcb09a
SH
196failure_unlock:
197 spin_unlock_bh(&police->tcf_lock);
1da177e4 198failure:
3b69a4c9
YY
199 qdisc_put_rtab(P_tab);
200 qdisc_put_rtab(R_tab);
1da177e4 201 if (ret == ACT_P_CREATED)
a85a970a 202 tcf_hash_cleanup(*a, est);
1da177e4
LT
203 return err;
204}
205
dc7f9f6e 206static int tcf_act_police(struct sk_buff *skb, const struct tc_action *a,
10297b99 207 struct tcf_result *res)
1da177e4 208{
a85a970a 209 struct tcf_police *police = to_police(a);
c6d14ff1
JP
210 s64 now;
211 s64 toks;
212 s64 ptoks = 0;
1da177e4 213
e9ce1cd3 214 spin_lock(&police->tcf_lock);
1da177e4 215
bfe0d029 216 bstats_update(&police->tcf_bstats, skb);
3d3ed181 217 tcf_lastuse_update(&police->tcf_tm);
1da177e4 218
e9ce1cd3
DM
219 if (police->tcfp_ewma_rate &&
220 police->tcf_rate_est.bps >= police->tcfp_ewma_rate) {
221 police->tcf_qstats.overlimits++;
b9647580
JP
222 if (police->tcf_action == TC_ACT_SHOT)
223 police->tcf_qstats.drops++;
e9ce1cd3
DM
224 spin_unlock(&police->tcf_lock);
225 return police->tcf_action;
1da177e4 226 }
1da177e4 227
0abf77e5 228 if (qdisc_pkt_len(skb) <= police->tcfp_mtu) {
c6d14ff1 229 if (!police->rate_present) {
e9ce1cd3
DM
230 spin_unlock(&police->tcf_lock);
231 return police->tcfp_result;
1da177e4
LT
232 }
233
d2de875c 234 now = ktime_get_ns();
c6d14ff1
JP
235 toks = min_t(s64, now - police->tcfp_t_c,
236 police->tcfp_burst);
237 if (police->peak_present) {
e9ce1cd3 238 ptoks = toks + police->tcfp_ptoks;
c6d14ff1
JP
239 if (ptoks > police->tcfp_mtu_ptoks)
240 ptoks = police->tcfp_mtu_ptoks;
241 ptoks -= (s64) psched_l2t_ns(&police->peak,
242 qdisc_pkt_len(skb));
1da177e4 243 }
e9ce1cd3 244 toks += police->tcfp_toks;
c6d14ff1 245 if (toks > police->tcfp_burst)
e9ce1cd3 246 toks = police->tcfp_burst;
c6d14ff1 247 toks -= (s64) psched_l2t_ns(&police->rate, qdisc_pkt_len(skb));
1da177e4 248 if ((toks|ptoks) >= 0) {
e9ce1cd3
DM
249 police->tcfp_t_c = now;
250 police->tcfp_toks = toks;
251 police->tcfp_ptoks = ptoks;
f71b109f
RM
252 if (police->tcfp_result == TC_ACT_SHOT)
253 police->tcf_qstats.drops++;
e9ce1cd3
DM
254 spin_unlock(&police->tcf_lock);
255 return police->tcfp_result;
1da177e4
LT
256 }
257 }
258
e9ce1cd3 259 police->tcf_qstats.overlimits++;
b9647580
JP
260 if (police->tcf_action == TC_ACT_SHOT)
261 police->tcf_qstats.drops++;
e9ce1cd3
DM
262 spin_unlock(&police->tcf_lock);
263 return police->tcf_action;
1da177e4
LT
264}
265
266static int
267tcf_act_police_dump(struct sk_buff *skb, struct tc_action *a, int bind, int ref)
268{
27a884dc 269 unsigned char *b = skb_tail_pointer(skb);
a85a970a 270 struct tcf_police *police = to_police(a);
0f04cfd0
JM
271 struct tc_police opt = {
272 .index = police->tcf_index,
273 .action = police->tcf_action,
274 .mtu = police->tcfp_mtu,
c6d14ff1 275 .burst = PSCHED_NS2TICKS(police->tcfp_burst),
0f04cfd0
JM
276 .refcnt = police->tcf_refcnt - ref,
277 .bindcnt = police->tcf_bindcnt - bind,
278 };
3d3ed181 279 struct tcf_t t;
0f04cfd0 280
c6d14ff1 281 if (police->rate_present)
01cb71d2 282 psched_ratecfg_getrate(&opt.rate, &police->rate);
c6d14ff1 283 if (police->peak_present)
01cb71d2 284 psched_ratecfg_getrate(&opt.peakrate, &police->peak);
1b34ec43
DM
285 if (nla_put(skb, TCA_POLICE_TBF, sizeof(opt), &opt))
286 goto nla_put_failure;
287 if (police->tcfp_result &&
288 nla_put_u32(skb, TCA_POLICE_RESULT, police->tcfp_result))
289 goto nla_put_failure;
290 if (police->tcfp_ewma_rate &&
291 nla_put_u32(skb, TCA_POLICE_AVRATE, police->tcfp_ewma_rate))
292 goto nla_put_failure;
3d3ed181
JHS
293
294 t.install = jiffies_to_clock_t(jiffies - police->tcf_tm.install);
295 t.lastuse = jiffies_to_clock_t(jiffies - police->tcf_tm.lastuse);
53eb440f 296 t.firstuse = jiffies_to_clock_t(jiffies - police->tcf_tm.firstuse);
3d3ed181
JHS
297 t.expires = jiffies_to_clock_t(police->tcf_tm.expires);
298 if (nla_put_64bit(skb, TCA_POLICE_TM, sizeof(t), &t, TCA_POLICE_PAD))
299 goto nla_put_failure;
300
1da177e4
LT
301 return skb->len;
302
7ba699c6 303nla_put_failure:
dc5fc579 304 nlmsg_trim(skb, b);
1da177e4
LT
305 return -1;
306}
307
a85a970a 308static int tcf_police_search(struct net *net, struct tc_action **a, u32 index)
ddf97ccd
WC
309{
310 struct tc_action_net *tn = net_generic(net, police_net_id);
311
312 return tcf_hash_search(tn, a, index);
313}
314
1da177e4
LT
315MODULE_AUTHOR("Alexey Kuznetsov");
316MODULE_DESCRIPTION("Policing actions");
317MODULE_LICENSE("GPL");
318
319static struct tc_action_ops act_police_ops = {
320 .kind = "police",
321 .type = TCA_ID_POLICE,
1da177e4
LT
322 .owner = THIS_MODULE,
323 .act = tcf_act_police,
324 .dump = tcf_act_police_dump,
d9fa17ef 325 .init = tcf_act_police_init,
ddf97ccd
WC
326 .walk = tcf_act_police_walker,
327 .lookup = tcf_police_search,
a85a970a 328 .size = sizeof(struct tcf_police),
ddf97ccd
WC
329};
330
331static __net_init int police_init_net(struct net *net)
332{
333 struct tc_action_net *tn = net_generic(net, police_net_id);
334
335 return tc_action_net_init(tn, &act_police_ops, POL_TAB_MASK);
336}
337
338static void __net_exit police_exit_net(struct net *net)
339{
340 struct tc_action_net *tn = net_generic(net, police_net_id);
341
342 tc_action_net_exit(tn);
343}
344
345static struct pernet_operations police_net_ops = {
346 .init = police_init_net,
347 .exit = police_exit_net,
348 .id = &police_net_id,
349 .size = sizeof(struct tc_action_net),
1da177e4
LT
350};
351
352static int __init
353police_init_module(void)
354{
ddf97ccd 355 return tcf_register_action(&act_police_ops, &police_net_ops);
1da177e4
LT
356}
357
358static void __exit
359police_cleanup_module(void)
360{
ddf97ccd 361 tcf_unregister_action(&act_police_ops, &police_net_ops);
1da177e4
LT
362}
363
/* Hook the init/cleanup functions into module load and unload. */
module_init(police_init_module);
module_exit(police_cleanup_module);