cls_fw.c 9.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452
  /*
   * net/sched/cls_fw.c	Classifier mapping ipchains' fwmark to traffic class.
   *
   *		This program is free software; you can redistribute it and/or
   *		modify it under the terms of the GNU General Public License
   *		as published by the Free Software Foundation; either version
   *		2 of the License, or (at your option) any later version.
   *
   * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
   *
   * Changes:
   * Karlis Peisenieks <karlis@mt.lv> : 990415 : fw_walk off by one
   * Karlis Peisenieks <karlis@mt.lv> : 990415 : fw_delete killed all the filter (and kernel).
   * Alex <alex@pilotsoft.com> : 2004xxyy: Added Action extension
   *
   * JHS: We should remove the CONFIG_NET_CLS_IND from here
   * eventually when the meta match extension is made available
   *
   */
  20. #include <linux/module.h>
  21. #include <linux/slab.h>
  22. #include <linux/types.h>
  23. #include <linux/kernel.h>
  24. #include <linux/string.h>
  25. #include <linux/errno.h>
  26. #include <linux/skbuff.h>
  27. #include <net/netlink.h>
  28. #include <net/act_api.h>
  29. #include <net/pkt_cls.h>
  30. #define HTSIZE 256
  31. struct fw_head {
  32. u32 mask;
  33. struct fw_filter __rcu *ht[HTSIZE];
  34. struct rcu_head rcu;
  35. };
  36. struct fw_filter {
  37. struct fw_filter __rcu *next;
  38. u32 id;
  39. struct tcf_result res;
  40. #ifdef CONFIG_NET_CLS_IND
  41. int ifindex;
  42. #endif /* CONFIG_NET_CLS_IND */
  43. struct tcf_exts exts;
  44. struct tcf_proto *tp;
  45. struct rcu_head rcu;
  46. };
  47. static u32 fw_hash(u32 handle)
  48. {
  49. handle ^= (handle >> 16);
  50. handle ^= (handle >> 8);
  51. return handle % HTSIZE;
  52. }
  53. static int fw_classify(struct sk_buff *skb, const struct tcf_proto *tp,
  54. struct tcf_result *res)
  55. {
  56. struct fw_head *head = rcu_dereference_bh(tp->root);
  57. struct fw_filter *f;
  58. int r;
  59. u32 id = skb->mark;
  60. if (head != NULL) {
  61. id &= head->mask;
  62. for (f = rcu_dereference_bh(head->ht[fw_hash(id)]); f;
  63. f = rcu_dereference_bh(f->next)) {
  64. if (f->id == id) {
  65. *res = f->res;
  66. #ifdef CONFIG_NET_CLS_IND
  67. if (!tcf_match_indev(skb, f->ifindex))
  68. continue;
  69. #endif /* CONFIG_NET_CLS_IND */
  70. r = tcf_exts_exec(skb, &f->exts, res);
  71. if (r < 0)
  72. continue;
  73. return r;
  74. }
  75. }
  76. } else {
  77. /* Old method: classify the packet using its skb mark. */
  78. if (id && (TC_H_MAJ(id) == 0 ||
  79. !(TC_H_MAJ(id ^ tp->q->handle)))) {
  80. res->classid = id;
  81. res->class = 0;
  82. return 0;
  83. }
  84. }
  85. return -1;
  86. }
  87. static unsigned long fw_get(struct tcf_proto *tp, u32 handle)
  88. {
  89. struct fw_head *head = rtnl_dereference(tp->root);
  90. struct fw_filter *f;
  91. if (head == NULL)
  92. return 0;
  93. f = rtnl_dereference(head->ht[fw_hash(handle)]);
  94. for (; f; f = rtnl_dereference(f->next)) {
  95. if (f->id == handle)
  96. return (unsigned long)f;
  97. }
  98. return 0;
  99. }
  /*
   * Classifier init hook.
   *
   * Nothing is set up here: the fw_head is only needed once a filter is
   * added, and the old (table-less) method works without it, so fw_change()
   * allocates it on demand.  Always returns 0.
   */
  static int fw_init(struct tcf_proto *tp)
  {
      return 0;
  }
  107. static void fw_delete_filter(struct rcu_head *head)
  108. {
  109. struct fw_filter *f = container_of(head, struct fw_filter, rcu);
  110. tcf_exts_destroy(&f->exts);
  111. kfree(f);
  112. }
  113. static void fw_destroy(struct tcf_proto *tp)
  114. {
  115. struct fw_head *head = rtnl_dereference(tp->root);
  116. struct fw_filter *f;
  117. int h;
  118. if (head == NULL)
  119. return;
  120. for (h = 0; h < HTSIZE; h++) {
  121. while ((f = rtnl_dereference(head->ht[h])) != NULL) {
  122. RCU_INIT_POINTER(head->ht[h],
  123. rtnl_dereference(f->next));
  124. tcf_unbind_filter(tp, &f->res);
  125. call_rcu(&f->rcu, fw_delete_filter);
  126. }
  127. }
  128. kfree_rcu(head, rcu);
  129. }
  130. static int fw_delete(struct tcf_proto *tp, unsigned long arg, bool *last)
  131. {
  132. struct fw_head *head = rtnl_dereference(tp->root);
  133. struct fw_filter *f = (struct fw_filter *)arg;
  134. struct fw_filter __rcu **fp;
  135. struct fw_filter *pfp;
  136. int ret = -EINVAL;
  137. int h;
  138. if (head == NULL || f == NULL)
  139. goto out;
  140. fp = &head->ht[fw_hash(f->id)];
  141. for (pfp = rtnl_dereference(*fp); pfp;
  142. fp = &pfp->next, pfp = rtnl_dereference(*fp)) {
  143. if (pfp == f) {
  144. RCU_INIT_POINTER(*fp, rtnl_dereference(f->next));
  145. tcf_unbind_filter(tp, &f->res);
  146. call_rcu(&f->rcu, fw_delete_filter);
  147. ret = 0;
  148. break;
  149. }
  150. }
  151. *last = true;
  152. for (h = 0; h < HTSIZE; h++) {
  153. if (rcu_access_pointer(head->ht[h])) {
  154. *last = false;
  155. break;
  156. }
  157. }
  158. out:
  159. return ret;
  160. }
  161. static const struct nla_policy fw_policy[TCA_FW_MAX + 1] = {
  162. [TCA_FW_CLASSID] = { .type = NLA_U32 },
  163. [TCA_FW_INDEV] = { .type = NLA_STRING, .len = IFNAMSIZ },
  164. [TCA_FW_MASK] = { .type = NLA_U32 },
  165. };
  166. static int
  167. fw_change_attrs(struct net *net, struct tcf_proto *tp, struct fw_filter *f,
  168. struct nlattr **tb, struct nlattr **tca, unsigned long base,
  169. bool ovr)
  170. {
  171. struct fw_head *head = rtnl_dereference(tp->root);
  172. struct tcf_exts e;
  173. u32 mask;
  174. int err;
  175. err = tcf_exts_init(&e, TCA_FW_ACT, TCA_FW_POLICE);
  176. if (err < 0)
  177. return err;
  178. err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr);
  179. if (err < 0)
  180. goto errout;
  181. if (tb[TCA_FW_CLASSID]) {
  182. f->res.classid = nla_get_u32(tb[TCA_FW_CLASSID]);
  183. tcf_bind_filter(tp, &f->res, base);
  184. }
  185. #ifdef CONFIG_NET_CLS_IND
  186. if (tb[TCA_FW_INDEV]) {
  187. int ret;
  188. ret = tcf_change_indev(net, tb[TCA_FW_INDEV]);
  189. if (ret < 0) {
  190. err = ret;
  191. goto errout;
  192. }
  193. f->ifindex = ret;
  194. }
  195. #endif /* CONFIG_NET_CLS_IND */
  196. err = -EINVAL;
  197. if (tb[TCA_FW_MASK]) {
  198. mask = nla_get_u32(tb[TCA_FW_MASK]);
  199. if (mask != head->mask)
  200. goto errout;
  201. } else if (head->mask != 0xFFFFFFFF)
  202. goto errout;
  203. tcf_exts_change(tp, &f->exts, &e);
  204. return 0;
  205. errout:
  206. tcf_exts_destroy(&e);
  207. return err;
  208. }
  209. static int fw_change(struct net *net, struct sk_buff *in_skb,
  210. struct tcf_proto *tp, unsigned long base,
  211. u32 handle, struct nlattr **tca, unsigned long *arg,
  212. bool ovr)
  213. {
  214. struct fw_head *head = rtnl_dereference(tp->root);
  215. struct fw_filter *f = (struct fw_filter *) *arg;
  216. struct nlattr *opt = tca[TCA_OPTIONS];
  217. struct nlattr *tb[TCA_FW_MAX + 1];
  218. int err;
  219. if (!opt)
  220. return handle ? -EINVAL : 0; /* Succeed if it is old method. */
  221. err = nla_parse_nested(tb, TCA_FW_MAX, opt, fw_policy, NULL);
  222. if (err < 0)
  223. return err;
  224. if (f) {
  225. struct fw_filter *pfp, *fnew;
  226. struct fw_filter __rcu **fp;
  227. if (f->id != handle && handle)
  228. return -EINVAL;
  229. fnew = kzalloc(sizeof(struct fw_filter), GFP_KERNEL);
  230. if (!fnew)
  231. return -ENOBUFS;
  232. fnew->id = f->id;
  233. fnew->res = f->res;
  234. #ifdef CONFIG_NET_CLS_IND
  235. fnew->ifindex = f->ifindex;
  236. #endif /* CONFIG_NET_CLS_IND */
  237. fnew->tp = f->tp;
  238. err = tcf_exts_init(&fnew->exts, TCA_FW_ACT, TCA_FW_POLICE);
  239. if (err < 0) {
  240. kfree(fnew);
  241. return err;
  242. }
  243. err = fw_change_attrs(net, tp, fnew, tb, tca, base, ovr);
  244. if (err < 0) {
  245. tcf_exts_destroy(&fnew->exts);
  246. kfree(fnew);
  247. return err;
  248. }
  249. fp = &head->ht[fw_hash(fnew->id)];
  250. for (pfp = rtnl_dereference(*fp); pfp;
  251. fp = &pfp->next, pfp = rtnl_dereference(*fp))
  252. if (pfp == f)
  253. break;
  254. RCU_INIT_POINTER(fnew->next, rtnl_dereference(pfp->next));
  255. rcu_assign_pointer(*fp, fnew);
  256. tcf_unbind_filter(tp, &f->res);
  257. call_rcu(&f->rcu, fw_delete_filter);
  258. *arg = (unsigned long)fnew;
  259. return err;
  260. }
  261. if (!handle)
  262. return -EINVAL;
  263. if (!head) {
  264. u32 mask = 0xFFFFFFFF;
  265. if (tb[TCA_FW_MASK])
  266. mask = nla_get_u32(tb[TCA_FW_MASK]);
  267. head = kzalloc(sizeof(*head), GFP_KERNEL);
  268. if (!head)
  269. return -ENOBUFS;
  270. head->mask = mask;
  271. rcu_assign_pointer(tp->root, head);
  272. }
  273. f = kzalloc(sizeof(struct fw_filter), GFP_KERNEL);
  274. if (f == NULL)
  275. return -ENOBUFS;
  276. err = tcf_exts_init(&f->exts, TCA_FW_ACT, TCA_FW_POLICE);
  277. if (err < 0)
  278. goto errout;
  279. f->id = handle;
  280. f->tp = tp;
  281. err = fw_change_attrs(net, tp, f, tb, tca, base, ovr);
  282. if (err < 0)
  283. goto errout;
  284. RCU_INIT_POINTER(f->next, head->ht[fw_hash(handle)]);
  285. rcu_assign_pointer(head->ht[fw_hash(handle)], f);
  286. *arg = (unsigned long)f;
  287. return 0;
  288. errout:
  289. tcf_exts_destroy(&f->exts);
  290. kfree(f);
  291. return err;
  292. }
  293. static void fw_walk(struct tcf_proto *tp, struct tcf_walker *arg)
  294. {
  295. struct fw_head *head = rtnl_dereference(tp->root);
  296. int h;
  297. if (head == NULL)
  298. arg->stop = 1;
  299. if (arg->stop)
  300. return;
  301. for (h = 0; h < HTSIZE; h++) {
  302. struct fw_filter *f;
  303. for (f = rtnl_dereference(head->ht[h]); f;
  304. f = rtnl_dereference(f->next)) {
  305. if (arg->count < arg->skip) {
  306. arg->count++;
  307. continue;
  308. }
  309. if (arg->fn(tp, (unsigned long)f, arg) < 0) {
  310. arg->stop = 1;
  311. return;
  312. }
  313. arg->count++;
  314. }
  315. }
  316. }
  317. static int fw_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
  318. struct sk_buff *skb, struct tcmsg *t)
  319. {
  320. struct fw_head *head = rtnl_dereference(tp->root);
  321. struct fw_filter *f = (struct fw_filter *)fh;
  322. struct nlattr *nest;
  323. if (f == NULL)
  324. return skb->len;
  325. t->tcm_handle = f->id;
  326. if (!f->res.classid && !tcf_exts_is_available(&f->exts))
  327. return skb->len;
  328. nest = nla_nest_start(skb, TCA_OPTIONS);
  329. if (nest == NULL)
  330. goto nla_put_failure;
  331. if (f->res.classid &&
  332. nla_put_u32(skb, TCA_FW_CLASSID, f->res.classid))
  333. goto nla_put_failure;
  334. #ifdef CONFIG_NET_CLS_IND
  335. if (f->ifindex) {
  336. struct net_device *dev;
  337. dev = __dev_get_by_index(net, f->ifindex);
  338. if (dev && nla_put_string(skb, TCA_FW_INDEV, dev->name))
  339. goto nla_put_failure;
  340. }
  341. #endif /* CONFIG_NET_CLS_IND */
  342. if (head->mask != 0xFFFFFFFF &&
  343. nla_put_u32(skb, TCA_FW_MASK, head->mask))
  344. goto nla_put_failure;
  345. if (tcf_exts_dump(skb, &f->exts) < 0)
  346. goto nla_put_failure;
  347. nla_nest_end(skb, nest);
  348. if (tcf_exts_dump_stats(skb, &f->exts) < 0)
  349. goto nla_put_failure;
  350. return skb->len;
  351. nla_put_failure:
  352. nla_nest_cancel(skb, nest);
  353. return -1;
  354. }
  355. static struct tcf_proto_ops cls_fw_ops __read_mostly = {
  356. .kind = "fw",
  357. .classify = fw_classify,
  358. .init = fw_init,
  359. .destroy = fw_destroy,
  360. .get = fw_get,
  361. .change = fw_change,
  362. .delete = fw_delete,
  363. .walk = fw_walk,
  364. .dump = fw_dump,
  365. .owner = THIS_MODULE,
  366. };
  367. static int __init init_fw(void)
  368. {
  369. return register_tcf_proto_ops(&cls_fw_ops);
  370. }
  371. static void __exit exit_fw(void)
  372. {
  373. unregister_tcf_proto_ops(&cls_fw_ops);
  374. }
  375. module_init(init_fw)
  376. module_exit(exit_fw)
  377. MODULE_LICENSE("GPL");