cls_fw.c 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438
  1. /*
  2. * net/sched/cls_fw.c Classifier mapping ipchains' fwmark to traffic class.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public License
  6. * as published by the Free Software Foundation; either version
  7. * 2 of the License, or (at your option) any later version.
  8. *
  9. * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
  10. *
  11. * Changes:
  12. * Karlis Peisenieks <karlis@mt.lv> : 990415 : fw_walk off by one
  13. * Karlis Peisenieks <karlis@mt.lv> : 990415 : fw_delete killed all the filter (and kernel).
  14. * Alex <alex@pilotsoft.com> : 2004xxyy: Added Action extension
  15. *
  16. * JHS: We should remove the CONFIG_NET_CLS_IND from here
  17. * eventually when the meta match extension is made available
  18. *
  19. */
  20. #include <linux/module.h>
  21. #include <linux/slab.h>
  22. #include <linux/types.h>
  23. #include <linux/kernel.h>
  24. #include <linux/string.h>
  25. #include <linux/errno.h>
  26. #include <linux/skbuff.h>
  27. #include <net/netlink.h>
  28. #include <net/act_api.h>
  29. #include <net/pkt_cls.h>
  30. #define HTSIZE 256
  31. struct fw_head {
  32. u32 mask;
  33. struct fw_filter __rcu *ht[HTSIZE];
  34. struct rcu_head rcu;
  35. };
  36. struct fw_filter {
  37. struct fw_filter __rcu *next;
  38. u32 id;
  39. struct tcf_result res;
  40. #ifdef CONFIG_NET_CLS_IND
  41. int ifindex;
  42. #endif /* CONFIG_NET_CLS_IND */
  43. struct tcf_exts exts;
  44. struct tcf_proto *tp;
  45. struct rcu_head rcu;
  46. };
  47. static u32 fw_hash(u32 handle)
  48. {
  49. handle ^= (handle >> 16);
  50. handle ^= (handle >> 8);
  51. return handle % HTSIZE;
  52. }
  53. static int fw_classify(struct sk_buff *skb, const struct tcf_proto *tp,
  54. struct tcf_result *res)
  55. {
  56. struct fw_head *head = rcu_dereference_bh(tp->root);
  57. struct fw_filter *f;
  58. int r;
  59. u32 id = skb->mark;
  60. if (head != NULL) {
  61. id &= head->mask;
  62. for (f = rcu_dereference_bh(head->ht[fw_hash(id)]); f;
  63. f = rcu_dereference_bh(f->next)) {
  64. if (f->id == id) {
  65. *res = f->res;
  66. #ifdef CONFIG_NET_CLS_IND
  67. if (!tcf_match_indev(skb, f->ifindex))
  68. continue;
  69. #endif /* CONFIG_NET_CLS_IND */
  70. r = tcf_exts_exec(skb, &f->exts, res);
  71. if (r < 0)
  72. continue;
  73. return r;
  74. }
  75. }
  76. } else {
  77. /* Old method: classify the packet using its skb mark. */
  78. if (id && (TC_H_MAJ(id) == 0 ||
  79. !(TC_H_MAJ(id ^ tp->q->handle)))) {
  80. res->classid = id;
  81. res->class = 0;
  82. return 0;
  83. }
  84. }
  85. return -1;
  86. }
  87. static unsigned long fw_get(struct tcf_proto *tp, u32 handle)
  88. {
  89. struct fw_head *head = rtnl_dereference(tp->root);
  90. struct fw_filter *f;
  91. if (head == NULL)
  92. return 0;
  93. f = rtnl_dereference(head->ht[fw_hash(handle)]);
  94. for (; f; f = rtnl_dereference(f->next)) {
  95. if (f->id == handle)
  96. return (unsigned long)f;
  97. }
  98. return 0;
  99. }
  /*
   * Classifier init hook. Nothing is set up here: the fw_head is created
   * on demand by fw_change(), because the old method works without one.
   *
   * Always returns 0.
   */
  static int fw_init(struct tcf_proto *tp)
  {
  	return 0;
  }
  107. static void fw_delete_filter(struct rcu_head *head)
  108. {
  109. struct fw_filter *f = container_of(head, struct fw_filter, rcu);
  110. tcf_exts_destroy(&f->exts);
  111. kfree(f);
  112. }
  113. static bool fw_destroy(struct tcf_proto *tp, bool force)
  114. {
  115. struct fw_head *head = rtnl_dereference(tp->root);
  116. struct fw_filter *f;
  117. int h;
  118. if (head == NULL)
  119. return true;
  120. if (!force) {
  121. for (h = 0; h < HTSIZE; h++)
  122. if (rcu_access_pointer(head->ht[h]))
  123. return false;
  124. }
  125. for (h = 0; h < HTSIZE; h++) {
  126. while ((f = rtnl_dereference(head->ht[h])) != NULL) {
  127. RCU_INIT_POINTER(head->ht[h],
  128. rtnl_dereference(f->next));
  129. tcf_unbind_filter(tp, &f->res);
  130. call_rcu(&f->rcu, fw_delete_filter);
  131. }
  132. }
  133. RCU_INIT_POINTER(tp->root, NULL);
  134. kfree_rcu(head, rcu);
  135. return true;
  136. }
  137. static int fw_delete(struct tcf_proto *tp, unsigned long arg)
  138. {
  139. struct fw_head *head = rtnl_dereference(tp->root);
  140. struct fw_filter *f = (struct fw_filter *)arg;
  141. struct fw_filter __rcu **fp;
  142. struct fw_filter *pfp;
  143. if (head == NULL || f == NULL)
  144. goto out;
  145. fp = &head->ht[fw_hash(f->id)];
  146. for (pfp = rtnl_dereference(*fp); pfp;
  147. fp = &pfp->next, pfp = rtnl_dereference(*fp)) {
  148. if (pfp == f) {
  149. RCU_INIT_POINTER(*fp, rtnl_dereference(f->next));
  150. tcf_unbind_filter(tp, &f->res);
  151. call_rcu(&f->rcu, fw_delete_filter);
  152. return 0;
  153. }
  154. }
  155. out:
  156. return -EINVAL;
  157. }
  158. static const struct nla_policy fw_policy[TCA_FW_MAX + 1] = {
  159. [TCA_FW_CLASSID] = { .type = NLA_U32 },
  160. [TCA_FW_INDEV] = { .type = NLA_STRING, .len = IFNAMSIZ },
  161. [TCA_FW_MASK] = { .type = NLA_U32 },
  162. };
  163. static int
  164. fw_change_attrs(struct net *net, struct tcf_proto *tp, struct fw_filter *f,
  165. struct nlattr **tb, struct nlattr **tca, unsigned long base, bool ovr)
  166. {
  167. struct fw_head *head = rtnl_dereference(tp->root);
  168. struct tcf_exts e;
  169. u32 mask;
  170. int err;
  171. tcf_exts_init(&e, TCA_FW_ACT, TCA_FW_POLICE);
  172. err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr);
  173. if (err < 0)
  174. return err;
  175. if (tb[TCA_FW_CLASSID]) {
  176. f->res.classid = nla_get_u32(tb[TCA_FW_CLASSID]);
  177. tcf_bind_filter(tp, &f->res, base);
  178. }
  179. #ifdef CONFIG_NET_CLS_IND
  180. if (tb[TCA_FW_INDEV]) {
  181. int ret;
  182. ret = tcf_change_indev(net, tb[TCA_FW_INDEV]);
  183. if (ret < 0) {
  184. err = ret;
  185. goto errout;
  186. }
  187. f->ifindex = ret;
  188. }
  189. #endif /* CONFIG_NET_CLS_IND */
  190. err = -EINVAL;
  191. if (tb[TCA_FW_MASK]) {
  192. mask = nla_get_u32(tb[TCA_FW_MASK]);
  193. if (mask != head->mask)
  194. goto errout;
  195. } else if (head->mask != 0xFFFFFFFF)
  196. goto errout;
  197. tcf_exts_change(tp, &f->exts, &e);
  198. return 0;
  199. errout:
  200. tcf_exts_destroy(&e);
  201. return err;
  202. }
  203. static int fw_change(struct net *net, struct sk_buff *in_skb,
  204. struct tcf_proto *tp, unsigned long base,
  205. u32 handle,
  206. struct nlattr **tca,
  207. unsigned long *arg, bool ovr)
  208. {
  209. struct fw_head *head = rtnl_dereference(tp->root);
  210. struct fw_filter *f = (struct fw_filter *) *arg;
  211. struct nlattr *opt = tca[TCA_OPTIONS];
  212. struct nlattr *tb[TCA_FW_MAX + 1];
  213. int err;
  214. if (!opt)
  215. return handle ? -EINVAL : 0; /* Succeed if it is old method. */
  216. err = nla_parse_nested(tb, TCA_FW_MAX, opt, fw_policy);
  217. if (err < 0)
  218. return err;
  219. if (f) {
  220. struct fw_filter *pfp, *fnew;
  221. struct fw_filter __rcu **fp;
  222. if (f->id != handle && handle)
  223. return -EINVAL;
  224. fnew = kzalloc(sizeof(struct fw_filter), GFP_KERNEL);
  225. if (!fnew)
  226. return -ENOBUFS;
  227. fnew->id = f->id;
  228. fnew->res = f->res;
  229. #ifdef CONFIG_NET_CLS_IND
  230. fnew->ifindex = f->ifindex;
  231. #endif /* CONFIG_NET_CLS_IND */
  232. fnew->tp = f->tp;
  233. tcf_exts_init(&fnew->exts, TCA_FW_ACT, TCA_FW_POLICE);
  234. err = fw_change_attrs(net, tp, fnew, tb, tca, base, ovr);
  235. if (err < 0) {
  236. kfree(fnew);
  237. return err;
  238. }
  239. fp = &head->ht[fw_hash(fnew->id)];
  240. for (pfp = rtnl_dereference(*fp); pfp;
  241. fp = &pfp->next, pfp = rtnl_dereference(*fp))
  242. if (pfp == f)
  243. break;
  244. RCU_INIT_POINTER(fnew->next, rtnl_dereference(pfp->next));
  245. rcu_assign_pointer(*fp, fnew);
  246. tcf_unbind_filter(tp, &f->res);
  247. call_rcu(&f->rcu, fw_delete_filter);
  248. *arg = (unsigned long)fnew;
  249. return err;
  250. }
  251. if (!handle)
  252. return -EINVAL;
  253. if (!head) {
  254. u32 mask = 0xFFFFFFFF;
  255. if (tb[TCA_FW_MASK])
  256. mask = nla_get_u32(tb[TCA_FW_MASK]);
  257. head = kzalloc(sizeof(*head), GFP_KERNEL);
  258. if (!head)
  259. return -ENOBUFS;
  260. head->mask = mask;
  261. rcu_assign_pointer(tp->root, head);
  262. }
  263. f = kzalloc(sizeof(struct fw_filter), GFP_KERNEL);
  264. if (f == NULL)
  265. return -ENOBUFS;
  266. tcf_exts_init(&f->exts, TCA_FW_ACT, TCA_FW_POLICE);
  267. f->id = handle;
  268. f->tp = tp;
  269. err = fw_change_attrs(net, tp, f, tb, tca, base, ovr);
  270. if (err < 0)
  271. goto errout;
  272. RCU_INIT_POINTER(f->next, head->ht[fw_hash(handle)]);
  273. rcu_assign_pointer(head->ht[fw_hash(handle)], f);
  274. *arg = (unsigned long)f;
  275. return 0;
  276. errout:
  277. kfree(f);
  278. return err;
  279. }
  280. static void fw_walk(struct tcf_proto *tp, struct tcf_walker *arg)
  281. {
  282. struct fw_head *head = rtnl_dereference(tp->root);
  283. int h;
  284. if (head == NULL)
  285. arg->stop = 1;
  286. if (arg->stop)
  287. return;
  288. for (h = 0; h < HTSIZE; h++) {
  289. struct fw_filter *f;
  290. for (f = rtnl_dereference(head->ht[h]); f;
  291. f = rtnl_dereference(f->next)) {
  292. if (arg->count < arg->skip) {
  293. arg->count++;
  294. continue;
  295. }
  296. if (arg->fn(tp, (unsigned long)f, arg) < 0) {
  297. arg->stop = 1;
  298. return;
  299. }
  300. arg->count++;
  301. }
  302. }
  303. }
  304. static int fw_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
  305. struct sk_buff *skb, struct tcmsg *t)
  306. {
  307. struct fw_head *head = rtnl_dereference(tp->root);
  308. struct fw_filter *f = (struct fw_filter *)fh;
  309. struct nlattr *nest;
  310. if (f == NULL)
  311. return skb->len;
  312. t->tcm_handle = f->id;
  313. if (!f->res.classid && !tcf_exts_is_available(&f->exts))
  314. return skb->len;
  315. nest = nla_nest_start(skb, TCA_OPTIONS);
  316. if (nest == NULL)
  317. goto nla_put_failure;
  318. if (f->res.classid &&
  319. nla_put_u32(skb, TCA_FW_CLASSID, f->res.classid))
  320. goto nla_put_failure;
  321. #ifdef CONFIG_NET_CLS_IND
  322. if (f->ifindex) {
  323. struct net_device *dev;
  324. dev = __dev_get_by_index(net, f->ifindex);
  325. if (dev && nla_put_string(skb, TCA_FW_INDEV, dev->name))
  326. goto nla_put_failure;
  327. }
  328. #endif /* CONFIG_NET_CLS_IND */
  329. if (head->mask != 0xFFFFFFFF &&
  330. nla_put_u32(skb, TCA_FW_MASK, head->mask))
  331. goto nla_put_failure;
  332. if (tcf_exts_dump(skb, &f->exts) < 0)
  333. goto nla_put_failure;
  334. nla_nest_end(skb, nest);
  335. if (tcf_exts_dump_stats(skb, &f->exts) < 0)
  336. goto nla_put_failure;
  337. return skb->len;
  338. nla_put_failure:
  339. nla_nest_cancel(skb, nest);
  340. return -1;
  341. }
  342. static struct tcf_proto_ops cls_fw_ops __read_mostly = {
  343. .kind = "fw",
  344. .classify = fw_classify,
  345. .init = fw_init,
  346. .destroy = fw_destroy,
  347. .get = fw_get,
  348. .change = fw_change,
  349. .delete = fw_delete,
  350. .walk = fw_walk,
  351. .dump = fw_dump,
  352. .owner = THIS_MODULE,
  353. };
  354. static int __init init_fw(void)
  355. {
  356. return register_tcf_proto_ops(&cls_fw_ops);
  357. }
  358. static void __exit exit_fw(void)
  359. {
  360. unregister_tcf_proto_ops(&cls_fw_ops);
  361. }
  362. module_init(init_fw)
  363. module_exit(exit_fw)
  364. MODULE_LICENSE("GPL");