/*
 * gre_demux.c - GRE over IPv4 demultiplexer driver
 *
 * Authors: Dmitry Kozlov (xeb@mail.ru)
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 */
  12. #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  13. #include <linux/module.h>
  14. #include <linux/if.h>
  15. #include <linux/icmp.h>
  16. #include <linux/kernel.h>
  17. #include <linux/kmod.h>
  18. #include <linux/skbuff.h>
  19. #include <linux/in.h>
  20. #include <linux/ip.h>
  21. #include <linux/netdevice.h>
  22. #include <linux/if_tunnel.h>
  23. #include <linux/spinlock.h>
  24. #include <net/protocol.h>
  25. #include <net/gre.h>
  26. #include <net/icmp.h>
  27. #include <net/route.h>
  28. #include <net/xfrm.h>
  29. static const struct gre_protocol __rcu *gre_proto[GREPROTO_MAX] __read_mostly;
  30. static struct gre_cisco_protocol __rcu *gre_cisco_proto_list[GRE_IP_PROTO_MAX];
  31. int gre_add_protocol(const struct gre_protocol *proto, u8 version)
  32. {
  33. if (version >= GREPROTO_MAX)
  34. return -EINVAL;
  35. return (cmpxchg((const struct gre_protocol **)&gre_proto[version], NULL, proto) == NULL) ?
  36. 0 : -EBUSY;
  37. }
  38. EXPORT_SYMBOL_GPL(gre_add_protocol);
  39. int gre_del_protocol(const struct gre_protocol *proto, u8 version)
  40. {
  41. int ret;
  42. if (version >= GREPROTO_MAX)
  43. return -EINVAL;
  44. ret = (cmpxchg((const struct gre_protocol **)&gre_proto[version], proto, NULL) == proto) ?
  45. 0 : -EBUSY;
  46. if (ret)
  47. return ret;
  48. synchronize_rcu();
  49. return 0;
  50. }
  51. EXPORT_SYMBOL_GPL(gre_del_protocol);
  52. void gre_build_header(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
  53. int hdr_len)
  54. {
  55. struct gre_base_hdr *greh;
  56. skb_push(skb, hdr_len);
  57. greh = (struct gre_base_hdr *)skb->data;
  58. greh->flags = tnl_flags_to_gre_flags(tpi->flags);
  59. greh->protocol = tpi->proto;
  60. if (tpi->flags&(TUNNEL_KEY|TUNNEL_CSUM|TUNNEL_SEQ)) {
  61. __be32 *ptr = (__be32 *)(((u8 *)greh) + hdr_len - 4);
  62. if (tpi->flags&TUNNEL_SEQ) {
  63. *ptr = tpi->seq;
  64. ptr--;
  65. }
  66. if (tpi->flags&TUNNEL_KEY) {
  67. *ptr = tpi->key;
  68. ptr--;
  69. }
  70. if (tpi->flags&TUNNEL_CSUM &&
  71. !(skb_shinfo(skb)->gso_type & SKB_GSO_GRE)) {
  72. *ptr = 0;
  73. *(__sum16 *)ptr = csum_fold(skb_checksum(skb, 0,
  74. skb->len, 0));
  75. }
  76. }
  77. }
  78. EXPORT_SYMBOL_GPL(gre_build_header);
  79. static __sum16 check_checksum(struct sk_buff *skb)
  80. {
  81. __sum16 csum = 0;
  82. switch (skb->ip_summed) {
  83. case CHECKSUM_COMPLETE:
  84. csum = csum_fold(skb->csum);
  85. if (!csum)
  86. break;
  87. /* Fall through. */
  88. case CHECKSUM_NONE:
  89. skb->csum = 0;
  90. csum = __skb_checksum_complete(skb);
  91. skb->ip_summed = CHECKSUM_COMPLETE;
  92. break;
  93. }
  94. return csum;
  95. }
  96. static int parse_gre_header(struct sk_buff *skb, struct tnl_ptk_info *tpi,
  97. bool *csum_err)
  98. {
  99. unsigned int ip_hlen = ip_hdrlen(skb);
  100. const struct gre_base_hdr *greh;
  101. __be32 *options;
  102. int hdr_len;
  103. if (unlikely(!pskb_may_pull(skb, sizeof(struct gre_base_hdr))))
  104. return -EINVAL;
  105. greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
  106. if (unlikely(greh->flags & (GRE_VERSION | GRE_ROUTING)))
  107. return -EINVAL;
  108. tpi->flags = gre_flags_to_tnl_flags(greh->flags);
  109. hdr_len = ip_gre_calc_hlen(tpi->flags);
  110. if (!pskb_may_pull(skb, hdr_len))
  111. return -EINVAL;
  112. greh = (struct gre_base_hdr *)(skb_network_header(skb) + ip_hlen);
  113. tpi->proto = greh->protocol;
  114. options = (__be32 *)(greh + 1);
  115. if (greh->flags & GRE_CSUM) {
  116. if (check_checksum(skb)) {
  117. *csum_err = true;
  118. return -EINVAL;
  119. }
  120. options++;
  121. }
  122. if (greh->flags & GRE_KEY) {
  123. tpi->key = *options;
  124. options++;
  125. } else
  126. tpi->key = 0;
  127. if (unlikely(greh->flags & GRE_SEQ)) {
  128. tpi->seq = *options;
  129. options++;
  130. } else
  131. tpi->seq = 0;
  132. /* WCCP version 1 and 2 protocol decoding.
  133. * - Change protocol to IP
  134. * - When dealing with WCCPv2, Skip extra 4 bytes in GRE header
  135. */
  136. if (greh->flags == 0 && tpi->proto == htons(ETH_P_WCCP)) {
  137. tpi->proto = htons(ETH_P_IP);
  138. if ((*(u8 *)options & 0xF0) != 0x40) {
  139. hdr_len += 4;
  140. if (!pskb_may_pull(skb, hdr_len))
  141. return -EINVAL;
  142. }
  143. }
  144. return iptunnel_pull_header(skb, hdr_len, tpi->proto);
  145. }
  146. static int gre_cisco_rcv(struct sk_buff *skb)
  147. {
  148. struct tnl_ptk_info tpi;
  149. int i;
  150. bool csum_err = false;
  151. #ifdef CONFIG_NET_IPGRE_BROADCAST
  152. if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
  153. /* Looped back packet, drop it! */
  154. if (rt_is_output_route(skb_rtable(skb)))
  155. goto drop;
  156. }
  157. #endif
  158. if (parse_gre_header(skb, &tpi, &csum_err) < 0)
  159. goto drop;
  160. rcu_read_lock();
  161. for (i = 0; i < GRE_IP_PROTO_MAX; i++) {
  162. struct gre_cisco_protocol *proto;
  163. int ret;
  164. proto = rcu_dereference(gre_cisco_proto_list[i]);
  165. if (!proto)
  166. continue;
  167. ret = proto->handler(skb, &tpi);
  168. if (ret == PACKET_RCVD) {
  169. rcu_read_unlock();
  170. return 0;
  171. }
  172. }
  173. rcu_read_unlock();
  174. icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
  175. drop:
  176. kfree_skb(skb);
  177. return 0;
  178. }
  179. static void gre_cisco_err(struct sk_buff *skb, u32 info)
  180. {
  181. /* All the routers (except for Linux) return only
  182. * 8 bytes of packet payload. It means, that precise relaying of
  183. * ICMP in the real Internet is absolutely infeasible.
  184. *
  185. * Moreover, Cisco "wise men" put GRE key to the third word
  186. * in GRE header. It makes impossible maintaining even soft
  187. * state for keyed
  188. * GRE tunnels with enabled checksum. Tell them "thank you".
  189. *
  190. * Well, I wonder, rfc1812 was written by Cisco employee,
  191. * what the hell these idiots break standards established
  192. * by themselves???
  193. */
  194. const int type = icmp_hdr(skb)->type;
  195. const int code = icmp_hdr(skb)->code;
  196. struct tnl_ptk_info tpi;
  197. bool csum_err = false;
  198. int i;
  199. if (parse_gre_header(skb, &tpi, &csum_err)) {
  200. if (!csum_err) /* ignore csum errors. */
  201. return;
  202. }
  203. if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
  204. ipv4_update_pmtu(skb, dev_net(skb->dev), info,
  205. skb->dev->ifindex, 0, IPPROTO_GRE, 0);
  206. return;
  207. }
  208. if (type == ICMP_REDIRECT) {
  209. ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex, 0,
  210. IPPROTO_GRE, 0);
  211. return;
  212. }
  213. rcu_read_lock();
  214. for (i = 0; i < GRE_IP_PROTO_MAX; i++) {
  215. struct gre_cisco_protocol *proto;
  216. proto = rcu_dereference(gre_cisco_proto_list[i]);
  217. if (!proto)
  218. continue;
  219. if (proto->err_handler(skb, info, &tpi) == PACKET_RCVD)
  220. goto out;
  221. }
  222. out:
  223. rcu_read_unlock();
  224. }
  225. static int gre_rcv(struct sk_buff *skb)
  226. {
  227. const struct gre_protocol *proto;
  228. u8 ver;
  229. int ret;
  230. if (!pskb_may_pull(skb, 12))
  231. goto drop;
  232. ver = skb->data[1]&0x7f;
  233. if (ver >= GREPROTO_MAX)
  234. goto drop;
  235. rcu_read_lock();
  236. proto = rcu_dereference(gre_proto[ver]);
  237. if (!proto || !proto->handler)
  238. goto drop_unlock;
  239. ret = proto->handler(skb);
  240. rcu_read_unlock();
  241. return ret;
  242. drop_unlock:
  243. rcu_read_unlock();
  244. drop:
  245. kfree_skb(skb);
  246. return NET_RX_DROP;
  247. }
  248. static void gre_err(struct sk_buff *skb, u32 info)
  249. {
  250. const struct gre_protocol *proto;
  251. const struct iphdr *iph = (const struct iphdr *)skb->data;
  252. u8 ver = skb->data[(iph->ihl<<2) + 1]&0x7f;
  253. if (ver >= GREPROTO_MAX)
  254. return;
  255. rcu_read_lock();
  256. proto = rcu_dereference(gre_proto[ver]);
  257. if (proto && proto->err_handler)
  258. proto->err_handler(skb, info);
  259. rcu_read_unlock();
  260. }
  261. static const struct net_protocol net_gre_protocol = {
  262. .handler = gre_rcv,
  263. .err_handler = gre_err,
  264. .netns_ok = 1,
  265. };
  266. static const struct gre_protocol ipgre_protocol = {
  267. .handler = gre_cisco_rcv,
  268. .err_handler = gre_cisco_err,
  269. };
  270. int gre_cisco_register(struct gre_cisco_protocol *newp)
  271. {
  272. struct gre_cisco_protocol **proto = (struct gre_cisco_protocol **)
  273. &gre_cisco_proto_list[newp->priority];
  274. return (cmpxchg(proto, NULL, newp) == NULL) ? 0 : -EBUSY;
  275. }
  276. EXPORT_SYMBOL_GPL(gre_cisco_register);
  277. int gre_cisco_unregister(struct gre_cisco_protocol *del_proto)
  278. {
  279. struct gre_cisco_protocol **proto = (struct gre_cisco_protocol **)
  280. &gre_cisco_proto_list[del_proto->priority];
  281. int ret;
  282. ret = (cmpxchg(proto, del_proto, NULL) == del_proto) ? 0 : -EINVAL;
  283. if (ret)
  284. return ret;
  285. synchronize_net();
  286. return 0;
  287. }
  288. EXPORT_SYMBOL_GPL(gre_cisco_unregister);
  289. static int __init gre_init(void)
  290. {
  291. pr_info("GRE over IPv4 demultiplexor driver\n");
  292. if (inet_add_protocol(&net_gre_protocol, IPPROTO_GRE) < 0) {
  293. pr_err("can't add protocol\n");
  294. goto err;
  295. }
  296. if (gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO) < 0) {
  297. pr_info("%s: can't add ipgre handler\n", __func__);
  298. goto err_gre;
  299. }
  300. return 0;
  301. err_gre:
  302. inet_del_protocol(&net_gre_protocol, IPPROTO_GRE);
  303. err:
  304. return -EAGAIN;
  305. }
  306. static void __exit gre_exit(void)
  307. {
  308. gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
  309. inet_del_protocol(&net_gre_protocol, IPPROTO_GRE);
  310. }
  311. module_init(gre_init);
  312. module_exit(gre_exit);
  313. MODULE_DESCRIPTION("GRE over IPv4 demultiplexer driver");
  314. MODULE_AUTHOR("D. Kozlov (xeb@mail.ru)");
  315. MODULE_LICENSE("GPL");