msg.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569
  1. /*
  2. * net/tipc/msg.c: TIPC message header routines
  3. *
  4. * Copyright (c) 2000-2006, 2014-2015, Ericsson AB
  5. * Copyright (c) 2005, 2010-2011, Wind River Systems
  6. * All rights reserved.
  7. *
  8. * Redistribution and use in source and binary forms, with or without
  9. * modification, are permitted provided that the following conditions are met:
  10. *
  11. * 1. Redistributions of source code must retain the above copyright
  12. * notice, this list of conditions and the following disclaimer.
  13. * 2. Redistributions in binary form must reproduce the above copyright
  14. * notice, this list of conditions and the following disclaimer in the
  15. * documentation and/or other materials provided with the distribution.
  16. * 3. Neither the names of the copyright holders nor the names of its
  17. * contributors may be used to endorse or promote products derived from
  18. * this software without specific prior written permission.
  19. *
  20. * Alternatively, this software may be distributed under the terms of the
  21. * GNU General Public License ("GPL") version 2 as published by the Free
  22. * Software Foundation.
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  25. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  26. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  28. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  31. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  32. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  33. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  34. * POSSIBILITY OF SUCH DAMAGE.
  35. */
  36. #include <net/sock.h>
  37. #include "core.h"
  38. #include "msg.h"
  39. #include "addr.h"
  40. #include "name_table.h"
  41. #define MAX_FORWARD_SIZE 1024
  42. static unsigned int align(unsigned int i)
  43. {
  44. return (i + 3) & ~3u;
  45. }
  46. /**
  47. * tipc_buf_acquire - creates a TIPC message buffer
  48. * @size: message size (including TIPC header)
  49. *
  50. * Returns a new buffer with data pointers set to the specified size.
  51. *
  52. * NOTE: Headroom is reserved to allow prepending of a data link header.
  53. * There may also be unrequested tailroom present at the buffer's end.
  54. */
  55. struct sk_buff *tipc_buf_acquire(u32 size)
  56. {
  57. struct sk_buff *skb;
  58. unsigned int buf_size = (BUF_HEADROOM + size + 3) & ~3u;
  59. skb = alloc_skb_fclone(buf_size, GFP_ATOMIC);
  60. if (skb) {
  61. skb_reserve(skb, BUF_HEADROOM);
  62. skb_put(skb, size);
  63. skb->next = NULL;
  64. }
  65. return skb;
  66. }
  67. void tipc_msg_init(u32 own_node, struct tipc_msg *m, u32 user, u32 type,
  68. u32 hsize, u32 dnode)
  69. {
  70. memset(m, 0, hsize);
  71. msg_set_version(m);
  72. msg_set_user(m, user);
  73. msg_set_hdr_sz(m, hsize);
  74. msg_set_size(m, hsize);
  75. msg_set_prevnode(m, own_node);
  76. msg_set_type(m, type);
  77. if (hsize > SHORT_H_SIZE) {
  78. msg_set_orignode(m, own_node);
  79. msg_set_destnode(m, dnode);
  80. }
  81. }
  82. struct sk_buff *tipc_msg_create(uint user, uint type,
  83. uint hdr_sz, uint data_sz, u32 dnode,
  84. u32 onode, u32 dport, u32 oport, int errcode)
  85. {
  86. struct tipc_msg *msg;
  87. struct sk_buff *buf;
  88. buf = tipc_buf_acquire(hdr_sz + data_sz);
  89. if (unlikely(!buf))
  90. return NULL;
  91. msg = buf_msg(buf);
  92. tipc_msg_init(onode, msg, user, type, hdr_sz, dnode);
  93. msg_set_size(msg, hdr_sz + data_sz);
  94. msg_set_origport(msg, oport);
  95. msg_set_destport(msg, dport);
  96. msg_set_errcode(msg, errcode);
  97. if (hdr_sz > SHORT_H_SIZE) {
  98. msg_set_orignode(msg, onode);
  99. msg_set_destnode(msg, dnode);
  100. }
  101. return buf;
  102. }
  103. /* tipc_buf_append(): Append a buffer to the fragment list of another buffer
  104. * @*headbuf: in: NULL for first frag, otherwise value returned from prev call
  105. * out: set when successful non-complete reassembly, otherwise NULL
  106. * @*buf: in: the buffer to append. Always defined
  107. * out: head buf after successful complete reassembly, otherwise NULL
  108. * Returns 1 when reassembly complete, otherwise 0
  109. */
  110. int tipc_buf_append(struct sk_buff **headbuf, struct sk_buff **buf)
  111. {
  112. struct sk_buff *head = *headbuf;
  113. struct sk_buff *frag = *buf;
  114. struct sk_buff *tail;
  115. struct tipc_msg *msg;
  116. u32 fragid;
  117. int delta;
  118. bool headstolen;
  119. if (!frag)
  120. goto err;
  121. msg = buf_msg(frag);
  122. fragid = msg_type(msg);
  123. frag->next = NULL;
  124. skb_pull(frag, msg_hdr_sz(msg));
  125. if (fragid == FIRST_FRAGMENT) {
  126. if (unlikely(head))
  127. goto err;
  128. if (unlikely(skb_unclone(frag, GFP_ATOMIC)))
  129. goto err;
  130. head = *headbuf = frag;
  131. skb_frag_list_init(head);
  132. TIPC_SKB_CB(head)->tail = NULL;
  133. *buf = NULL;
  134. return 0;
  135. }
  136. if (!head)
  137. goto err;
  138. if (skb_try_coalesce(head, frag, &headstolen, &delta)) {
  139. kfree_skb_partial(frag, headstolen);
  140. } else {
  141. tail = TIPC_SKB_CB(head)->tail;
  142. if (!skb_has_frag_list(head))
  143. skb_shinfo(head)->frag_list = frag;
  144. else
  145. tail->next = frag;
  146. head->truesize += frag->truesize;
  147. head->data_len += frag->len;
  148. head->len += frag->len;
  149. TIPC_SKB_CB(head)->tail = frag;
  150. }
  151. if (fragid == LAST_FRAGMENT) {
  152. TIPC_SKB_CB(head)->validated = false;
  153. if (unlikely(!tipc_msg_validate(head)))
  154. goto err;
  155. *buf = head;
  156. TIPC_SKB_CB(head)->tail = NULL;
  157. *headbuf = NULL;
  158. return 1;
  159. }
  160. *buf = NULL;
  161. return 0;
  162. err:
  163. pr_warn_ratelimited("Unable to build fragment list\n");
  164. kfree_skb(*buf);
  165. kfree_skb(*headbuf);
  166. *buf = *headbuf = NULL;
  167. return 0;
  168. }
  169. /* tipc_msg_validate - validate basic format of received message
  170. *
  171. * This routine ensures a TIPC message has an acceptable header, and at least
  172. * as much data as the header indicates it should. The routine also ensures
  173. * that the entire message header is stored in the main fragment of the message
  174. * buffer, to simplify future access to message header fields.
  175. *
  176. * Note: Having extra info present in the message header or data areas is OK.
  177. * TIPC will ignore the excess, under the assumption that it is optional info
  178. * introduced by a later release of the protocol.
  179. */
  180. bool tipc_msg_validate(struct sk_buff *skb)
  181. {
  182. struct tipc_msg *msg;
  183. int msz, hsz;
  184. if (unlikely(TIPC_SKB_CB(skb)->validated))
  185. return true;
  186. if (unlikely(!pskb_may_pull(skb, MIN_H_SIZE)))
  187. return false;
  188. hsz = msg_hdr_sz(buf_msg(skb));
  189. if (unlikely(hsz < MIN_H_SIZE) || (hsz > MAX_H_SIZE))
  190. return false;
  191. if (unlikely(!pskb_may_pull(skb, hsz)))
  192. return false;
  193. msg = buf_msg(skb);
  194. if (unlikely(msg_version(msg) != TIPC_VERSION))
  195. return false;
  196. msz = msg_size(msg);
  197. if (unlikely(msz < hsz))
  198. return false;
  199. if (unlikely((msz - hsz) > TIPC_MAX_USER_MSG_SIZE))
  200. return false;
  201. if (unlikely(skb->len < msz))
  202. return false;
  203. TIPC_SKB_CB(skb)->validated = true;
  204. return true;
  205. }
  206. /**
  207. * tipc_msg_build - create buffer chain containing specified header and data
  208. * @mhdr: Message header, to be prepended to data
  209. * @m: User message
  210. * @dsz: Total length of user data
  211. * @pktmax: Max packet size that can be used
  212. * @list: Buffer or chain of buffers to be returned to caller
  213. *
  214. * Returns message data size or errno: -ENOMEM, -EFAULT
  215. */
  216. int tipc_msg_build(struct tipc_msg *mhdr, struct msghdr *m,
  217. int offset, int dsz, int pktmax, struct sk_buff_head *list)
  218. {
  219. int mhsz = msg_hdr_sz(mhdr);
  220. int msz = mhsz + dsz;
  221. int pktno = 1;
  222. int pktsz;
  223. int pktrem = pktmax;
  224. int drem = dsz;
  225. struct tipc_msg pkthdr;
  226. struct sk_buff *skb;
  227. char *pktpos;
  228. int rc;
  229. msg_set_size(mhdr, msz);
  230. /* No fragmentation needed? */
  231. if (likely(msz <= pktmax)) {
  232. skb = tipc_buf_acquire(msz);
  233. if (unlikely(!skb))
  234. return -ENOMEM;
  235. skb_orphan(skb);
  236. __skb_queue_tail(list, skb);
  237. skb_copy_to_linear_data(skb, mhdr, mhsz);
  238. pktpos = skb->data + mhsz;
  239. if (copy_from_iter(pktpos, dsz, &m->msg_iter) == dsz)
  240. return dsz;
  241. rc = -EFAULT;
  242. goto error;
  243. }
  244. /* Prepare reusable fragment header */
  245. tipc_msg_init(msg_prevnode(mhdr), &pkthdr, MSG_FRAGMENTER,
  246. FIRST_FRAGMENT, INT_H_SIZE, msg_destnode(mhdr));
  247. msg_set_size(&pkthdr, pktmax);
  248. msg_set_fragm_no(&pkthdr, pktno);
  249. msg_set_importance(&pkthdr, msg_importance(mhdr));
  250. /* Prepare first fragment */
  251. skb = tipc_buf_acquire(pktmax);
  252. if (!skb)
  253. return -ENOMEM;
  254. skb_orphan(skb);
  255. __skb_queue_tail(list, skb);
  256. pktpos = skb->data;
  257. skb_copy_to_linear_data(skb, &pkthdr, INT_H_SIZE);
  258. pktpos += INT_H_SIZE;
  259. pktrem -= INT_H_SIZE;
  260. skb_copy_to_linear_data_offset(skb, INT_H_SIZE, mhdr, mhsz);
  261. pktpos += mhsz;
  262. pktrem -= mhsz;
  263. do {
  264. if (drem < pktrem)
  265. pktrem = drem;
  266. if (copy_from_iter(pktpos, pktrem, &m->msg_iter) != pktrem) {
  267. rc = -EFAULT;
  268. goto error;
  269. }
  270. drem -= pktrem;
  271. if (!drem)
  272. break;
  273. /* Prepare new fragment: */
  274. if (drem < (pktmax - INT_H_SIZE))
  275. pktsz = drem + INT_H_SIZE;
  276. else
  277. pktsz = pktmax;
  278. skb = tipc_buf_acquire(pktsz);
  279. if (!skb) {
  280. rc = -ENOMEM;
  281. goto error;
  282. }
  283. skb_orphan(skb);
  284. __skb_queue_tail(list, skb);
  285. msg_set_type(&pkthdr, FRAGMENT);
  286. msg_set_size(&pkthdr, pktsz);
  287. msg_set_fragm_no(&pkthdr, ++pktno);
  288. skb_copy_to_linear_data(skb, &pkthdr, INT_H_SIZE);
  289. pktpos = skb->data + INT_H_SIZE;
  290. pktrem = pktsz - INT_H_SIZE;
  291. } while (1);
  292. msg_set_type(buf_msg(skb), LAST_FRAGMENT);
  293. return dsz;
  294. error:
  295. __skb_queue_purge(list);
  296. __skb_queue_head_init(list);
  297. return rc;
  298. }
  299. /**
  300. * tipc_msg_bundle(): Append contents of a buffer to tail of an existing one
  301. * @bskb: the buffer to append to ("bundle")
  302. * @skb: buffer to be appended
  303. * @mtu: max allowable size for the bundle buffer
  304. * Consumes buffer if successful
  305. * Returns true if bundling could be performed, otherwise false
  306. */
  307. bool tipc_msg_bundle(struct sk_buff *bskb, struct sk_buff *skb, u32 mtu)
  308. {
  309. struct tipc_msg *bmsg;
  310. struct tipc_msg *msg = buf_msg(skb);
  311. unsigned int bsz;
  312. unsigned int msz = msg_size(msg);
  313. u32 start, pad;
  314. u32 max = mtu - INT_H_SIZE;
  315. if (likely(msg_user(msg) == MSG_FRAGMENTER))
  316. return false;
  317. if (!bskb)
  318. return false;
  319. bmsg = buf_msg(bskb);
  320. bsz = msg_size(bmsg);
  321. start = align(bsz);
  322. pad = start - bsz;
  323. if (unlikely(msg_user(msg) == CHANGEOVER_PROTOCOL))
  324. return false;
  325. if (unlikely(msg_user(msg) == BCAST_PROTOCOL))
  326. return false;
  327. if (likely(msg_user(bmsg) != MSG_BUNDLER))
  328. return false;
  329. if (unlikely(skb_tailroom(bskb) < (pad + msz)))
  330. return false;
  331. if (unlikely(max < (start + msz)))
  332. return false;
  333. skb_put(bskb, pad + msz);
  334. skb_copy_to_linear_data_offset(bskb, start, skb->data, msz);
  335. msg_set_size(bmsg, start + msz);
  336. msg_set_msgcnt(bmsg, msg_msgcnt(bmsg) + 1);
  337. kfree_skb(skb);
  338. return true;
  339. }
  340. /**
  341. * tipc_msg_extract(): extract bundled inner packet from buffer
  342. * @skb: buffer to be extracted from.
  343. * @iskb: extracted inner buffer, to be returned
  344. * @pos: position in outer message of msg to be extracted.
  345. * Returns position of next msg
  346. * Consumes outer buffer when last packet extracted
  347. * Returns true when when there is an extracted buffer, otherwise false
  348. */
  349. bool tipc_msg_extract(struct sk_buff *skb, struct sk_buff **iskb, int *pos)
  350. {
  351. struct tipc_msg *msg;
  352. int imsz, offset;
  353. *iskb = NULL;
  354. if (unlikely(skb_linearize(skb)))
  355. goto none;
  356. msg = buf_msg(skb);
  357. offset = msg_hdr_sz(msg) + *pos;
  358. if (unlikely(offset > (msg_size(msg) - MIN_H_SIZE)))
  359. goto none;
  360. *iskb = skb_clone(skb, GFP_ATOMIC);
  361. if (unlikely(!*iskb))
  362. goto none;
  363. skb_pull(*iskb, offset);
  364. imsz = msg_size(buf_msg(*iskb));
  365. skb_trim(*iskb, imsz);
  366. if (unlikely(!tipc_msg_validate(*iskb)))
  367. goto none;
  368. *pos += align(imsz);
  369. return true;
  370. none:
  371. kfree_skb(skb);
  372. kfree_skb(*iskb);
  373. *iskb = NULL;
  374. return false;
  375. }
  376. /**
  377. * tipc_msg_make_bundle(): Create bundle buf and append message to its tail
  378. * @list: the buffer chain
  379. * @skb: buffer to be appended and replaced
  380. * @mtu: max allowable size for the bundle buffer, inclusive header
  381. * @dnode: destination node for message. (Not always present in header)
  382. * Replaces buffer if successful
  383. * Returns true if success, otherwise false
  384. */
  385. bool tipc_msg_make_bundle(struct sk_buff **skb, u32 mtu, u32 dnode)
  386. {
  387. struct sk_buff *bskb;
  388. struct tipc_msg *bmsg;
  389. struct tipc_msg *msg = buf_msg(*skb);
  390. u32 msz = msg_size(msg);
  391. u32 max = mtu - INT_H_SIZE;
  392. if (msg_user(msg) == MSG_FRAGMENTER)
  393. return false;
  394. if (msg_user(msg) == CHANGEOVER_PROTOCOL)
  395. return false;
  396. if (msg_user(msg) == BCAST_PROTOCOL)
  397. return false;
  398. if (msz > (max / 2))
  399. return false;
  400. bskb = tipc_buf_acquire(max);
  401. if (!bskb)
  402. return false;
  403. skb_trim(bskb, INT_H_SIZE);
  404. bmsg = buf_msg(bskb);
  405. tipc_msg_init(msg_prevnode(msg), bmsg, MSG_BUNDLER, 0,
  406. INT_H_SIZE, dnode);
  407. msg_set_seqno(bmsg, msg_seqno(msg));
  408. msg_set_ack(bmsg, msg_ack(msg));
  409. msg_set_bcast_ack(bmsg, msg_bcast_ack(msg));
  410. tipc_msg_bundle(bskb, *skb, mtu);
  411. *skb = bskb;
  412. return true;
  413. }
  414. /**
  415. * tipc_msg_reverse(): swap source and destination addresses and add error code
  416. * @buf: buffer containing message to be reversed
  417. * @dnode: return value: node where to send message after reversal
  418. * @err: error code to be set in message
  419. * Consumes buffer if failure
  420. * Returns true if success, otherwise false
  421. */
  422. bool tipc_msg_reverse(u32 own_addr, struct sk_buff *buf, u32 *dnode,
  423. int err)
  424. {
  425. struct tipc_msg *msg = buf_msg(buf);
  426. struct tipc_msg ohdr;
  427. uint rdsz = min_t(uint, msg_data_sz(msg), MAX_FORWARD_SIZE);
  428. if (skb_linearize(buf))
  429. goto exit;
  430. msg = buf_msg(buf);
  431. if (msg_dest_droppable(msg))
  432. goto exit;
  433. if (msg_errcode(msg))
  434. goto exit;
  435. memcpy(&ohdr, msg, msg_hdr_sz(msg));
  436. msg_set_errcode(msg, err);
  437. msg_set_origport(msg, msg_destport(&ohdr));
  438. msg_set_destport(msg, msg_origport(&ohdr));
  439. msg_set_prevnode(msg, own_addr);
  440. if (!msg_short(msg)) {
  441. msg_set_orignode(msg, msg_destnode(&ohdr));
  442. msg_set_destnode(msg, msg_orignode(&ohdr));
  443. }
  444. msg_set_size(msg, msg_hdr_sz(msg) + rdsz);
  445. skb_trim(buf, msg_size(msg));
  446. skb_orphan(buf);
  447. *dnode = msg_orignode(&ohdr);
  448. return true;
  449. exit:
  450. kfree_skb(buf);
  451. *dnode = 0;
  452. return false;
  453. }
  454. /**
  455. * tipc_msg_lookup_dest(): try to find new destination for named message
  456. * @skb: the buffer containing the message.
  457. * @dnode: return value: next-hop node, if destination found
  458. * @err: return value: error code to use, if message to be rejected
  459. * Does not consume buffer
  460. * Returns true if a destination is found, false otherwise
  461. */
  462. bool tipc_msg_lookup_dest(struct net *net, struct sk_buff *skb,
  463. u32 *dnode, int *err)
  464. {
  465. struct tipc_msg *msg = buf_msg(skb);
  466. u32 dport;
  467. if (!msg_isdata(msg))
  468. return false;
  469. if (!msg_named(msg))
  470. return false;
  471. *err = -TIPC_ERR_NO_NAME;
  472. if (skb_linearize(skb))
  473. return false;
  474. if (msg_reroute_cnt(msg) > 0)
  475. return false;
  476. *dnode = addr_domain(net, msg_lookup_scope(msg));
  477. dport = tipc_nametbl_translate(net, msg_nametype(msg),
  478. msg_nameinst(msg), dnode);
  479. if (!dport)
  480. return false;
  481. msg_incr_reroute_cnt(msg);
  482. msg_set_destnode(msg, *dnode);
  483. msg_set_destport(msg, dport);
  484. *err = TIPC_OK;
  485. return true;
  486. }
  487. /* tipc_msg_reassemble() - clone a buffer chain of fragments and
  488. * reassemble the clones into one message
  489. */
  490. struct sk_buff *tipc_msg_reassemble(struct sk_buff_head *list)
  491. {
  492. struct sk_buff *skb;
  493. struct sk_buff *frag = NULL;
  494. struct sk_buff *head = NULL;
  495. int hdr_sz;
  496. /* Copy header if single buffer */
  497. if (skb_queue_len(list) == 1) {
  498. skb = skb_peek(list);
  499. hdr_sz = skb_headroom(skb) + msg_hdr_sz(buf_msg(skb));
  500. return __pskb_copy(skb, hdr_sz, GFP_ATOMIC);
  501. }
  502. /* Clone all fragments and reassemble */
  503. skb_queue_walk(list, skb) {
  504. frag = skb_clone(skb, GFP_ATOMIC);
  505. if (!frag)
  506. goto error;
  507. frag->next = NULL;
  508. if (tipc_buf_append(&head, &frag))
  509. break;
  510. if (!head)
  511. goto error;
  512. }
  513. return frag;
  514. error:
  515. pr_warn("Failed do clone local mcast rcv buffer\n");
  516. kfree_skb(head);
  517. return NULL;
  518. }