channel.c 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938
  1. /*
  2. * Copyright (c) 2009, Microsoft Corporation.
  3. *
  4. * This program is free software; you can redistribute it and/or modify it
  5. * under the terms and conditions of the GNU General Public License,
  6. * version 2, as published by the Free Software Foundation.
  7. *
  8. * This program is distributed in the hope it will be useful, but WITHOUT
  9. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  10. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  11. * more details.
  12. *
  13. * You should have received a copy of the GNU General Public License along with
  14. * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
  15. * Place - Suite 330, Boston, MA 02111-1307 USA.
  16. *
  17. * Authors:
  18. * Haiyang Zhang <haiyangz@microsoft.com>
  19. * Hank Janssen <hjanssen@microsoft.com>
  20. */
  21. #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  22. #include <linux/kernel.h>
  23. #include <linux/sched.h>
  24. #include <linux/wait.h>
  25. #include <linux/mm.h>
  26. #include <linux/slab.h>
  27. #include <linux/module.h>
  28. #include <linux/hyperv.h>
  29. #include <linux/uio.h>
  30. #include <linux/interrupt.h>
  31. #include <asm/page.h>
  32. #include "hyperv_vmbus.h"
  33. #define NUM_PAGES_SPANNED(addr, len) \
  34. ((PAGE_ALIGN(addr + len) >> PAGE_SHIFT) - (addr >> PAGE_SHIFT))
  35. static unsigned long virt_to_hvpfn(void *addr)
  36. {
  37. unsigned long paddr;
  38. if (is_vmalloc_addr(addr))
  39. paddr = page_to_phys(vmalloc_to_page(addr)) +
  40. offset_in_page(addr);
  41. else
  42. paddr = __pa(addr);
  43. return paddr >> PAGE_SHIFT;
  44. }
  45. /*
  46. * vmbus_setevent- Trigger an event notification on the specified
  47. * channel.
  48. */
  49. void vmbus_setevent(struct vmbus_channel *channel)
  50. {
  51. struct hv_monitor_page *monitorpage;
  52. trace_vmbus_setevent(channel);
  53. /*
  54. * For channels marked as in "low latency" mode
  55. * bypass the monitor page mechanism.
  56. */
  57. if (channel->offermsg.monitor_allocated && !channel->low_latency) {
  58. vmbus_send_interrupt(channel->offermsg.child_relid);
  59. /* Get the child to parent monitor page */
  60. monitorpage = vmbus_connection.monitor_pages[1];
  61. sync_set_bit(channel->monitor_bit,
  62. (unsigned long *)&monitorpage->trigger_group
  63. [channel->monitor_grp].pending);
  64. } else {
  65. vmbus_set_event(channel);
  66. }
  67. }
  68. EXPORT_SYMBOL_GPL(vmbus_setevent);
  69. /* vmbus_free_ring - drop mapping of ring buffer */
  70. void vmbus_free_ring(struct vmbus_channel *channel)
  71. {
  72. hv_ringbuffer_cleanup(&channel->outbound);
  73. hv_ringbuffer_cleanup(&channel->inbound);
  74. if (channel->ringbuffer_page) {
  75. __free_pages(channel->ringbuffer_page,
  76. get_order(channel->ringbuffer_pagecount
  77. << PAGE_SHIFT));
  78. channel->ringbuffer_page = NULL;
  79. }
  80. }
  81. EXPORT_SYMBOL_GPL(vmbus_free_ring);
  82. /* vmbus_alloc_ring - allocate and map pages for ring buffer */
  83. int vmbus_alloc_ring(struct vmbus_channel *newchannel,
  84. u32 send_size, u32 recv_size)
  85. {
  86. struct page *page;
  87. int order;
  88. if (send_size % PAGE_SIZE || recv_size % PAGE_SIZE)
  89. return -EINVAL;
  90. /* Allocate the ring buffer */
  91. order = get_order(send_size + recv_size);
  92. page = alloc_pages_node(cpu_to_node(newchannel->target_cpu),
  93. GFP_KERNEL|__GFP_ZERO, order);
  94. if (!page)
  95. page = alloc_pages(GFP_KERNEL|__GFP_ZERO, order);
  96. if (!page)
  97. return -ENOMEM;
  98. newchannel->ringbuffer_page = page;
  99. newchannel->ringbuffer_pagecount = (send_size + recv_size) >> PAGE_SHIFT;
  100. newchannel->ringbuffer_send_offset = send_size >> PAGE_SHIFT;
  101. return 0;
  102. }
  103. EXPORT_SYMBOL_GPL(vmbus_alloc_ring);
  104. static int __vmbus_open(struct vmbus_channel *newchannel,
  105. void *userdata, u32 userdatalen,
  106. void (*onchannelcallback)(void *context), void *context)
  107. {
  108. struct vmbus_channel_open_channel *open_msg;
  109. struct vmbus_channel_msginfo *open_info = NULL;
  110. struct page *page = newchannel->ringbuffer_page;
  111. u32 send_pages, recv_pages;
  112. unsigned long flags;
  113. int err;
  114. if (userdatalen > MAX_USER_DEFINED_BYTES)
  115. return -EINVAL;
  116. send_pages = newchannel->ringbuffer_send_offset;
  117. recv_pages = newchannel->ringbuffer_pagecount - send_pages;
  118. spin_lock_irqsave(&newchannel->lock, flags);
  119. if (newchannel->state != CHANNEL_OPEN_STATE) {
  120. spin_unlock_irqrestore(&newchannel->lock, flags);
  121. return -EINVAL;
  122. }
  123. spin_unlock_irqrestore(&newchannel->lock, flags);
  124. newchannel->state = CHANNEL_OPENING_STATE;
  125. newchannel->onchannel_callback = onchannelcallback;
  126. newchannel->channel_callback_context = context;
  127. err = hv_ringbuffer_init(&newchannel->outbound, page, send_pages);
  128. if (err)
  129. goto error_clean_ring;
  130. err = hv_ringbuffer_init(&newchannel->inbound,
  131. &page[send_pages], recv_pages);
  132. if (err)
  133. goto error_clean_ring;
  134. /* Establish the gpadl for the ring buffer */
  135. newchannel->ringbuffer_gpadlhandle = 0;
  136. err = vmbus_establish_gpadl(newchannel,
  137. page_address(newchannel->ringbuffer_page),
  138. (send_pages + recv_pages) << PAGE_SHIFT,
  139. &newchannel->ringbuffer_gpadlhandle);
  140. if (err)
  141. goto error_clean_ring;
  142. /* Create and init the channel open message */
  143. open_info = kmalloc(sizeof(*open_info) +
  144. sizeof(struct vmbus_channel_open_channel),
  145. GFP_KERNEL);
  146. if (!open_info) {
  147. err = -ENOMEM;
  148. goto error_free_gpadl;
  149. }
  150. init_completion(&open_info->waitevent);
  151. open_info->waiting_channel = newchannel;
  152. open_msg = (struct vmbus_channel_open_channel *)open_info->msg;
  153. open_msg->header.msgtype = CHANNELMSG_OPENCHANNEL;
  154. open_msg->openid = newchannel->offermsg.child_relid;
  155. open_msg->child_relid = newchannel->offermsg.child_relid;
  156. open_msg->ringbuffer_gpadlhandle = newchannel->ringbuffer_gpadlhandle;
  157. open_msg->downstream_ringbuffer_pageoffset = newchannel->ringbuffer_send_offset;
  158. open_msg->target_vp = newchannel->target_vp;
  159. if (userdatalen)
  160. memcpy(open_msg->userdata, userdata, userdatalen);
  161. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  162. list_add_tail(&open_info->msglistentry,
  163. &vmbus_connection.chn_msg_list);
  164. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  165. if (newchannel->rescind) {
  166. err = -ENODEV;
  167. goto error_free_info;
  168. }
  169. err = vmbus_post_msg(open_msg,
  170. sizeof(struct vmbus_channel_open_channel), true);
  171. trace_vmbus_open(open_msg, err);
  172. if (err != 0)
  173. goto error_clean_msglist;
  174. wait_for_completion(&open_info->waitevent);
  175. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  176. list_del(&open_info->msglistentry);
  177. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  178. if (newchannel->rescind) {
  179. err = -ENODEV;
  180. goto error_free_info;
  181. }
  182. if (open_info->response.open_result.status) {
  183. err = -EAGAIN;
  184. goto error_free_info;
  185. }
  186. newchannel->state = CHANNEL_OPENED_STATE;
  187. kfree(open_info);
  188. return 0;
  189. error_clean_msglist:
  190. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  191. list_del(&open_info->msglistentry);
  192. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  193. error_free_info:
  194. kfree(open_info);
  195. error_free_gpadl:
  196. vmbus_teardown_gpadl(newchannel, newchannel->ringbuffer_gpadlhandle);
  197. newchannel->ringbuffer_gpadlhandle = 0;
  198. error_clean_ring:
  199. hv_ringbuffer_cleanup(&newchannel->outbound);
  200. hv_ringbuffer_cleanup(&newchannel->inbound);
  201. newchannel->state = CHANNEL_OPEN_STATE;
  202. return err;
  203. }
  204. /*
  205. * vmbus_connect_ring - Open the channel but reuse ring buffer
  206. */
  207. int vmbus_connect_ring(struct vmbus_channel *newchannel,
  208. void (*onchannelcallback)(void *context), void *context)
  209. {
  210. return __vmbus_open(newchannel, NULL, 0, onchannelcallback, context);
  211. }
  212. EXPORT_SYMBOL_GPL(vmbus_connect_ring);
  213. /*
  214. * vmbus_open - Open the specified channel.
  215. */
  216. int vmbus_open(struct vmbus_channel *newchannel,
  217. u32 send_ringbuffer_size, u32 recv_ringbuffer_size,
  218. void *userdata, u32 userdatalen,
  219. void (*onchannelcallback)(void *context), void *context)
  220. {
  221. int err;
  222. err = vmbus_alloc_ring(newchannel, send_ringbuffer_size,
  223. recv_ringbuffer_size);
  224. if (err)
  225. return err;
  226. err = __vmbus_open(newchannel, userdata, userdatalen,
  227. onchannelcallback, context);
  228. if (err)
  229. vmbus_free_ring(newchannel);
  230. return err;
  231. }
  232. EXPORT_SYMBOL_GPL(vmbus_open);
  233. /* Used for Hyper-V Socket: a guest client's connect() to the host */
  234. int vmbus_send_tl_connect_request(const uuid_le *shv_guest_servie_id,
  235. const uuid_le *shv_host_servie_id)
  236. {
  237. struct vmbus_channel_tl_connect_request conn_msg;
  238. int ret;
  239. memset(&conn_msg, 0, sizeof(conn_msg));
  240. conn_msg.header.msgtype = CHANNELMSG_TL_CONNECT_REQUEST;
  241. conn_msg.guest_endpoint_id = *shv_guest_servie_id;
  242. conn_msg.host_service_id = *shv_host_servie_id;
  243. ret = vmbus_post_msg(&conn_msg, sizeof(conn_msg), true);
  244. trace_vmbus_send_tl_connect_request(&conn_msg, ret);
  245. return ret;
  246. }
  247. EXPORT_SYMBOL_GPL(vmbus_send_tl_connect_request);
  248. /*
  249. * create_gpadl_header - Creates a gpadl for the specified buffer
  250. */
  251. static int create_gpadl_header(void *kbuffer, u32 size,
  252. struct vmbus_channel_msginfo **msginfo)
  253. {
  254. int i;
  255. int pagecount;
  256. struct vmbus_channel_gpadl_header *gpadl_header;
  257. struct vmbus_channel_gpadl_body *gpadl_body;
  258. struct vmbus_channel_msginfo *msgheader;
  259. struct vmbus_channel_msginfo *msgbody = NULL;
  260. u32 msgsize;
  261. int pfnsum, pfncount, pfnleft, pfncurr, pfnsize;
  262. pagecount = size >> PAGE_SHIFT;
  263. /* do we need a gpadl body msg */
  264. pfnsize = MAX_SIZE_CHANNEL_MESSAGE -
  265. sizeof(struct vmbus_channel_gpadl_header) -
  266. sizeof(struct gpa_range);
  267. pfncount = pfnsize / sizeof(u64);
  268. if (pagecount > pfncount) {
  269. /* we need a gpadl body */
  270. /* fill in the header */
  271. msgsize = sizeof(struct vmbus_channel_msginfo) +
  272. sizeof(struct vmbus_channel_gpadl_header) +
  273. sizeof(struct gpa_range) + pfncount * sizeof(u64);
  274. msgheader = kzalloc(msgsize, GFP_KERNEL);
  275. if (!msgheader)
  276. goto nomem;
  277. INIT_LIST_HEAD(&msgheader->submsglist);
  278. msgheader->msgsize = msgsize;
  279. gpadl_header = (struct vmbus_channel_gpadl_header *)
  280. msgheader->msg;
  281. gpadl_header->rangecount = 1;
  282. gpadl_header->range_buflen = sizeof(struct gpa_range) +
  283. pagecount * sizeof(u64);
  284. gpadl_header->range[0].byte_offset = 0;
  285. gpadl_header->range[0].byte_count = size;
  286. for (i = 0; i < pfncount; i++)
  287. gpadl_header->range[0].pfn_array[i] = virt_to_hvpfn(
  288. kbuffer + PAGE_SIZE * i);
  289. *msginfo = msgheader;
  290. pfnsum = pfncount;
  291. pfnleft = pagecount - pfncount;
  292. /* how many pfns can we fit */
  293. pfnsize = MAX_SIZE_CHANNEL_MESSAGE -
  294. sizeof(struct vmbus_channel_gpadl_body);
  295. pfncount = pfnsize / sizeof(u64);
  296. /* fill in the body */
  297. while (pfnleft) {
  298. if (pfnleft > pfncount)
  299. pfncurr = pfncount;
  300. else
  301. pfncurr = pfnleft;
  302. msgsize = sizeof(struct vmbus_channel_msginfo) +
  303. sizeof(struct vmbus_channel_gpadl_body) +
  304. pfncurr * sizeof(u64);
  305. msgbody = kzalloc(msgsize, GFP_KERNEL);
  306. if (!msgbody) {
  307. struct vmbus_channel_msginfo *pos = NULL;
  308. struct vmbus_channel_msginfo *tmp = NULL;
  309. /*
  310. * Free up all the allocated messages.
  311. */
  312. list_for_each_entry_safe(pos, tmp,
  313. &msgheader->submsglist,
  314. msglistentry) {
  315. list_del(&pos->msglistentry);
  316. kfree(pos);
  317. }
  318. goto nomem;
  319. }
  320. msgbody->msgsize = msgsize;
  321. gpadl_body =
  322. (struct vmbus_channel_gpadl_body *)msgbody->msg;
  323. /*
  324. * Gpadl is u32 and we are using a pointer which could
  325. * be 64-bit
  326. * This is governed by the guest/host protocol and
  327. * so the hypervisor guarantees that this is ok.
  328. */
  329. for (i = 0; i < pfncurr; i++)
  330. gpadl_body->pfn[i] = virt_to_hvpfn(
  331. kbuffer + PAGE_SIZE * (pfnsum + i));
  332. /* add to msg header */
  333. list_add_tail(&msgbody->msglistentry,
  334. &msgheader->submsglist);
  335. pfnsum += pfncurr;
  336. pfnleft -= pfncurr;
  337. }
  338. } else {
  339. /* everything fits in a header */
  340. msgsize = sizeof(struct vmbus_channel_msginfo) +
  341. sizeof(struct vmbus_channel_gpadl_header) +
  342. sizeof(struct gpa_range) + pagecount * sizeof(u64);
  343. msgheader = kzalloc(msgsize, GFP_KERNEL);
  344. if (msgheader == NULL)
  345. goto nomem;
  346. INIT_LIST_HEAD(&msgheader->submsglist);
  347. msgheader->msgsize = msgsize;
  348. gpadl_header = (struct vmbus_channel_gpadl_header *)
  349. msgheader->msg;
  350. gpadl_header->rangecount = 1;
  351. gpadl_header->range_buflen = sizeof(struct gpa_range) +
  352. pagecount * sizeof(u64);
  353. gpadl_header->range[0].byte_offset = 0;
  354. gpadl_header->range[0].byte_count = size;
  355. for (i = 0; i < pagecount; i++)
  356. gpadl_header->range[0].pfn_array[i] = virt_to_hvpfn(
  357. kbuffer + PAGE_SIZE * i);
  358. *msginfo = msgheader;
  359. }
  360. return 0;
  361. nomem:
  362. kfree(msgheader);
  363. kfree(msgbody);
  364. return -ENOMEM;
  365. }
  366. /*
  367. * vmbus_establish_gpadl - Establish a GPADL for the specified buffer
  368. *
  369. * @channel: a channel
  370. * @kbuffer: from kmalloc or vmalloc
  371. * @size: page-size multiple
  372. * @gpadl_handle: some funky thing
  373. */
  374. int vmbus_establish_gpadl(struct vmbus_channel *channel, void *kbuffer,
  375. u32 size, u32 *gpadl_handle)
  376. {
  377. struct vmbus_channel_gpadl_header *gpadlmsg;
  378. struct vmbus_channel_gpadl_body *gpadl_body;
  379. struct vmbus_channel_msginfo *msginfo = NULL;
  380. struct vmbus_channel_msginfo *submsginfo, *tmp;
  381. struct list_head *curr;
  382. u32 next_gpadl_handle;
  383. unsigned long flags;
  384. int ret = 0;
  385. next_gpadl_handle =
  386. (atomic_inc_return(&vmbus_connection.next_gpadl_handle) - 1);
  387. ret = create_gpadl_header(kbuffer, size, &msginfo);
  388. if (ret)
  389. return ret;
  390. init_completion(&msginfo->waitevent);
  391. msginfo->waiting_channel = channel;
  392. gpadlmsg = (struct vmbus_channel_gpadl_header *)msginfo->msg;
  393. gpadlmsg->header.msgtype = CHANNELMSG_GPADL_HEADER;
  394. gpadlmsg->child_relid = channel->offermsg.child_relid;
  395. gpadlmsg->gpadl = next_gpadl_handle;
  396. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  397. list_add_tail(&msginfo->msglistentry,
  398. &vmbus_connection.chn_msg_list);
  399. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  400. if (channel->rescind) {
  401. ret = -ENODEV;
  402. goto cleanup;
  403. }
  404. ret = vmbus_post_msg(gpadlmsg, msginfo->msgsize -
  405. sizeof(*msginfo), true);
  406. trace_vmbus_establish_gpadl_header(gpadlmsg, ret);
  407. if (ret != 0)
  408. goto cleanup;
  409. list_for_each(curr, &msginfo->submsglist) {
  410. submsginfo = (struct vmbus_channel_msginfo *)curr;
  411. gpadl_body =
  412. (struct vmbus_channel_gpadl_body *)submsginfo->msg;
  413. gpadl_body->header.msgtype =
  414. CHANNELMSG_GPADL_BODY;
  415. gpadl_body->gpadl = next_gpadl_handle;
  416. ret = vmbus_post_msg(gpadl_body,
  417. submsginfo->msgsize - sizeof(*submsginfo),
  418. true);
  419. trace_vmbus_establish_gpadl_body(gpadl_body, ret);
  420. if (ret != 0)
  421. goto cleanup;
  422. }
  423. wait_for_completion(&msginfo->waitevent);
  424. if (msginfo->response.gpadl_created.creation_status != 0) {
  425. pr_err("Failed to establish GPADL: err = 0x%x\n",
  426. msginfo->response.gpadl_created.creation_status);
  427. ret = -EDQUOT;
  428. goto cleanup;
  429. }
  430. if (channel->rescind) {
  431. ret = -ENODEV;
  432. goto cleanup;
  433. }
  434. /* At this point, we received the gpadl created msg */
  435. *gpadl_handle = gpadlmsg->gpadl;
  436. cleanup:
  437. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  438. list_del(&msginfo->msglistentry);
  439. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  440. list_for_each_entry_safe(submsginfo, tmp, &msginfo->submsglist,
  441. msglistentry) {
  442. kfree(submsginfo);
  443. }
  444. kfree(msginfo);
  445. return ret;
  446. }
  447. EXPORT_SYMBOL_GPL(vmbus_establish_gpadl);
  448. /*
  449. * vmbus_teardown_gpadl -Teardown the specified GPADL handle
  450. */
  451. int vmbus_teardown_gpadl(struct vmbus_channel *channel, u32 gpadl_handle)
  452. {
  453. struct vmbus_channel_gpadl_teardown *msg;
  454. struct vmbus_channel_msginfo *info;
  455. unsigned long flags;
  456. int ret;
  457. info = kmalloc(sizeof(*info) +
  458. sizeof(struct vmbus_channel_gpadl_teardown), GFP_KERNEL);
  459. if (!info)
  460. return -ENOMEM;
  461. init_completion(&info->waitevent);
  462. info->waiting_channel = channel;
  463. msg = (struct vmbus_channel_gpadl_teardown *)info->msg;
  464. msg->header.msgtype = CHANNELMSG_GPADL_TEARDOWN;
  465. msg->child_relid = channel->offermsg.child_relid;
  466. msg->gpadl = gpadl_handle;
  467. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  468. list_add_tail(&info->msglistentry,
  469. &vmbus_connection.chn_msg_list);
  470. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  471. if (channel->rescind)
  472. goto post_msg_err;
  473. ret = vmbus_post_msg(msg, sizeof(struct vmbus_channel_gpadl_teardown),
  474. true);
  475. trace_vmbus_teardown_gpadl(msg, ret);
  476. if (ret)
  477. goto post_msg_err;
  478. wait_for_completion(&info->waitevent);
  479. post_msg_err:
  480. /*
  481. * If the channel has been rescinded;
  482. * we will be awakened by the rescind
  483. * handler; set the error code to zero so we don't leak memory.
  484. */
  485. if (channel->rescind)
  486. ret = 0;
  487. spin_lock_irqsave(&vmbus_connection.channelmsg_lock, flags);
  488. list_del(&info->msglistentry);
  489. spin_unlock_irqrestore(&vmbus_connection.channelmsg_lock, flags);
  490. kfree(info);
  491. return ret;
  492. }
  493. EXPORT_SYMBOL_GPL(vmbus_teardown_gpadl);
  494. static void reset_channel_cb(void *arg)
  495. {
  496. struct vmbus_channel *channel = arg;
  497. channel->onchannel_callback = NULL;
  498. }
  499. void vmbus_reset_channel_cb(struct vmbus_channel *channel)
  500. {
  501. /*
  502. * vmbus_on_event(), running in the per-channel tasklet, can race
  503. * with vmbus_close_internal() in the case of SMP guest, e.g., when
  504. * the former is accessing channel->inbound.ring_buffer, the latter
  505. * could be freeing the ring_buffer pages, so here we must stop it
  506. * first.
  507. */
  508. tasklet_disable(&channel->callback_event);
  509. channel->sc_creation_callback = NULL;
  510. /* Stop the callback asap */
  511. if (channel->target_cpu != get_cpu()) {
  512. put_cpu();
  513. smp_call_function_single(channel->target_cpu, reset_channel_cb,
  514. channel, true);
  515. } else {
  516. reset_channel_cb(channel);
  517. put_cpu();
  518. }
  519. /* Re-enable tasklet for use on re-open */
  520. tasklet_enable(&channel->callback_event);
  521. }
  522. static int vmbus_close_internal(struct vmbus_channel *channel)
  523. {
  524. struct vmbus_channel_close_channel *msg;
  525. int ret;
  526. vmbus_reset_channel_cb(channel);
  527. /*
  528. * In case a device driver's probe() fails (e.g.,
  529. * util_probe() -> vmbus_open() returns -ENOMEM) and the device is
  530. * rescinded later (e.g., we dynamically disable an Integrated Service
  531. * in Hyper-V Manager), the driver's remove() invokes vmbus_close():
  532. * here we should skip most of the below cleanup work.
  533. */
  534. if (channel->state != CHANNEL_OPENED_STATE)
  535. return -EINVAL;
  536. channel->state = CHANNEL_OPEN_STATE;
  537. /* Send a closing message */
  538. msg = &channel->close_msg.msg;
  539. msg->header.msgtype = CHANNELMSG_CLOSECHANNEL;
  540. msg->child_relid = channel->offermsg.child_relid;
  541. ret = vmbus_post_msg(msg, sizeof(struct vmbus_channel_close_channel),
  542. true);
  543. trace_vmbus_close_internal(msg, ret);
  544. if (ret) {
  545. pr_err("Close failed: close post msg return is %d\n", ret);
  546. /*
  547. * If we failed to post the close msg,
  548. * it is perhaps better to leak memory.
  549. */
  550. }
  551. /* Tear down the gpadl for the channel's ring buffer */
  552. else if (channel->ringbuffer_gpadlhandle) {
  553. ret = vmbus_teardown_gpadl(channel,
  554. channel->ringbuffer_gpadlhandle);
  555. if (ret) {
  556. pr_err("Close failed: teardown gpadl return %d\n", ret);
  557. /*
  558. * If we failed to teardown gpadl,
  559. * it is perhaps better to leak memory.
  560. */
  561. }
  562. channel->ringbuffer_gpadlhandle = 0;
  563. }
  564. return ret;
  565. }
  566. /* disconnect ring - close all channels */
  567. int vmbus_disconnect_ring(struct vmbus_channel *channel)
  568. {
  569. struct vmbus_channel *cur_channel, *tmp;
  570. unsigned long flags;
  571. LIST_HEAD(list);
  572. int ret;
  573. if (channel->primary_channel != NULL)
  574. return -EINVAL;
  575. /* Snapshot the list of subchannels */
  576. spin_lock_irqsave(&channel->lock, flags);
  577. list_splice_init(&channel->sc_list, &list);
  578. channel->num_sc = 0;
  579. spin_unlock_irqrestore(&channel->lock, flags);
  580. list_for_each_entry_safe(cur_channel, tmp, &list, sc_list) {
  581. if (cur_channel->rescind)
  582. wait_for_completion(&cur_channel->rescind_event);
  583. mutex_lock(&vmbus_connection.channel_mutex);
  584. if (vmbus_close_internal(cur_channel) == 0) {
  585. vmbus_free_ring(cur_channel);
  586. if (cur_channel->rescind)
  587. hv_process_channel_removal(cur_channel);
  588. }
  589. mutex_unlock(&vmbus_connection.channel_mutex);
  590. }
  591. /*
  592. * Now close the primary.
  593. */
  594. mutex_lock(&vmbus_connection.channel_mutex);
  595. ret = vmbus_close_internal(channel);
  596. mutex_unlock(&vmbus_connection.channel_mutex);
  597. return ret;
  598. }
  599. EXPORT_SYMBOL_GPL(vmbus_disconnect_ring);
  600. /*
  601. * vmbus_close - Close the specified channel
  602. */
  603. void vmbus_close(struct vmbus_channel *channel)
  604. {
  605. if (vmbus_disconnect_ring(channel) == 0)
  606. vmbus_free_ring(channel);
  607. }
  608. EXPORT_SYMBOL_GPL(vmbus_close);
  609. /**
  610. * vmbus_sendpacket() - Send the specified buffer on the given channel
  611. * @channel: Pointer to vmbus_channel structure
  612. * @buffer: Pointer to the buffer you want to send the data from.
  613. * @bufferlen: Maximum size of what the buffer holds.
  614. * @requestid: Identifier of the request
  615. * @type: Type of packet that is being sent e.g. negotiate, time
  616. * packet etc.
  617. * @flags: 0 or VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED
  618. *
  619. * Sends data in @buffer directly to Hyper-V via the vmbus.
  620. * This will send the data unparsed to Hyper-V.
  621. *
  622. * Mainly used by Hyper-V drivers.
  623. */
  624. int vmbus_sendpacket(struct vmbus_channel *channel, void *buffer,
  625. u32 bufferlen, u64 requestid,
  626. enum vmbus_packet_type type, u32 flags)
  627. {
  628. struct vmpacket_descriptor desc;
  629. u32 packetlen = sizeof(struct vmpacket_descriptor) + bufferlen;
  630. u32 packetlen_aligned = ALIGN(packetlen, sizeof(u64));
  631. struct kvec bufferlist[3];
  632. u64 aligned_data = 0;
  633. int num_vecs = ((bufferlen != 0) ? 3 : 1);
  634. /* Setup the descriptor */
  635. desc.type = type; /* VmbusPacketTypeDataInBand; */
  636. desc.flags = flags; /* VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED; */
  637. /* in 8-bytes granularity */
  638. desc.offset8 = sizeof(struct vmpacket_descriptor) >> 3;
  639. desc.len8 = (u16)(packetlen_aligned >> 3);
  640. desc.trans_id = requestid;
  641. bufferlist[0].iov_base = &desc;
  642. bufferlist[0].iov_len = sizeof(struct vmpacket_descriptor);
  643. bufferlist[1].iov_base = buffer;
  644. bufferlist[1].iov_len = bufferlen;
  645. bufferlist[2].iov_base = &aligned_data;
  646. bufferlist[2].iov_len = (packetlen_aligned - packetlen);
  647. return hv_ringbuffer_write(channel, bufferlist, num_vecs);
  648. }
  649. EXPORT_SYMBOL(vmbus_sendpacket);
  650. /*
  651. * vmbus_sendpacket_pagebuffer - Send a range of single-page buffer
  652. * packets using a GPADL Direct packet type. This interface allows you
  653. * to control notifying the host. This will be useful for sending
  654. * batched data. Also the sender can control the send flags
  655. * explicitly.
  656. */
  657. int vmbus_sendpacket_pagebuffer(struct vmbus_channel *channel,
  658. struct hv_page_buffer pagebuffers[],
  659. u32 pagecount, void *buffer, u32 bufferlen,
  660. u64 requestid)
  661. {
  662. int i;
  663. struct vmbus_channel_packet_page_buffer desc;
  664. u32 descsize;
  665. u32 packetlen;
  666. u32 packetlen_aligned;
  667. struct kvec bufferlist[3];
  668. u64 aligned_data = 0;
  669. if (pagecount > MAX_PAGE_BUFFER_COUNT)
  670. return -EINVAL;
  671. /*
  672. * Adjust the size down since vmbus_channel_packet_page_buffer is the
  673. * largest size we support
  674. */
  675. descsize = sizeof(struct vmbus_channel_packet_page_buffer) -
  676. ((MAX_PAGE_BUFFER_COUNT - pagecount) *
  677. sizeof(struct hv_page_buffer));
  678. packetlen = descsize + bufferlen;
  679. packetlen_aligned = ALIGN(packetlen, sizeof(u64));
  680. /* Setup the descriptor */
  681. desc.type = VM_PKT_DATA_USING_GPA_DIRECT;
  682. desc.flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED;
  683. desc.dataoffset8 = descsize >> 3; /* in 8-bytes granularity */
  684. desc.length8 = (u16)(packetlen_aligned >> 3);
  685. desc.transactionid = requestid;
  686. desc.reserved = 0;
  687. desc.rangecount = pagecount;
  688. for (i = 0; i < pagecount; i++) {
  689. desc.range[i].len = pagebuffers[i].len;
  690. desc.range[i].offset = pagebuffers[i].offset;
  691. desc.range[i].pfn = pagebuffers[i].pfn;
  692. }
  693. bufferlist[0].iov_base = &desc;
  694. bufferlist[0].iov_len = descsize;
  695. bufferlist[1].iov_base = buffer;
  696. bufferlist[1].iov_len = bufferlen;
  697. bufferlist[2].iov_base = &aligned_data;
  698. bufferlist[2].iov_len = (packetlen_aligned - packetlen);
  699. return hv_ringbuffer_write(channel, bufferlist, 3);
  700. }
  701. EXPORT_SYMBOL_GPL(vmbus_sendpacket_pagebuffer);
  702. /*
  703. * vmbus_sendpacket_multipagebuffer - Send a multi-page buffer packet
  704. * using a GPADL Direct packet type.
  705. * The buffer includes the vmbus descriptor.
  706. */
  707. int vmbus_sendpacket_mpb_desc(struct vmbus_channel *channel,
  708. struct vmbus_packet_mpb_array *desc,
  709. u32 desc_size,
  710. void *buffer, u32 bufferlen, u64 requestid)
  711. {
  712. u32 packetlen;
  713. u32 packetlen_aligned;
  714. struct kvec bufferlist[3];
  715. u64 aligned_data = 0;
  716. packetlen = desc_size + bufferlen;
  717. packetlen_aligned = ALIGN(packetlen, sizeof(u64));
  718. /* Setup the descriptor */
  719. desc->type = VM_PKT_DATA_USING_GPA_DIRECT;
  720. desc->flags = VMBUS_DATA_PACKET_FLAG_COMPLETION_REQUESTED;
  721. desc->dataoffset8 = desc_size >> 3; /* in 8-bytes granularity */
  722. desc->length8 = (u16)(packetlen_aligned >> 3);
  723. desc->transactionid = requestid;
  724. desc->reserved = 0;
  725. desc->rangecount = 1;
  726. bufferlist[0].iov_base = desc;
  727. bufferlist[0].iov_len = desc_size;
  728. bufferlist[1].iov_base = buffer;
  729. bufferlist[1].iov_len = bufferlen;
  730. bufferlist[2].iov_base = &aligned_data;
  731. bufferlist[2].iov_len = (packetlen_aligned - packetlen);
  732. return hv_ringbuffer_write(channel, bufferlist, 3);
  733. }
  734. EXPORT_SYMBOL_GPL(vmbus_sendpacket_mpb_desc);
  735. /**
  736. * __vmbus_recvpacket() - Retrieve the user packet on the specified channel
  737. * @channel: Pointer to vmbus_channel structure
  738. * @buffer: Pointer to the buffer you want to receive the data into.
  739. * @bufferlen: Maximum size of what the buffer can hold.
  740. * @buffer_actual_len: The actual size of the data after it was received.
  741. * @requestid: Identifier of the request
  742. * @raw: true means keep the vmpacket_descriptor header in the received data.
  743. *
  744. * Receives directly from the hyper-v vmbus and puts the data it received
  745. * into Buffer. This will receive the data unparsed from hyper-v.
  746. *
  747. * Mainly used by Hyper-V drivers.
  748. */
  749. static inline int
  750. __vmbus_recvpacket(struct vmbus_channel *channel, void *buffer,
  751. u32 bufferlen, u32 *buffer_actual_len, u64 *requestid,
  752. bool raw)
  753. {
  754. return hv_ringbuffer_read(channel, buffer, bufferlen,
  755. buffer_actual_len, requestid, raw);
  756. }
  757. int vmbus_recvpacket(struct vmbus_channel *channel, void *buffer,
  758. u32 bufferlen, u32 *buffer_actual_len,
  759. u64 *requestid)
  760. {
  761. return __vmbus_recvpacket(channel, buffer, bufferlen,
  762. buffer_actual_len, requestid, false);
  763. }
  764. EXPORT_SYMBOL(vmbus_recvpacket);
  765. /*
  766. * vmbus_recvpacket_raw - Retrieve the raw packet on the specified channel
  767. */
  768. int vmbus_recvpacket_raw(struct vmbus_channel *channel, void *buffer,
  769. u32 bufferlen, u32 *buffer_actual_len,
  770. u64 *requestid)
  771. {
  772. return __vmbus_recvpacket(channel, buffer, bufferlen,
  773. buffer_actual_len, requestid, true);
  774. }
  775. EXPORT_SYMBOL_GPL(vmbus_recvpacket_raw);