/* sunvnet.c: Sun LDOM Virtual Network Driver.
 *
 * Copyright (C) 2007, 2008 David S. Miller <davem@davemloft.net>
 */

#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

#include <linux/module.h>
#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/slab.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/netdevice.h>
#include <linux/ethtool.h>
#include <linux/etherdevice.h>
#include <linux/mutex.h>
#include <linux/if_vlan.h>

#include <asm/vio.h>
#include <asm/ldc.h>

#include "sunvnet.h"

#define DRV_MODULE_NAME		"sunvnet"
#define DRV_MODULE_VERSION	"1.0"
#define DRV_MODULE_RELDATE	"June 25, 2007"

static char version[] =
	DRV_MODULE_NAME ".c:v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
MODULE_AUTHOR("David S. Miller (davem@davemloft.net)");
MODULE_DESCRIPTION("Sun LDOM virtual network driver");
MODULE_LICENSE("GPL");
MODULE_VERSION(DRV_MODULE_VERSION);

/* Heuristic for the number of times to exponentially backoff and
 * retry sending an LDC trigger when EAGAIN is encountered
 */
#define VNET_MAX_RETRIES	10

static int __vnet_tx_trigger(struct vnet_port *port, u32 start);

/* Ordered from largest major to lowest */
static struct vio_version vnet_versions[] = {
	{ .major = 1, .minor = 6 },
	{ .major = 1, .minor = 0 },
};

static inline u32 vnet_tx_dring_avail(struct vio_dring_state *dr)
{
	return vio_dring_avail(dr, VNET_TX_RING_SIZE);
}
static int vnet_handle_unknown(struct vnet_port *port, void *arg)
{
	struct vio_msg_tag *pkt = arg;

	pr_err("Received unknown msg [%02x:%02x:%04x:%08x]\n",
	       pkt->type, pkt->stype, pkt->stype_env, pkt->sid);
	pr_err("Resetting connection\n");

	ldc_disconnect(port->vio.lp);

	return -ECONNRESET;
}
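
/* Build and send our ATTR INFO packet to the peer as part of the VIO
 * handshake.  The transfer mode, MTU, and options advertised here depend
 * on the VIO protocol version negotiated for this port.
 */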
static int vnet_send_attr(struct vio_driver_state *vio)
{
	struct vnet_port *port = to_vnet_port(vio);
	struct net_device *dev = port->vp->dev;
	struct vio_net_attr_info pkt;
	int framelen = ETH_FRAME_LEN;
	int i;

	memset(&pkt, 0, sizeof(pkt));
	pkt.tag.type = VIO_TYPE_CTRL;
	pkt.tag.stype = VIO_SUBTYPE_INFO;
	pkt.tag.stype_env = VIO_ATTR_INFO;
	pkt.tag.sid = vio_send_sid(vio);
	if (vio_version_before(vio, 1, 2))
		pkt.xfer_mode = VIO_DRING_MODE;
	else
		pkt.xfer_mode = VIO_NEW_DRING_MODE;
	pkt.addr_type = VNET_ADDR_ETHERMAC;
	pkt.ack_freq = 0;
	for (i = 0; i < 6; i++)
		pkt.addr |= (u64)dev->dev_addr[i] << ((5 - i) * 8);
	if (vio_version_after(vio, 1, 3)) {
		if (port->rmtu) {
			port->rmtu = min(VNET_MAXPACKET, port->rmtu);
			pkt.mtu = port->rmtu;
		} else {
			port->rmtu = VNET_MAXPACKET;
			pkt.mtu = port->rmtu;
		}
		if (vio_version_after_eq(vio, 1, 6))
			pkt.options = VIO_TX_DRING;
	} else if (vio_version_before(vio, 1, 3)) {
		pkt.mtu = framelen;
	} else { /* v1.3 */
		pkt.mtu = framelen + VLAN_HLEN;
	}

	pkt.plnk_updt = PHYSLINK_UPDATE_NONE;
	pkt.cflags = 0;

	viodbg(HS, "SEND NET ATTR xmode[0x%x] atype[0x%x] addr[%llx] "
	       "ackfreq[%u] plnk_updt[0x%02x] opts[0x%02x] mtu[%llu] "
	       "cflags[0x%04x] lso_max[%u]\n",
	       pkt.xfer_mode, pkt.addr_type,
	       (unsigned long long)pkt.addr,
	       pkt.ack_freq, pkt.plnk_updt, pkt.options,
	       (unsigned long long)pkt.mtu, pkt.cflags, pkt.ipv4_lso_maxlen);

	return vio_ldc_send(vio, &pkt, sizeof(pkt));
}
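
/* Validate the peer's ATTR INFO and negotiate the effective MTU for this
 * port, then reply with an ACK, or a NACK (forcing a connection reset)
 * when the attributes are not acceptable.
 */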
static int handle_attr_info(struct vio_driver_state *vio,
			    struct vio_net_attr_info *pkt)
{
	struct vnet_port *port = to_vnet_port(vio);
	u64 localmtu;
	u8 xfer_mode;

	viodbg(HS, "GOT NET ATTR xmode[0x%x] atype[0x%x] addr[%llx] "
	       "ackfreq[%u] plnk_updt[0x%02x] opts[0x%02x] mtu[%llu] "
	       " (rmtu[%llu]) cflags[0x%04x] lso_max[%u]\n",
	       pkt->xfer_mode, pkt->addr_type,
	       (unsigned long long)pkt->addr,
	       pkt->ack_freq, pkt->plnk_updt, pkt->options,
	       (unsigned long long)pkt->mtu, port->rmtu, pkt->cflags,
	       pkt->ipv4_lso_maxlen);

	pkt->tag.sid = vio_send_sid(vio);

	xfer_mode = pkt->xfer_mode;
	/* for version < 1.2, VIO_DRING_MODE = 0x3 and no bitmask */
	if (vio_version_before(vio, 1, 2) && xfer_mode == VIO_DRING_MODE)
		xfer_mode = VIO_NEW_DRING_MODE;

	/* MTU negotiation:
	 *	< v1.3 - ETH_FRAME_LEN exactly
	 *	> v1.3 - MIN(pkt.mtu, VNET_MAXPACKET, port->rmtu) and change
	 *		 pkt->mtu for ACK
	 *	= v1.3 - ETH_FRAME_LEN + VLAN_HLEN exactly
	 */
	if (vio_version_before(vio, 1, 3)) {
		localmtu = ETH_FRAME_LEN;
	} else if (vio_version_after(vio, 1, 3)) {
		localmtu = port->rmtu ? port->rmtu : VNET_MAXPACKET;
		localmtu = min(pkt->mtu, localmtu);
		pkt->mtu = localmtu;
	} else { /* v1.3 */
		localmtu = ETH_FRAME_LEN + VLAN_HLEN;
	}
	port->rmtu = localmtu;

	/* for version >= 1.6, ACK packet mode we support */
	if (vio_version_after_eq(vio, 1, 6)) {
		pkt->xfer_mode = VIO_NEW_DRING_MODE;
		pkt->options = VIO_TX_DRING;
	}

	if (!(xfer_mode | VIO_NEW_DRING_MODE) ||
	    pkt->addr_type != VNET_ADDR_ETHERMAC ||
	    pkt->mtu != localmtu) {
		viodbg(HS, "SEND NET ATTR NACK\n");

		pkt->tag.stype = VIO_SUBTYPE_NACK;

		(void) vio_ldc_send(vio, pkt, sizeof(*pkt));

		return -ECONNRESET;
	} else {
		viodbg(HS, "SEND NET ATTR ACK xmode[0x%x] atype[0x%x] "
		       "addr[%llx] ackfreq[%u] plnk_updt[0x%02x] opts[0x%02x] "
		       "mtu[%llu] (rmtu[%llu]) cflags[0x%04x] lso_max[%u]\n",
		       pkt->xfer_mode, pkt->addr_type,
		       (unsigned long long)pkt->addr,
		       pkt->ack_freq, pkt->plnk_updt, pkt->options,
		       (unsigned long long)pkt->mtu, port->rmtu, pkt->cflags,
		       pkt->ipv4_lso_maxlen);

		pkt->tag.stype = VIO_SUBTYPE_ACK;

		return vio_ldc_send(vio, pkt, sizeof(*pkt));
	}
}
static int handle_attr_ack(struct vio_driver_state *vio,
			   struct vio_net_attr_info *pkt)
{
	viodbg(HS, "GOT NET ATTR ACK\n");

	return 0;
}

static int handle_attr_nack(struct vio_driver_state *vio,
			    struct vio_net_attr_info *pkt)
{
	viodbg(HS, "GOT NET ATTR NACK\n");

	return -ECONNRESET;
}

static int vnet_handle_attr(struct vio_driver_state *vio, void *arg)
{
	struct vio_net_attr_info *pkt = arg;

	switch (pkt->tag.stype) {
	case VIO_SUBTYPE_INFO:
		return handle_attr_info(vio, pkt);

	case VIO_SUBTYPE_ACK:
		return handle_attr_ack(vio, pkt);

	case VIO_SUBTYPE_NACK:
		return handle_attr_nack(vio, pkt);

	default:
		return -ECONNRESET;
	}
}

static void vnet_handshake_complete(struct vio_driver_state *vio)
{
	struct vio_dring_state *dr;

	dr = &vio->drings[VIO_DRIVER_RX_RING];
	dr->snd_nxt = dr->rcv_nxt = 1;

	dr = &vio->drings[VIO_DRIVER_TX_RING];
	dr->snd_nxt = dr->rcv_nxt = 1;
}
/* The hypervisor interface that implements copying to/from imported
 * memory from another domain requires that copies are done to 8-byte
 * aligned buffers, and that the lengths of such copies are also 8-byte
 * multiples.
 *
 * So we align skb->data to an 8-byte multiple and pad-out the data
 * area so we can round the copy length up to the next multiple of
 * 8 for the copy.
 *
 * The transmitter puts the actual start of the packet 6 bytes into
 * the buffer it sends over, so that the IP headers after the ethernet
 * header are aligned properly.  These 6 bytes are not in the descriptor
 * length, they are simply implied.  This offset is represented using
 * the VNET_PACKET_SKIP macro.
 */
static struct sk_buff *alloc_and_align_skb(struct net_device *dev,
					   unsigned int len)
{
	struct sk_buff *skb = netdev_alloc_skb(dev, len+VNET_PACKET_SKIP+8+8);
	unsigned long addr, off;

	if (unlikely(!skb))
		return NULL;

	addr = (unsigned long) skb->data;
	off = ((addr + 7UL) & ~7UL) - addr;
	if (off)
		skb_reserve(skb, off);

	return skb;
}
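
/* Receive a single packet: copy 'len' bytes from the peer's mapped buffer
 * (described by the LDC cookies) into a freshly allocated, 8-byte-aligned
 * skb and hand it to the stack via netif_rx().
 */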
static int vnet_rx_one(struct vnet_port *port, unsigned int len,
		       struct ldc_trans_cookie *cookies, int ncookies)
{
	struct net_device *dev = port->vp->dev;
	unsigned int copy_len;
	struct sk_buff *skb;
	int err;

	err = -EMSGSIZE;
	if (unlikely(len < ETH_ZLEN || len > port->rmtu)) {
		dev->stats.rx_length_errors++;
		goto out_dropped;
	}

	skb = alloc_and_align_skb(dev, len);
	err = -ENOMEM;
	if (unlikely(!skb)) {
		dev->stats.rx_missed_errors++;
		goto out_dropped;
	}

	copy_len = (len + VNET_PACKET_SKIP + 7U) & ~7U;
	skb_put(skb, copy_len);
	err = ldc_copy(port->vio.lp, LDC_COPY_IN,
		       skb->data, copy_len, 0,
		       cookies, ncookies);
	if (unlikely(err < 0)) {
		dev->stats.rx_frame_errors++;
		goto out_free_skb;
	}

	skb_pull(skb, VNET_PACKET_SKIP);
	skb_trim(skb, len);
	skb->protocol = eth_type_trans(skb, dev);

	dev->stats.rx_packets++;
	dev->stats.rx_bytes += len;

	netif_rx(skb);

	return 0;

out_free_skb:
	kfree_skb(skb);

out_dropped:
	dev->stats.rx_dropped++;
	return err;
}
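
/* Send a dring ACK for descriptors [start, end] to the peer, retrying with
 * exponential backoff while the LDC channel returns -EAGAIN.  If a STOPPED
 * ack cannot be delivered, remember that in port->stop_rx so the next TX
 * trigger can resend it.
 */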
static int vnet_send_ack(struct vnet_port *port, struct vio_dring_state *dr,
			 u32 start, u32 end, u8 vio_dring_state)
{
	struct vio_dring_data hdr = {
		.tag = {
			.type		= VIO_TYPE_DATA,
			.stype		= VIO_SUBTYPE_ACK,
			.stype_env	= VIO_DRING_DATA,
			.sid		= vio_send_sid(&port->vio),
		},
		.dring_ident	= dr->ident,
		.start_idx	= start,
		.end_idx	= end,
		.state		= vio_dring_state,
	};
	int err, delay;
	int retries = 0;

	hdr.seq = dr->snd_nxt;
	delay = 1;
	do {
		err = vio_ldc_send(&port->vio, &hdr, sizeof(hdr));
		if (err > 0) {
			dr->snd_nxt++;
			break;
		}
		udelay(delay);
		if ((delay <<= 1) > 128)
			delay = 128;
		if (retries++ > VNET_MAX_RETRIES) {
			pr_info("ECONNRESET %x:%x:%x:%x:%x:%x\n",
				port->raddr[0], port->raddr[1],
				port->raddr[2], port->raddr[3],
				port->raddr[4], port->raddr[5]);
			break;
		}
	} while (err == -EAGAIN);

	if (err <= 0 && vio_dring_state == VIO_DRING_STOPPED) {
		port->stop_rx_idx = end;
		port->stop_rx = true;
	} else {
		port->stop_rx_idx = 0;
		port->stop_rx = false;
	}

	return err;
}
static u32 next_idx(u32 idx, struct vio_dring_state *dr)
{
	if (++idx == dr->num_entries)
		idx = 0;
	return idx;
}

static u32 prev_idx(u32 idx, struct vio_dring_state *dr)
{
	if (idx == 0)
		idx = dr->num_entries - 1;
	else
		idx--;

	return idx;
}

static struct vio_net_desc *get_rx_desc(struct vnet_port *port,
					struct vio_dring_state *dr,
					u32 index)
{
	struct vio_net_desc *desc = port->vio.desc_buf;
	int err;

	err = ldc_get_dring_entry(port->vio.lp, desc, dr->entry_size,
				  (index * dr->entry_size),
				  dr->cookies, dr->ncookies);
	if (err < 0)
		return ERR_PTR(err);

	return desc;
}

static int put_rx_desc(struct vnet_port *port,
		       struct vio_dring_state *dr,
		       struct vio_net_desc *desc,
		       u32 index)
{
	int err;

	err = ldc_put_dring_entry(port->vio.lp, desc, dr->entry_size,
				  (index * dr->entry_size),
				  dr->cookies, dr->ncookies);
	if (err < 0)
		return err;

	return 0;
}
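
/* Process one RX descriptor: fetch it from the peer's dring, receive the
 * packet it describes, then mark it DONE and write it back.  Returns 1 if
 * the descriptor was not READY (nothing more to do).
 */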
static int vnet_walk_rx_one(struct vnet_port *port,
			    struct vio_dring_state *dr,
			    u32 index, int *needs_ack)
{
	struct vio_net_desc *desc = get_rx_desc(port, dr, index);
	struct vio_driver_state *vio = &port->vio;
	int err;

	if (IS_ERR(desc))
		return PTR_ERR(desc);

	if (desc->hdr.state != VIO_DESC_READY)
		return 1;

	rmb();

	viodbg(DATA, "vio_walk_rx_one desc[%02x:%02x:%08x:%08x:%llx:%llx]\n",
	       desc->hdr.state, desc->hdr.ack,
	       desc->size, desc->ncookies,
	       desc->cookies[0].cookie_addr,
	       desc->cookies[0].cookie_size);

	err = vnet_rx_one(port, desc->size, desc->cookies, desc->ncookies);
	if (err == -ECONNRESET)
		return err;
	desc->hdr.state = VIO_DESC_DONE;
	err = put_rx_desc(port, dr, desc, index);
	if (err < 0)
		return err;
	*needs_ack = desc->hdr.ack;
	return 0;
}
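
/* Walk the peer's transmit dring from 'start' to 'end', receiving each
 * READY descriptor.  ACTIVE acks are sent along the way whenever a
 * descriptor requests one; a final STOPPED ack covering the range is
 * always sent when the walk terminates.
 */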
static int vnet_walk_rx(struct vnet_port *port, struct vio_dring_state *dr,
			u32 start, u32 end)
{
	struct vio_driver_state *vio = &port->vio;
	int ack_start = -1, ack_end = -1;

	end = (end == (u32) -1) ? prev_idx(start, dr) : next_idx(end, dr);

	viodbg(DATA, "vnet_walk_rx start[%08x] end[%08x]\n", start, end);

	while (start != end) {
		int ack = 0, err = vnet_walk_rx_one(port, dr, start, &ack);
		if (err == -ECONNRESET)
			return err;
		if (err != 0)
			break;
		if (ack_start == -1)
			ack_start = start;
		ack_end = start;
		start = next_idx(start, dr);
		if (ack && start != end) {
			err = vnet_send_ack(port, dr, ack_start, ack_end,
					    VIO_DRING_ACTIVE);
			if (err == -ECONNRESET)
				return err;
			ack_start = -1;
		}
	}
	if (unlikely(ack_start == -1))
		ack_start = ack_end = prev_idx(start, dr);
	return vnet_send_ack(port, dr, ack_start, ack_end, VIO_DRING_STOPPED);
}

static int vnet_rx(struct vnet_port *port, void *msgbuf)
{
	struct vio_dring_data *pkt = msgbuf;
	struct vio_dring_state *dr = &port->vio.drings[VIO_DRIVER_RX_RING];
	struct vio_driver_state *vio = &port->vio;

	viodbg(DATA, "vnet_rx stype_env[%04x] seq[%016llx] rcv_nxt[%016llx]\n",
	       pkt->tag.stype_env, pkt->seq, dr->rcv_nxt);

	if (unlikely(pkt->tag.stype_env != VIO_DRING_DATA))
		return 0;
	if (unlikely(pkt->seq != dr->rcv_nxt)) {
		pr_err("RX out of sequence seq[0x%llx] rcv_nxt[0x%llx]\n",
		       pkt->seq, dr->rcv_nxt);
		return 0;
	}

	dr->rcv_nxt++;

	/* XXX Validate pkt->start_idx and pkt->end_idx XXX */

	return vnet_walk_rx(port, dr, pkt->start_idx, pkt->end_idx);
}

static int idx_is_pending(struct vio_dring_state *dr, u32 end)
{
	u32 idx = dr->cons;
	int found = 0;

	while (idx != dr->prod) {
		if (idx == end) {
			found = 1;
			break;
		}
		idx = next_idx(idx, dr);
	}
	return found;
}
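
/* Handle a dring ACK from the peer: advance the consumer index past the
 * acknowledged descriptor and, if a freshly produced descriptor was left
 * without its "start" trigger, send that trigger now.  Returns 1 when the
 * TX queue is stopped and enough ring space has become available to
 * justify waking it.
 */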
static int vnet_ack(struct vnet_port *port, void *msgbuf)
{
	struct vio_dring_state *dr = &port->vio.drings[VIO_DRIVER_TX_RING];
	struct vio_dring_data *pkt = msgbuf;
	struct net_device *dev;
	struct vnet *vp;
	u32 end;
	struct vio_net_desc *desc;

	if (unlikely(pkt->tag.stype_env != VIO_DRING_DATA))
		return 0;

	end = pkt->end_idx;
	if (unlikely(!idx_is_pending(dr, end)))
		return 0;

	/* sync for race conditions with vnet_start_xmit() and tell xmit it
	 * is time to send a trigger.
	 */
	dr->cons = next_idx(end, dr);
	desc = vio_dring_entry(dr, dr->cons);
	if (desc->hdr.state == VIO_DESC_READY && port->start_cons) {
		/* vnet_start_xmit() just populated this dring but missed
		 * sending the "start" LDC message to the consumer.
		 * Send a "start" trigger on its behalf.
		 */
		if (__vnet_tx_trigger(port, dr->cons) > 0)
			port->start_cons = false;
		else
			port->start_cons = true;
	} else {
		port->start_cons = true;
	}

	vp = port->vp;
	dev = vp->dev;
	if (unlikely(netif_queue_stopped(dev) &&
		     vnet_tx_dring_avail(dr) >= VNET_TX_WAKEUP_THRESH(dr)))
		return 1;

	return 0;
}

static int vnet_nack(struct vnet_port *port, void *msgbuf)
{
	/* XXX just reset or similar XXX */
	return 0;
}

static int handle_mcast(struct vnet_port *port, void *msgbuf)
{
	struct vio_net_mcast_info *pkt = msgbuf;

	if (pkt->tag.stype != VIO_SUBTYPE_ACK)
		pr_err("%s: Got unexpected MCAST reply [%02x:%02x:%04x:%08x]\n",
		       port->vp->dev->name,
		       pkt->tag.type,
		       pkt->tag.stype,
		       pkt->tag.stype_env,
		       pkt->tag.sid);

	return 0;
}
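
/* Tasklet body: re-enable the transmit queue once every port's TX dring
 * has at least VNET_TX_WAKEUP_THRESH free entries.  Runs outside the LDC
 * event handler so that taking netif_tx_lock() cannot deadlock with
 * dev_watchdog().
 */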
static void maybe_tx_wakeup(unsigned long param)
{
	struct vnet *vp = (struct vnet *)param;
	struct net_device *dev = vp->dev;

	netif_tx_lock(dev);
	if (likely(netif_queue_stopped(dev))) {
		struct vnet_port *port;
		int wake = 1;

		list_for_each_entry(port, &vp->port_list, list) {
			struct vio_dring_state *dr;

			dr = &port->vio.drings[VIO_DRIVER_TX_RING];
			if (vnet_tx_dring_avail(dr) <
			    VNET_TX_WAKEUP_THRESH(dr)) {
				wake = 0;
				break;
			}
		}
		if (wake)
			netif_wake_queue(dev);
	}
	netif_tx_unlock(dev);
}
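
/* LDC event callback for a port.  Handles link up/reset events, then
 * drains all pending messages from the channel, dispatching data packets,
 * acks, and control messages to their respective handlers.
 */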
static void vnet_event(void *arg, int event)
{
	struct vnet_port *port = arg;
	struct vio_driver_state *vio = &port->vio;
	unsigned long flags;
	int tx_wakeup, err;

	spin_lock_irqsave(&vio->lock, flags);

	if (unlikely(event == LDC_EVENT_RESET ||
		     event == LDC_EVENT_UP)) {
		vio_link_state_change(vio, event);
		spin_unlock_irqrestore(&vio->lock, flags);

		if (event == LDC_EVENT_RESET) {
			port->rmtu = 0;
			vio_port_up(vio);
		}
		return;
	}

	if (unlikely(event != LDC_EVENT_DATA_READY)) {
		pr_warn("Unexpected LDC event %d\n", event);
		spin_unlock_irqrestore(&vio->lock, flags);
		return;
	}

	tx_wakeup = err = 0;
	while (1) {
		union {
			struct vio_msg_tag tag;
			u64 raw[8];
		} msgbuf;

		err = ldc_read(vio->lp, &msgbuf, sizeof(msgbuf));
		if (unlikely(err < 0)) {
			if (err == -ECONNRESET)
				vio_conn_reset(vio);
			break;
		}
		if (err == 0)
			break;
		viodbg(DATA, "TAG [%02x:%02x:%04x:%08x]\n",
		       msgbuf.tag.type,
		       msgbuf.tag.stype,
		       msgbuf.tag.stype_env,
		       msgbuf.tag.sid);
		err = vio_validate_sid(vio, &msgbuf.tag);
		if (err < 0)
			break;

		if (likely(msgbuf.tag.type == VIO_TYPE_DATA)) {
			if (msgbuf.tag.stype == VIO_SUBTYPE_INFO) {
				err = vnet_rx(port, &msgbuf);
			} else if (msgbuf.tag.stype == VIO_SUBTYPE_ACK) {
				err = vnet_ack(port, &msgbuf);
				if (err > 0)
					tx_wakeup |= err;
			} else if (msgbuf.tag.stype == VIO_SUBTYPE_NACK) {
				err = vnet_nack(port, &msgbuf);
			}
		} else if (msgbuf.tag.type == VIO_TYPE_CTRL) {
			if (msgbuf.tag.stype_env == VNET_MCAST_INFO)
				err = handle_mcast(port, &msgbuf);
			else
				err = vio_control_pkt_engine(vio, &msgbuf);
			if (err)
				break;
		} else {
			err = vnet_handle_unknown(port, &msgbuf);
		}
		if (err == -ECONNRESET)
			break;
	}
	spin_unlock(&vio->lock);
	/* Kick off a tasklet to wake the queue.  We cannot call
	 * maybe_tx_wakeup directly here because we could deadlock on
	 * netif_tx_lock() with dev_watchdog()
	 */
	if (unlikely(tx_wakeup && err != -ECONNRESET))
		tasklet_schedule(&port->vp->vnet_tx_wakeup);

	local_irq_restore(flags);
}
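
/* Notify the peer that TX descriptors starting at 'start' are READY.
 * A pending STOPPED ack that could not be delivered earlier is resent
 * first; the trigger itself is retried with exponential backoff on -EAGAIN.
 */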
static int __vnet_tx_trigger(struct vnet_port *port, u32 start)
{
	struct vio_dring_state *dr = &port->vio.drings[VIO_DRIVER_TX_RING];
	struct vio_dring_data hdr = {
		.tag = {
			.type		= VIO_TYPE_DATA,
			.stype		= VIO_SUBTYPE_INFO,
			.stype_env	= VIO_DRING_DATA,
			.sid		= vio_send_sid(&port->vio),
		},
		.dring_ident	= dr->ident,
		.start_idx	= start,
		.end_idx	= (u32) -1,
	};
	int err, delay;
	int retries = 0;

	if (port->stop_rx) {
		err = vnet_send_ack(port,
				    &port->vio.drings[VIO_DRIVER_RX_RING],
				    port->stop_rx_idx, -1,
				    VIO_DRING_STOPPED);
		if (err <= 0)
			return err;
	}

	hdr.seq = dr->snd_nxt;
	delay = 1;
	do {
		err = vio_ldc_send(&port->vio, &hdr, sizeof(hdr));
		if (err > 0) {
			dr->snd_nxt++;
			break;
		}
		udelay(delay);
		if ((delay <<= 1) > 128)
			delay = 128;
		if (retries++ > VNET_MAX_RETRIES)
			break;
	} while (err == -EAGAIN);

	return err;
}
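
/* Transmit port selection: look up the destination port by the packet's
 * destination MAC address, falling back to the first switch port that has
 * completed its handshake.
 */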
static inline bool port_is_up(struct vnet_port *vnet)
{
	struct vio_driver_state *vio = &vnet->vio;

	return !!(vio->hs_state & VIO_HS_COMPLETE);
}

struct vnet_port *__tx_port_find(struct vnet *vp, struct sk_buff *skb)
{
	unsigned int hash = vnet_hashfn(skb->data);
	struct hlist_head *hp = &vp->port_hash[hash];
	struct vnet_port *port;

	hlist_for_each_entry(port, hp, hash) {
		if (!port_is_up(port))
			continue;
		if (ether_addr_equal(port->raddr, skb->data))
			return port;
	}
	list_for_each_entry(port, &vp->port_list, list) {
		if (!port->switch_port)
			continue;
		if (!port_is_up(port))
			continue;
		return port;
	}
	return NULL;
}

struct vnet_port *tx_port_find(struct vnet *vp, struct sk_buff *skb)
{
	struct vnet_port *ret;
	unsigned long flags;

	spin_lock_irqsave(&vp->lock, flags);
	ret = __tx_port_find(vp, skb);
	spin_unlock_irqrestore(&vp->lock, flags);

	return ret;
}
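
/* Reclaim completed TX descriptors.  Walks the ring backwards from the
 * producer index, unmaps DONE entries, and returns their skbs chained
 * through skb->next so the caller can free them outside the lock.
 * *pending is set to the number of descriptors still marked READY.
 */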
static struct sk_buff *vnet_clean_tx_ring(struct vnet_port *port,
					  unsigned *pending)
{
	struct vio_dring_state *dr = &port->vio.drings[VIO_DRIVER_TX_RING];
	struct sk_buff *skb = NULL;
	int i, txi;

	*pending = 0;

	txi = dr->prod-1;
	if (txi < 0)
		txi = VNET_TX_RING_SIZE-1;

	for (i = 0; i < VNET_TX_RING_SIZE; ++i) {
		struct vio_net_desc *d;

		d = vio_dring_entry(dr, txi);

		if (d->hdr.state == VIO_DESC_DONE) {
			if (port->tx_bufs[txi].skb) {
				BUG_ON(port->tx_bufs[txi].skb->next);

				port->tx_bufs[txi].skb->next = skb;
				skb = port->tx_bufs[txi].skb;
				port->tx_bufs[txi].skb = NULL;

				ldc_unmap(port->vio.lp,
					  port->tx_bufs[txi].cookies,
					  port->tx_bufs[txi].ncookies);
			}
			d->hdr.state = VIO_DESC_FREE;
		} else if (d->hdr.state == VIO_DESC_READY) {
			(*pending)++;
		} else if (d->hdr.state == VIO_DESC_FREE) {
			break;
		}
		--txi;
		if (txi < 0)
			txi = VNET_TX_RING_SIZE-1;
	}
	return skb;
}

static inline void vnet_free_skbs(struct sk_buff *skb)
{
	struct sk_buff *next;

	while (skb) {
		next = skb->next;
		skb->next = NULL;
		dev_kfree_skb(skb);
		skb = next;
	}
}

static void vnet_clean_timer_expire(unsigned long port0)
{
	struct vnet_port *port = (struct vnet_port *)port0;
	struct sk_buff *freeskbs;
	unsigned pending;
	unsigned long flags;

	spin_lock_irqsave(&port->vio.lock, flags);
	freeskbs = vnet_clean_tx_ring(port, &pending);
	spin_unlock_irqrestore(&port->vio.lock, flags);

	vnet_free_skbs(freeskbs);

	if (pending)
		(void)mod_timer(&port->clean_timer,
				jiffies + VNET_CLEAN_TIMEOUT);
	else
		del_timer(&port->clean_timer);
}
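
/* Make an skb suitable for an LDC copy: skb->data must sit VNET_PACKET_SKIP
 * bytes past an 8-byte boundary, there must be headroom for the skip bytes,
 * and the total copy length is padded to a multiple of 8 (and to ETH_ZLEN
 * for runt frames).  If the skb does not satisfy this, its data is copied
 * into a freshly allocated, properly aligned skb.
 */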
static inline struct sk_buff *vnet_skb_shape(struct sk_buff *skb, void **pstart,
					     int *plen)
{
	struct sk_buff *nskb;
	int len, pad;

	len = skb->len;
	pad = 0;
	if (len < ETH_ZLEN) {
		pad += ETH_ZLEN - skb->len;
		len += pad;
	}
	len += VNET_PACKET_SKIP;
	pad += 8 - (len & 7);
	len += 8 - (len & 7);
	if (((unsigned long)skb->data & 7) != VNET_PACKET_SKIP ||
	    skb_tailroom(skb) < pad ||
	    skb_headroom(skb) < VNET_PACKET_SKIP) {
		nskb = alloc_and_align_skb(skb->dev, skb->len);
		if (!nskb) {
			dev_kfree_skb(skb);
			return NULL;
		}
		skb_reserve(nskb, VNET_PACKET_SKIP);
		if (skb_copy_bits(skb, 0, nskb->data, skb->len)) {
			dev_kfree_skb(nskb);
			dev_kfree_skb(skb);
			return NULL;
		}
		(void)skb_put(nskb, skb->len);
		dev_kfree_skb(skb);
		skb = nskb;
	}

	*pstart = skb->data - VNET_PACKET_SKIP;
	*plen = len;
	return skb;
}
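
/* Transmit path: shape the skb, map it into the next TX descriptor, mark
 * the descriptor READY, and send a "start" trigger if the peer has not yet
 * been told that new work is available.
 */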
static int vnet_start_xmit(struct sk_buff *skb, struct net_device *dev)
{
	struct vnet *vp = netdev_priv(dev);
	struct vnet_port *port = tx_port_find(vp, skb);
	struct vio_dring_state *dr;
	struct vio_net_desc *d;
	unsigned long flags;
	unsigned int len;
	struct sk_buff *freeskbs = NULL;
	int i, err, txi;
	void *start = NULL;
	int nlen = 0;
	unsigned pending = 0;

	if (unlikely(!port))
		goto out_dropped;

	skb = vnet_skb_shape(skb, &start, &nlen);

	if (unlikely(!skb))
		goto out_dropped;

	if (skb->len > port->rmtu)
		goto out_dropped;

	spin_lock_irqsave(&port->vio.lock, flags);

	dr = &port->vio.drings[VIO_DRIVER_TX_RING];
	if (unlikely(vnet_tx_dring_avail(dr) < 2)) {
		if (!netif_queue_stopped(dev)) {
			netif_stop_queue(dev);

			/* This is a hard error, log it. */
			netdev_err(dev, "BUG! Tx Ring full when queue awake!\n");
			dev->stats.tx_errors++;
		}
		spin_unlock_irqrestore(&port->vio.lock, flags);
		return NETDEV_TX_BUSY;
	}

	d = vio_dring_cur(dr);

	txi = dr->prod;

	freeskbs = vnet_clean_tx_ring(port, &pending);

	BUG_ON(port->tx_bufs[txi].skb);

	len = skb->len;
	if (len < ETH_ZLEN)
		len = ETH_ZLEN;

	port->tx_bufs[txi].skb = skb;
	skb = NULL;

	err = ldc_map_single(port->vio.lp, start, nlen,
			     port->tx_bufs[txi].cookies, VNET_MAXCOOKIES,
			     (LDC_MAP_SHADOW | LDC_MAP_DIRECT | LDC_MAP_RW));
	if (err < 0) {
		netdev_info(dev, "tx buffer map error %d\n", err);
		goto out_dropped_unlock;
	}
	port->tx_bufs[txi].ncookies = err;

	/* We don't rely on the ACKs to free the skb in vnet_start_xmit(),
	 * thus it is safe to not set VIO_ACK_ENABLE for each transmission:
	 * the protocol itself does not require it as long as the peer
	 * sends a VIO_SUBTYPE_ACK for VIO_DRING_STOPPED.
	 *
	 * An ACK for every packet in the ring is expensive as the
	 * sending of LDC messages is slow and affects performance.
	 */
	d->hdr.ack = VIO_ACK_DISABLE;
	d->size = len;
	d->ncookies = port->tx_bufs[txi].ncookies;
	for (i = 0; i < d->ncookies; i++)
		d->cookies[i] = port->tx_bufs[txi].cookies[i];

	/* This has to be a non-SMP write barrier because we are writing
	 * to memory which is shared with the peer LDOM.
	 */
	wmb();

	d->hdr.state = VIO_DESC_READY;

	/* Exactly one ldc "start" trigger (for dr->cons) needs to be sent
	 * to notify the consumer that some descriptors are READY.
	 * After that "start" trigger, no additional triggers are needed until
	 * a DRING_STOPPED is received from the consumer.  The dr->cons field
	 * (set up by vnet_ack()) has the value of the next dring index
	 * that has not yet been ack-ed.  We send a "start" trigger here
	 * if, and only if, start_cons is true (reset it afterward).  Conversely,
	 * vnet_ack() should check if the dring corresponding to cons
	 * is marked READY, but start_cons was false.
	 * If so, vnet_ack() should send out the missed "start" trigger.
	 *
	 * Note that the wmb() above makes sure the cookies et al. are
	 * not globally visible before the VIO_DESC_READY, and that the
	 * stores are ordered correctly by the compiler.  The consumer will
	 * not proceed until the VIO_DESC_READY is visible assuring that
	 * the consumer does not observe anything related to descriptors
	 * out of order.  The HV trap from the LDC start trigger is the
	 * producer to consumer announcement that work is available to the
	 * consumer
	 */
	if (!port->start_cons)
		goto ldc_start_done; /* previous trigger suffices */

	err = __vnet_tx_trigger(port, dr->cons);
	if (unlikely(err < 0)) {
		netdev_info(dev, "TX trigger error %d\n", err);
		d->hdr.state = VIO_DESC_FREE;
		dev->stats.tx_carrier_errors++;
		goto out_dropped_unlock;
	}

ldc_start_done:
	port->start_cons = false;

	dev->stats.tx_packets++;
	dev->stats.tx_bytes += port->tx_bufs[txi].skb->len;

	dr->prod = (dr->prod + 1) & (VNET_TX_RING_SIZE - 1);
	if (unlikely(vnet_tx_dring_avail(dr) < 2)) {
		netif_stop_queue(dev);
		if (vnet_tx_dring_avail(dr) > VNET_TX_WAKEUP_THRESH(dr))
			netif_wake_queue(dev);
	}

	spin_unlock_irqrestore(&port->vio.lock, flags);

	vnet_free_skbs(freeskbs);

	(void)mod_timer(&port->clean_timer, jiffies + VNET_CLEAN_TIMEOUT);

	return NETDEV_TX_OK;

out_dropped_unlock:
	spin_unlock_irqrestore(&port->vio.lock, flags);

out_dropped:
	if (skb)
		dev_kfree_skb(skb);
	vnet_free_skbs(freeskbs);
	if (pending)
		(void)mod_timer(&port->clean_timer,
				jiffies + VNET_CLEAN_TIMEOUT);
	else
		del_timer(&port->clean_timer);
	dev->stats.tx_dropped++;
	return NETDEV_TX_OK;
}
static void vnet_tx_timeout(struct net_device *dev)
{
	/* XXX Implement me XXX */
}

static int vnet_open(struct net_device *dev)
{
	netif_carrier_on(dev);
	netif_start_queue(dev);

	return 0;
}

static int vnet_close(struct net_device *dev)
{
	netif_stop_queue(dev);
	netif_carrier_off(dev);

	return 0;
}
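
/* Multicast filtering: the local multicast list is mirrored to the peer
 * switch port via VNET_MCAST_INFO control messages, batched in groups of
 * VNET_NUM_MCAST addresses per message (set = 1 to add, set = 0 to remove).
 */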
static struct vnet_mcast_entry *__vnet_mc_find(struct vnet *vp, u8 *addr)
{
	struct vnet_mcast_entry *m;

	for (m = vp->mcast_list; m; m = m->next) {
		if (ether_addr_equal(m->addr, addr))
			return m;
	}
	return NULL;
}

static void __update_mc_list(struct vnet *vp, struct net_device *dev)
{
	struct netdev_hw_addr *ha;

	netdev_for_each_mc_addr(ha, dev) {
		struct vnet_mcast_entry *m;

		m = __vnet_mc_find(vp, ha->addr);
		if (m) {
			m->hit = 1;
			continue;
		}

		if (!m) {
			m = kzalloc(sizeof(*m), GFP_ATOMIC);
			if (!m)
				continue;
			memcpy(m->addr, ha->addr, ETH_ALEN);
			m->hit = 1;

			m->next = vp->mcast_list;
			vp->mcast_list = m;
		}
	}
}

static void __send_mc_list(struct vnet *vp, struct vnet_port *port)
{
	struct vio_net_mcast_info info;
	struct vnet_mcast_entry *m, **pp;
	int n_addrs;

	memset(&info, 0, sizeof(info));

	info.tag.type = VIO_TYPE_CTRL;
	info.tag.stype = VIO_SUBTYPE_INFO;
	info.tag.stype_env = VNET_MCAST_INFO;
	info.tag.sid = vio_send_sid(&port->vio);
	info.set = 1;

	n_addrs = 0;
	for (m = vp->mcast_list; m; m = m->next) {
		if (m->sent)
			continue;
		m->sent = 1;
		memcpy(&info.mcast_addr[n_addrs * ETH_ALEN],
		       m->addr, ETH_ALEN);
		if (++n_addrs == VNET_NUM_MCAST) {
			info.count = n_addrs;

			(void) vio_ldc_send(&port->vio, &info,
					    sizeof(info));
			n_addrs = 0;
		}
	}
	if (n_addrs) {
		info.count = n_addrs;
		(void) vio_ldc_send(&port->vio, &info, sizeof(info));
	}

	info.set = 0;

	n_addrs = 0;
	pp = &vp->mcast_list;
	while ((m = *pp) != NULL) {
		if (m->hit) {
			m->hit = 0;
			pp = &m->next;
			continue;
		}

		memcpy(&info.mcast_addr[n_addrs * ETH_ALEN],
		       m->addr, ETH_ALEN);
		if (++n_addrs == VNET_NUM_MCAST) {
			info.count = n_addrs;
			(void) vio_ldc_send(&port->vio, &info,
					    sizeof(info));
			n_addrs = 0;
		}

		*pp = m->next;
		kfree(m);
	}
	if (n_addrs) {
		info.count = n_addrs;
		(void) vio_ldc_send(&port->vio, &info, sizeof(info));
	}
}

static void vnet_set_rx_mode(struct net_device *dev)
{
	struct vnet *vp = netdev_priv(dev);
	struct vnet_port *port;
	unsigned long flags;

	spin_lock_irqsave(&vp->lock, flags);
	if (!list_empty(&vp->port_list)) {
		port = list_entry(vp->port_list.next, struct vnet_port, list);

		if (port->switch_port) {
			__update_mc_list(vp, dev);
			__send_mc_list(vp, port);
		}
	}
	spin_unlock_irqrestore(&vp->lock, flags);
}
static int vnet_change_mtu(struct net_device *dev, int new_mtu)
{
	if (new_mtu < 68 || new_mtu > 65535)
		return -EINVAL;

	dev->mtu = new_mtu;
	return 0;
}

static int vnet_set_mac_addr(struct net_device *dev, void *p)
{
	return -EINVAL;
}

static void vnet_get_drvinfo(struct net_device *dev,
			     struct ethtool_drvinfo *info)
{
	strlcpy(info->driver, DRV_MODULE_NAME, sizeof(info->driver));
	strlcpy(info->version, DRV_MODULE_VERSION, sizeof(info->version));
}

static u32 vnet_get_msglevel(struct net_device *dev)
{
	struct vnet *vp = netdev_priv(dev);
	return vp->msg_enable;
}

static void vnet_set_msglevel(struct net_device *dev, u32 value)
{
	struct vnet *vp = netdev_priv(dev);
	vp->msg_enable = value;
}

static const struct ethtool_ops vnet_ethtool_ops = {
	.get_drvinfo		= vnet_get_drvinfo,
	.get_msglevel		= vnet_get_msglevel,
	.set_msglevel		= vnet_set_msglevel,
	.get_link		= ethtool_op_get_link,
};
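
/* TX descriptor ring management: each port exports a dring of
 * VNET_TX_RING_SIZE entries (each descriptor followed by two LDC cookies)
 * to the peer domain, and tracks the associated skbs in port->tx_bufs.
 */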
static void vnet_port_free_tx_bufs(struct vnet_port *port)
{
	struct vio_dring_state *dr;
	int i;

	dr = &port->vio.drings[VIO_DRIVER_TX_RING];
	if (dr->base) {
		ldc_free_exp_dring(port->vio.lp, dr->base,
				   (dr->entry_size * dr->num_entries),
				   dr->cookies, dr->ncookies);
		dr->base = NULL;
		dr->entry_size = 0;
		dr->num_entries = 0;
		dr->pending = 0;
		dr->ncookies = 0;
	}

	for (i = 0; i < VNET_TX_RING_SIZE; i++) {
		struct vio_net_desc *d;
		void *skb = port->tx_bufs[i].skb;

		if (!skb)
			continue;

		d = vio_dring_entry(dr, i);
		if (d->hdr.state == VIO_DESC_READY)
			pr_warn("active transmit buffers freed\n");

		ldc_unmap(port->vio.lp,
			  port->tx_bufs[i].cookies,
			  port->tx_bufs[i].ncookies);
		dev_kfree_skb(skb);
		port->tx_bufs[i].skb = NULL;
		d->hdr.state = VIO_DESC_FREE;
	}
}

static int vnet_port_alloc_tx_bufs(struct vnet_port *port)
{
	struct vio_dring_state *dr;
	unsigned long len;
	int i, err, ncookies;
	void *dring;

	dr = &port->vio.drings[VIO_DRIVER_TX_RING];

	len = (VNET_TX_RING_SIZE *
	       (sizeof(struct vio_net_desc) +
		(sizeof(struct ldc_trans_cookie) * 2)));

	ncookies = VIO_MAX_RING_COOKIES;
	dring = ldc_alloc_exp_dring(port->vio.lp, len,
				    dr->cookies, &ncookies,
				    (LDC_MAP_SHADOW |
				     LDC_MAP_DIRECT |
				     LDC_MAP_RW));
	if (IS_ERR(dring)) {
		err = PTR_ERR(dring);
		goto err_out;
	}

	dr->base = dring;
	dr->entry_size = (sizeof(struct vio_net_desc) +
			  (sizeof(struct ldc_trans_cookie) * 2));
	dr->num_entries = VNET_TX_RING_SIZE;
	dr->prod = dr->cons = 0;
	port->start_cons = true; /* need an initial trigger */
	dr->pending = VNET_TX_RING_SIZE;
	dr->ncookies = ncookies;

	for (i = 0; i < VNET_TX_RING_SIZE; ++i) {
		struct vio_net_desc *d;

		d = vio_dring_entry(dr, i);
		d->hdr.state = VIO_DESC_FREE;
	}
	return 0;

err_out:
	vnet_port_free_tx_bufs(port);
	return err;
}
static LIST_HEAD(vnet_list);
static DEFINE_MUTEX(vnet_list_mutex);

static const struct net_device_ops vnet_ops = {
	.ndo_open		= vnet_open,
	.ndo_stop		= vnet_close,
	.ndo_set_rx_mode	= vnet_set_rx_mode,
	.ndo_set_mac_address	= vnet_set_mac_addr,
	.ndo_validate_addr	= eth_validate_addr,
	.ndo_tx_timeout		= vnet_tx_timeout,
	.ndo_change_mtu		= vnet_change_mtu,
	.ndo_start_xmit		= vnet_start_xmit,
};
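
/* One struct vnet (and one net_device) is created per local-mac-address
 * found in the machine description; individual vnet-port devices attach
 * to it as they are probed.
 */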
static struct vnet *vnet_new(const u64 *local_mac)
{
	struct net_device *dev;
	struct vnet *vp;
	int err, i;

	dev = alloc_etherdev(sizeof(*vp));
	if (!dev)
		return ERR_PTR(-ENOMEM);
	dev->needed_headroom = VNET_PACKET_SKIP + 8;
	dev->needed_tailroom = 8;

	for (i = 0; i < ETH_ALEN; i++)
		dev->dev_addr[i] = (*local_mac >> (5 - i) * 8) & 0xff;

	vp = netdev_priv(dev);

	spin_lock_init(&vp->lock);
	tasklet_init(&vp->vnet_tx_wakeup, maybe_tx_wakeup, (unsigned long)vp);
	vp->dev = dev;

	INIT_LIST_HEAD(&vp->port_list);
	for (i = 0; i < VNET_PORT_HASH_SIZE; i++)
		INIT_HLIST_HEAD(&vp->port_hash[i]);
	INIT_LIST_HEAD(&vp->list);
	vp->local_mac = *local_mac;

	dev->netdev_ops = &vnet_ops;
	dev->ethtool_ops = &vnet_ethtool_ops;
	dev->watchdog_timeo = VNET_TX_TIMEOUT;

	err = register_netdev(dev);
	if (err) {
		pr_err("Cannot register net device, aborting\n");
		goto err_out_free_dev;
	}

	netdev_info(dev, "Sun LDOM vnet %pM\n", dev->dev_addr);

	list_add(&vp->list, &vnet_list);

	return vp;

err_out_free_dev:
	free_netdev(dev);

	return ERR_PTR(err);
}

static struct vnet *vnet_find_or_create(const u64 *local_mac)
{
	struct vnet *iter, *vp;

	mutex_lock(&vnet_list_mutex);
	vp = NULL;
	list_for_each_entry(iter, &vnet_list, list) {
		if (iter->local_mac == *local_mac) {
			vp = iter;
			break;
		}
	}
	if (!vp)
		vp = vnet_new(local_mac);
	mutex_unlock(&vnet_list_mutex);

	return vp;
}

static void vnet_cleanup(void)
{
	struct vnet *vp;
	struct net_device *dev;

	mutex_lock(&vnet_list_mutex);
	while (!list_empty(&vnet_list)) {
		vp = list_first_entry(&vnet_list, struct vnet, list);
		list_del(&vp->list);
		dev = vp->dev;
		tasklet_kill(&vp->vnet_tx_wakeup);
		/* vio_unregister_driver() should have cleaned up port_list */
		BUG_ON(!list_empty(&vp->port_list));
		unregister_netdev(dev);
		free_netdev(dev);
	}
	mutex_unlock(&vnet_list_mutex);
}
static const char *local_mac_prop = "local-mac-address";

static struct vnet *vnet_find_parent(struct mdesc_handle *hp,
				     u64 port_node)
{
	const u64 *local_mac = NULL;
	u64 a;

	mdesc_for_each_arc(a, hp, port_node, MDESC_ARC_TYPE_BACK) {
		u64 target = mdesc_arc_target(hp, a);
		const char *name;

		name = mdesc_get_property(hp, target, "name", NULL);
		if (!name || strcmp(name, "network"))
			continue;

		local_mac = mdesc_get_property(hp, target,
					       local_mac_prop, NULL);
		if (local_mac)
			break;
	}
	if (!local_mac)
		return ERR_PTR(-ENODEV);

	return vnet_find_or_create(local_mac);
}

static struct ldc_channel_config vnet_ldc_cfg = {
	.event		= vnet_event,
	.mtu		= 64,
	.mode		= LDC_MODE_UNRELIABLE,
};

static struct vio_driver_ops vnet_vio_ops = {
	.send_attr		= vnet_send_attr,
	.handle_attr		= vnet_handle_attr,
	.handshake_complete	= vnet_handshake_complete,
};

static void print_version(void)
{
	printk_once(KERN_INFO "%s", version);
}
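
/* Probe/remove for the "vnet-port" VIO device: each port corresponds to an
 * LDC channel to a peer guest or to the virtual switch, identified by its
 * remote-mac-address property in the machine description.
 */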
const char *remote_macaddr_prop = "remote-mac-address";

static int vnet_port_probe(struct vio_dev *vdev, const struct vio_device_id *id)
{
	struct mdesc_handle *hp;
	struct vnet_port *port;
	unsigned long flags;
	struct vnet *vp;
	const u64 *rmac;
	int len, i, err, switch_port;

	print_version();

	hp = mdesc_grab();

	vp = vnet_find_parent(hp, vdev->mp);
	if (IS_ERR(vp)) {
		pr_err("Cannot find port parent vnet\n");
		err = PTR_ERR(vp);
		goto err_out_put_mdesc;
	}

	rmac = mdesc_get_property(hp, vdev->mp, remote_macaddr_prop, &len);
	err = -ENODEV;
	if (!rmac) {
		pr_err("Port lacks %s property\n", remote_macaddr_prop);
		goto err_out_put_mdesc;
	}

	port = kzalloc(sizeof(*port), GFP_KERNEL);
	err = -ENOMEM;
	if (!port)
		goto err_out_put_mdesc;

	for (i = 0; i < ETH_ALEN; i++)
		port->raddr[i] = (*rmac >> (5 - i) * 8) & 0xff;

	port->vp = vp;

	err = vio_driver_init(&port->vio, vdev, VDEV_NETWORK,
			      vnet_versions, ARRAY_SIZE(vnet_versions),
			      &vnet_vio_ops, vp->dev->name);
	if (err)
		goto err_out_free_port;

	err = vio_ldc_alloc(&port->vio, &vnet_ldc_cfg, port);
	if (err)
		goto err_out_free_port;

	err = vnet_port_alloc_tx_bufs(port);
	if (err)
		goto err_out_free_ldc;

	INIT_HLIST_NODE(&port->hash);
	INIT_LIST_HEAD(&port->list);

	switch_port = 0;
	if (mdesc_get_property(hp, vdev->mp, "switch-port", NULL) != NULL)
		switch_port = 1;
	port->switch_port = switch_port;

	spin_lock_irqsave(&vp->lock, flags);
	if (switch_port)
		list_add(&port->list, &vp->port_list);
	else
		list_add_tail(&port->list, &vp->port_list);
	hlist_add_head(&port->hash, &vp->port_hash[vnet_hashfn(port->raddr)]);
	spin_unlock_irqrestore(&vp->lock, flags);

	dev_set_drvdata(&vdev->dev, port);

	pr_info("%s: PORT ( remote-mac %pM%s )\n",
		vp->dev->name, port->raddr, switch_port ? " switch-port" : "");

	setup_timer(&port->clean_timer, vnet_clean_timer_expire,
		    (unsigned long)port);

	vio_port_up(&port->vio);

	mdesc_release(hp);

	return 0;

err_out_free_ldc:
	vio_ldc_free(&port->vio);

err_out_free_port:
	kfree(port);

err_out_put_mdesc:
	mdesc_release(hp);
	return err;
}

static int vnet_port_remove(struct vio_dev *vdev)
{
	struct vnet_port *port = dev_get_drvdata(&vdev->dev);

	if (port) {
		struct vnet *vp = port->vp;
		unsigned long flags;

		del_timer_sync(&port->vio.timer);
		del_timer_sync(&port->clean_timer);

		spin_lock_irqsave(&vp->lock, flags);
		list_del(&port->list);
		hlist_del(&port->hash);
		spin_unlock_irqrestore(&vp->lock, flags);

		vnet_port_free_tx_bufs(port);
		vio_ldc_free(&port->vio);

		dev_set_drvdata(&vdev->dev, NULL);

		kfree(port);
	}
	return 0;
}
static const struct vio_device_id vnet_port_match[] = {
	{
		.type = "vnet-port",
	},
	{},
};
MODULE_DEVICE_TABLE(vio, vnet_port_match);

static struct vio_driver vnet_port_driver = {
	.id_table	= vnet_port_match,
	.probe		= vnet_port_probe,
	.remove		= vnet_port_remove,
	.name		= "vnet_port",
};

static int __init vnet_init(void)
{
	return vio_register_driver(&vnet_port_driver);
}

static void __exit vnet_exit(void)
{
	vio_unregister_driver(&vnet_port_driver);
	vnet_cleanup();
}

module_init(vnet_init);
module_exit(vnet_exit);