ib_addr.h 10.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341
  1. /*
  2. * Copyright (c) 2005 Voltaire Inc. All rights reserved.
  3. * Copyright (c) 2005 Intel Corporation. All rights reserved.
  4. *
  5. * This software is available to you under a choice of one of two
  6. * licenses. You may choose to be licensed under the terms of the GNU
  7. * General Public License (GPL) Version 2, available from the file
  8. * COPYING in the main directory of this source tree, or the
  9. * OpenIB.org BSD license below:
  10. *
  11. * Redistribution and use in source and binary forms, with or
  12. * without modification, are permitted provided that the following
  13. * conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above
  16. * copyright notice, this list of conditions and the following
  17. * disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials
  22. * provided with the distribution.
  23. *
  24. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31. * SOFTWARE.
  32. */
  33. #if !defined(IB_ADDR_H)
  34. #define IB_ADDR_H
  35. #include <linux/in.h>
  36. #include <linux/in6.h>
  37. #include <linux/if_arp.h>
  38. #include <linux/netdevice.h>
  39. #include <linux/inetdevice.h>
  40. #include <linux/socket.h>
  41. #include <linux/if_vlan.h>
  42. #include <net/ipv6.h>
  43. #include <net/if_inet6.h>
  44. #include <net/ip.h>
  45. #include <rdma/ib_verbs.h>
  46. #include <rdma/ib_pack.h>
  47. #include <net/ipv6.h>
  48. #include <net/net_namespace.h>
/**
 * struct rdma_addr_client - Handle identifying a user of the address
 * resolution service.
 * @refcount: Reference count on the client.
 *            NOTE(review): presumably counts outstanding resolution
 *            requests - confirm against the implementation.
 * @comp: Completion object associated with the client.
 *        NOTE(review): presumably waited on during unregistration until
 *        @refcount drops - confirm against the implementation.
 *
 * The object is passed to rdma_addr_register_client(),
 * rdma_addr_unregister_client() and rdma_resolve_ip().
 */
struct rdma_addr_client {
	atomic_t refcount;
	struct completion comp;
};
/**
 * rdma_addr_register_client - Register an address client.
 * @client: Client object to register.
 */
void rdma_addr_register_client(struct rdma_addr_client *client);

/**
 * rdma_addr_unregister_client - Deregister an address client.
 * @client: Client object to deregister.
 */
void rdma_addr_unregister_client(struct rdma_addr_client *client);
/**
 * struct rdma_dev_addr - Contains resolved RDMA hardware addresses
 * @src_dev_addr: Source hardware (MAC) address. For ARPHRD_INFINIBAND
 *                devices the GID starts at byte 4 of this buffer (see
 *                rdma_addr_gid_offset()).
 * @dst_dev_addr: Destination hardware (MAC) address, laid out like
 *                @src_dev_addr.
 * @broadcast: Broadcast address of the device. Bytes 8-9 are read and
 *             written as the pkey and bytes 4 onward are read as the
 *             multicast GID by the ib_addr_* helpers in this header.
 * @dev_type: The interface hardware type of the device.
 * @bound_dev_if: An optional device interface index.
 * @transport: The transport type used.
 * @net: Network namespace containing the bound_dev_if net_dev.
 * @network: The network type (enum rdma_network_type).
 *           NOTE(review): exact meaning not visible here - confirm.
 * @hoplimit: Hop limit value.
 *            NOTE(review): presumably the IP hop limit/TTL of the
 *            resolved route - confirm.
 */
struct rdma_dev_addr {
	unsigned char src_dev_addr[MAX_ADDR_LEN];
	unsigned char dst_dev_addr[MAX_ADDR_LEN];
	unsigned char broadcast[MAX_ADDR_LEN];
	unsigned short dev_type;
	int bound_dev_if;
	enum rdma_transport_type transport;
	struct net *net;
	enum rdma_network_type network;
	int hoplimit;
};
/**
 * rdma_translate_ip - Translate a local IP address to an RDMA hardware
 * address.
 * @addr: The local IP address to translate.
 * @dev_addr: Receives the translated hardware address information.
 * @vlan_id: NOTE(review): presumably receives the VLAN id of the device
 *           owning @addr - confirm against the implementation.
 *
 * The dev_addr->net field must be initialized.
 */
int rdma_translate_ip(const struct sockaddr *addr,
		      struct rdma_dev_addr *dev_addr, u16 *vlan_id);
/**
 * rdma_resolve_ip - Resolve source and destination IP addresses to
 * RDMA hardware addresses.
 * @client: Address client associated with request.
 * @src_addr: An optional source address to use in the resolution. If a
 * source address is not provided, a usable address will be returned via
 * the callback.
 * @dst_addr: The destination address to resolve.
 * @addr: A reference to a data location that will receive the resolved
 * addresses. The data location must remain valid until the callback has
 * been invoked. The net field of the addr struct must be valid.
 * @timeout_ms: Amount of time to wait for the address resolution to complete.
 * @callback: Call invoked once address resolution has completed, timed out,
 * or been canceled. A status of 0 indicates success. The callback also
 * receives a source address, the rdma_dev_addr and the user @context.
 * @context: User-specified context associated with the call.
 */
int rdma_resolve_ip(struct rdma_addr_client *client,
		    struct sockaddr *src_addr, struct sockaddr *dst_addr,
		    struct rdma_dev_addr *addr, int timeout_ms,
		    void (*callback)(int status, struct sockaddr *src_addr,
				     struct rdma_dev_addr *addr, void *context),
		    void *context);
/*
 * The functions below are only declared here; their implementations are
 * not visible in this header, so the notes are reviewer assumptions.
 */

/* NOTE(review): presumably a synchronous variant of rdma_resolve_ip() - confirm. */
int rdma_resolve_ip_route(struct sockaddr *src_addr,
			  const struct sockaddr *dst_addr,
			  struct rdma_dev_addr *addr);

/* NOTE(review): presumably cancels a pending rdma_resolve_ip() request for @addr - confirm. */
void rdma_addr_cancel(struct rdma_dev_addr *addr);

/* NOTE(review): presumably fills @dev_addr from @dev and @dst_dev_addr - confirm. */
int rdma_copy_addr(struct rdma_dev_addr *dev_addr, struct net_device *dev,
		   const unsigned char *dst_dev_addr);

/* NOTE(review): presumably returns the size of the sockaddr for its family - confirm. */
int rdma_addr_size(struct sockaddr *addr);

/* NOTE(review): presumably looks up the source MAC and VLAN id for @sgid - confirm. */
int rdma_addr_find_smac_by_sgid(union ib_gid *sgid, u8 *smac, u16 *vlan_id);

/*
 * NOTE(review): presumably resolves Ethernet L2 information (source MAC,
 * VLAN id, interface index, hop limit) for the @sgid/@dgid pair - confirm.
 */
int rdma_addr_find_l2_eth_by_grh(const union ib_gid *sgid,
				 const union ib_gid *dgid,
				 u8 *smac, u16 *vlan_id, int *if_index,
				 int *hoplimit);
  125. static inline u16 ib_addr_get_pkey(struct rdma_dev_addr *dev_addr)
  126. {
  127. return ((u16)dev_addr->broadcast[8] << 8) | (u16)dev_addr->broadcast[9];
  128. }
  129. static inline void ib_addr_set_pkey(struct rdma_dev_addr *dev_addr, u16 pkey)
  130. {
  131. dev_addr->broadcast[8] = pkey >> 8;
  132. dev_addr->broadcast[9] = (unsigned char) pkey;
  133. }
  134. static inline void ib_addr_get_mgid(struct rdma_dev_addr *dev_addr,
  135. union ib_gid *gid)
  136. {
  137. memcpy(gid, dev_addr->broadcast + 4, sizeof *gid);
  138. }
  139. static inline int rdma_addr_gid_offset(struct rdma_dev_addr *dev_addr)
  140. {
  141. return dev_addr->dev_type == ARPHRD_INFINIBAND ? 4 : 0;
  142. }
  143. static inline u16 rdma_vlan_dev_vlan_id(const struct net_device *dev)
  144. {
  145. return is_vlan_dev(dev) ? vlan_dev_vlan_id(dev) : 0xffff;
  146. }
  147. static inline int rdma_ip2gid(struct sockaddr *addr, union ib_gid *gid)
  148. {
  149. switch (addr->sa_family) {
  150. case AF_INET:
  151. ipv6_addr_set_v4mapped(((struct sockaddr_in *)
  152. addr)->sin_addr.s_addr,
  153. (struct in6_addr *)gid);
  154. break;
  155. case AF_INET6:
  156. *(struct in6_addr *)&gid->raw =
  157. ((struct sockaddr_in6 *)addr)->sin6_addr;
  158. break;
  159. default:
  160. return -EINVAL;
  161. }
  162. return 0;
  163. }
  164. /* Important - sockaddr should be a union of sockaddr_in and sockaddr_in6 */
  165. static inline void rdma_gid2ip(struct sockaddr *out, const union ib_gid *gid)
  166. {
  167. if (ipv6_addr_v4mapped((struct in6_addr *)gid)) {
  168. struct sockaddr_in *out_in = (struct sockaddr_in *)out;
  169. memset(out_in, 0, sizeof(*out_in));
  170. out_in->sin_family = AF_INET;
  171. memcpy(&out_in->sin_addr.s_addr, gid->raw + 12, 4);
  172. } else {
  173. struct sockaddr_in6 *out_in = (struct sockaddr_in6 *)out;
  174. memset(out_in, 0, sizeof(*out_in));
  175. out_in->sin6_family = AF_INET6;
  176. memcpy(&out_in->sin6_addr.s6_addr, gid->raw, 16);
  177. }
  178. }
  179. static inline void iboe_addr_get_sgid(struct rdma_dev_addr *dev_addr,
  180. union ib_gid *gid)
  181. {
  182. struct net_device *dev;
  183. struct in_device *ip4;
  184. dev = dev_get_by_index(&init_net, dev_addr->bound_dev_if);
  185. if (dev) {
  186. ip4 = in_dev_get(dev);
  187. if (ip4 && ip4->ifa_list && ip4->ifa_list->ifa_address)
  188. ipv6_addr_set_v4mapped(ip4->ifa_list->ifa_address,
  189. (struct in6_addr *)gid);
  190. if (ip4)
  191. in_dev_put(ip4);
  192. dev_put(dev);
  193. }
  194. }
  195. static inline void rdma_addr_get_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  196. {
  197. if (dev_addr->transport == RDMA_TRANSPORT_IB &&
  198. dev_addr->dev_type != ARPHRD_INFINIBAND)
  199. iboe_addr_get_sgid(dev_addr, gid);
  200. else
  201. memcpy(gid, dev_addr->src_dev_addr +
  202. rdma_addr_gid_offset(dev_addr), sizeof *gid);
  203. }
  204. static inline void rdma_addr_set_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  205. {
  206. memcpy(dev_addr->src_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  207. }
  208. static inline void rdma_addr_get_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  209. {
  210. memcpy(gid, dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), sizeof *gid);
  211. }
  212. static inline void rdma_addr_set_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  213. {
  214. memcpy(dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  215. }
  216. static inline enum ib_mtu iboe_get_mtu(int mtu)
  217. {
  218. /*
  219. * Reduce IB headers from effective IBoE MTU.
  220. */
  221. mtu = mtu - (IB_GRH_BYTES + IB_UDP_BYTES + IB_BTH_BYTES +
  222. IB_EXT_XRC_BYTES + IB_EXT_ATOMICETH_BYTES +
  223. IB_ICRC_BYTES);
  224. if (mtu >= ib_mtu_enum_to_int(IB_MTU_4096))
  225. return IB_MTU_4096;
  226. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_2048))
  227. return IB_MTU_2048;
  228. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_1024))
  229. return IB_MTU_1024;
  230. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_512))
  231. return IB_MTU_512;
  232. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_256))
  233. return IB_MTU_256;
  234. else
  235. return 0;
  236. }
  237. static inline int iboe_get_rate(struct net_device *dev)
  238. {
  239. struct ethtool_link_ksettings cmd;
  240. int err;
  241. rtnl_lock();
  242. err = __ethtool_get_link_ksettings(dev, &cmd);
  243. rtnl_unlock();
  244. if (err)
  245. return IB_RATE_PORT_CURRENT;
  246. if (cmd.base.speed >= 40000)
  247. return IB_RATE_40_GBPS;
  248. else if (cmd.base.speed >= 30000)
  249. return IB_RATE_30_GBPS;
  250. else if (cmd.base.speed >= 20000)
  251. return IB_RATE_20_GBPS;
  252. else if (cmd.base.speed >= 10000)
  253. return IB_RATE_10_GBPS;
  254. else
  255. return IB_RATE_PORT_CURRENT;
  256. }
  257. static inline int rdma_link_local_addr(struct in6_addr *addr)
  258. {
  259. if (addr->s6_addr32[0] == htonl(0xfe800000) &&
  260. addr->s6_addr32[1] == 0)
  261. return 1;
  262. return 0;
  263. }
  264. static inline void rdma_get_ll_mac(struct in6_addr *addr, u8 *mac)
  265. {
  266. memcpy(mac, &addr->s6_addr[8], 3);
  267. memcpy(mac + 3, &addr->s6_addr[13], 3);
  268. mac[0] ^= 2;
  269. }
  270. static inline int rdma_is_multicast_addr(struct in6_addr *addr)
  271. {
  272. u32 ipv4_addr;
  273. if (addr->s6_addr[0] == 0xff)
  274. return 1;
  275. memcpy(&ipv4_addr, addr->s6_addr + 12, 4);
  276. return (ipv6_addr_v4mapped(addr) && ipv4_is_multicast(ipv4_addr));
  277. }
  278. static inline void rdma_get_mcast_mac(struct in6_addr *addr, u8 *mac)
  279. {
  280. int i;
  281. mac[0] = 0x33;
  282. mac[1] = 0x33;
  283. for (i = 2; i < 6; ++i)
  284. mac[i] = addr->s6_addr[i + 10];
  285. }
  286. static inline u16 rdma_get_vlan_id(union ib_gid *dgid)
  287. {
  288. u16 vid;
  289. vid = dgid->raw[11] << 8 | dgid->raw[12];
  290. return vid < 0x1000 ? vid : 0xffff;
  291. }
  292. static inline struct net_device *rdma_vlan_dev_real_dev(const struct net_device *dev)
  293. {
  294. return is_vlan_dev(dev) ? vlan_dev_real_dev(dev) : NULL;
  295. }
  296. #endif /* IB_ADDR_H */