ib_addr.h 10.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342
  1. /*
  2. * Copyright (c) 2005 Voltaire Inc. All rights reserved.
  3. * Copyright (c) 2005 Intel Corporation. All rights reserved.
  4. *
  5. * This software is available to you under a choice of one of two
  6. * licenses. You may choose to be licensed under the terms of the GNU
  7. * General Public License (GPL) Version 2, available from the file
  8. * COPYING in the main directory of this source tree, or the
  9. * OpenIB.org BSD license below:
  10. *
  11. * Redistribution and use in source and binary forms, with or
  12. * without modification, are permitted provided that the following
  13. * conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above
  16. * copyright notice, this list of conditions and the following
  17. * disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials
  22. * provided with the distribution.
  23. *
  24. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25. * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26. * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27. * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28. * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29. * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30. * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31. * SOFTWARE.
  32. */
  33. #if !defined(IB_ADDR_H)
  34. #define IB_ADDR_H
  35. #include <linux/in.h>
  36. #include <linux/in6.h>
  37. #include <linux/if_arp.h>
  38. #include <linux/netdevice.h>
  39. #include <linux/inetdevice.h>
  40. #include <linux/socket.h>
  41. #include <linux/if_vlan.h>
  42. #include <net/ipv6.h>
  43. #include <net/if_inet6.h>
  44. #include <net/ip.h>
  45. #include <rdma/ib_verbs.h>
  46. #include <rdma/ib_pack.h>
  47. #include <net/ipv6.h>
  48. #include <net/net_namespace.h>
/**
 * struct rdma_addr_client - Per-client state for the address service.
 * @refcount: Atomic reference count held on this client.
 * @comp: Completion object associated with the client.
 *	NOTE(review): presumably completed when the last reference is
 *	dropped so that unregistration can wait on it - confirm against
 *	the implementation.
 */
struct rdma_addr_client {
	atomic_t refcount;
	struct completion comp;
};
/**
 * rdma_addr_register_client - Register an address client.
 * @client: Client object to register.
 */
void rdma_addr_register_client(struct rdma_addr_client *client);

/**
 * rdma_addr_unregister_client - Deregister an address client.
 * @client: Client object to deregister.
 */
void rdma_addr_unregister_client(struct rdma_addr_client *client);
/**
 * struct rdma_dev_addr - Contains resolved RDMA hardware addresses
 * @src_dev_addr:	Source MAC address.
 * @dst_dev_addr:	Destination MAC address.
 * @broadcast:		Broadcast address of the device.
 * @dev_type:		The interface hardware type of the device.
 * @bound_dev_if:	An optional device interface index.
 * @transport:		The transport type used.
 * @net:		Network namespace containing the bound_dev_if net_dev.
 * @network:		The RDMA network type (enum rdma_network_type) of the
 *			address.
 * @hoplimit:		Hop limit associated with the address.
 *			NOTE(review): presumably the IP TTL / IPv6 hop limit
 *			of the resolved route - confirm against the resolver.
 *
 * Each address array is MAX_ADDR_LEN bytes long. The GID helpers in this
 * header read and write a GID inside @src_dev_addr and @dst_dev_addr at the
 * byte offset returned by rdma_addr_gid_offset().
 */
struct rdma_dev_addr {
	unsigned char src_dev_addr[MAX_ADDR_LEN];
	unsigned char dst_dev_addr[MAX_ADDR_LEN];
	unsigned char broadcast[MAX_ADDR_LEN];
	unsigned short dev_type;
	int bound_dev_if;
	enum rdma_transport_type transport;
	struct net *net;
	enum rdma_network_type network;
	int hoplimit;
};
/**
 * rdma_translate_ip - Translate a local IP address to an RDMA hardware
 *   address.
 * @addr: The local IP address to translate.
 * @dev_addr: Device address structure the translation operates on. Its net
 *   field must be initialized by the caller.
 * @vlan_id: NOTE(review): presumably an optional output location for the
 *   VLAN ID of the matching device - confirm against the implementation.
 *
 * The dev_addr->net field must be initialized.
 */
int rdma_translate_ip(const struct sockaddr *addr,
		      struct rdma_dev_addr *dev_addr, u16 *vlan_id);
/**
 * rdma_resolve_ip - Resolve source and destination IP addresses to
 *   RDMA hardware addresses.
 * @client: Address client associated with request.
 * @src_addr: An optional source address to use in the resolution.  If a
 *   source address is not provided, a usable address will be returned via
 *   the callback.
 * @dst_addr: The destination address to resolve.
 * @addr: A reference to a data location that will receive the resolved
 *   addresses.  The data location must remain valid until the callback has
 *   been invoked. The net field of the addr struct must be valid.
 * @timeout_ms: Amount of time to wait for the address resolution to complete.
 * @callback: Call invoked once address resolution has completed, timed out,
 *   or been canceled.  A status of 0 indicates success.  The callback is
 *   passed the status, a source address, the device address structure and
 *   the user-supplied @context.
 * @context: User-specified context associated with the call.
 *
 * NOTE(review): the return convention is not visible in this header;
 * presumably 0 when the request was accepted and a negative errno
 * otherwise - confirm against the implementation.
 */
int rdma_resolve_ip(struct rdma_addr_client *client,
		    struct sockaddr *src_addr, struct sockaddr *dst_addr,
		    struct rdma_dev_addr *addr, int timeout_ms,
		    void (*callback)(int status, struct sockaddr *src_addr,
				     struct rdma_dev_addr *addr, void *context),
		    void *context);
/*
 * The declarations below are implemented outside this header; their exact
 * semantics are not visible here, so the notes are hedged on purpose.
 */

/*
 * NOTE(review): presumably a synchronous route/address resolution from
 * @src_addr to @dst_addr that fills @addr - confirm against the
 * implementation.
 */
int rdma_resolve_ip_route(struct sockaddr *src_addr,
			  const struct sockaddr *dst_addr,
			  struct rdma_dev_addr *addr);

/*
 * NOTE(review): presumably cancels an outstanding rdma_resolve_ip() request
 * that was issued for @addr - confirm.
 */
void rdma_addr_cancel(struct rdma_dev_addr *addr);

/*
 * NOTE(review): presumably fills @dev_addr from the properties of @dev and,
 * when supplied, the destination hardware address @dst_dev_addr - confirm.
 */
void rdma_copy_addr(struct rdma_dev_addr *dev_addr,
		    const struct net_device *dev,
		    const unsigned char *dst_dev_addr);

/*
 * NOTE(review): presumably returns the size in bytes of the concrete socket
 * address type behind @addr - confirm, including the value returned for
 * unsupported address families.
 */
int rdma_addr_size(struct sockaddr *addr);

/*
 * NOTE(review): presumably looks up the source MAC (@smac) and VLAN ID
 * (@vlan_id) of the interface that owns @sgid - confirm.
 */
int rdma_addr_find_smac_by_sgid(union ib_gid *sgid, u8 *smac, u16 *vlan_id);

/*
 * NOTE(review): presumably resolves Ethernet L2 information (MAC, VLAN ID,
 * interface index, hop limit) for the @sgid/@dgid pair - confirm which of
 * the output pointers may be NULL.
 */
int rdma_addr_find_l2_eth_by_grh(const union ib_gid *sgid,
				 const union ib_gid *dgid,
				 u8 *smac, u16 *vlan_id, int *if_index,
				 int *hoplimit);
  126. static inline u16 ib_addr_get_pkey(struct rdma_dev_addr *dev_addr)
  127. {
  128. return ((u16)dev_addr->broadcast[8] << 8) | (u16)dev_addr->broadcast[9];
  129. }
  130. static inline void ib_addr_set_pkey(struct rdma_dev_addr *dev_addr, u16 pkey)
  131. {
  132. dev_addr->broadcast[8] = pkey >> 8;
  133. dev_addr->broadcast[9] = (unsigned char) pkey;
  134. }
  135. static inline void ib_addr_get_mgid(struct rdma_dev_addr *dev_addr,
  136. union ib_gid *gid)
  137. {
  138. memcpy(gid, dev_addr->broadcast + 4, sizeof *gid);
  139. }
  140. static inline int rdma_addr_gid_offset(struct rdma_dev_addr *dev_addr)
  141. {
  142. return dev_addr->dev_type == ARPHRD_INFINIBAND ? 4 : 0;
  143. }
  144. static inline u16 rdma_vlan_dev_vlan_id(const struct net_device *dev)
  145. {
  146. return is_vlan_dev(dev) ? vlan_dev_vlan_id(dev) : 0xffff;
  147. }
  148. static inline int rdma_ip2gid(struct sockaddr *addr, union ib_gid *gid)
  149. {
  150. switch (addr->sa_family) {
  151. case AF_INET:
  152. ipv6_addr_set_v4mapped(((struct sockaddr_in *)
  153. addr)->sin_addr.s_addr,
  154. (struct in6_addr *)gid);
  155. break;
  156. case AF_INET6:
  157. *(struct in6_addr *)&gid->raw =
  158. ((struct sockaddr_in6 *)addr)->sin6_addr;
  159. break;
  160. default:
  161. return -EINVAL;
  162. }
  163. return 0;
  164. }
  165. /* Important - sockaddr should be a union of sockaddr_in and sockaddr_in6 */
  166. static inline void rdma_gid2ip(struct sockaddr *out, const union ib_gid *gid)
  167. {
  168. if (ipv6_addr_v4mapped((struct in6_addr *)gid)) {
  169. struct sockaddr_in *out_in = (struct sockaddr_in *)out;
  170. memset(out_in, 0, sizeof(*out_in));
  171. out_in->sin_family = AF_INET;
  172. memcpy(&out_in->sin_addr.s_addr, gid->raw + 12, 4);
  173. } else {
  174. struct sockaddr_in6 *out_in = (struct sockaddr_in6 *)out;
  175. memset(out_in, 0, sizeof(*out_in));
  176. out_in->sin6_family = AF_INET6;
  177. memcpy(&out_in->sin6_addr.s6_addr, gid->raw, 16);
  178. }
  179. }
  180. static inline void iboe_addr_get_sgid(struct rdma_dev_addr *dev_addr,
  181. union ib_gid *gid)
  182. {
  183. struct net_device *dev;
  184. struct in_device *ip4;
  185. dev = dev_get_by_index(&init_net, dev_addr->bound_dev_if);
  186. if (dev) {
  187. ip4 = in_dev_get(dev);
  188. if (ip4 && ip4->ifa_list && ip4->ifa_list->ifa_address)
  189. ipv6_addr_set_v4mapped(ip4->ifa_list->ifa_address,
  190. (struct in6_addr *)gid);
  191. if (ip4)
  192. in_dev_put(ip4);
  193. dev_put(dev);
  194. }
  195. }
  196. static inline void rdma_addr_get_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  197. {
  198. if (dev_addr->transport == RDMA_TRANSPORT_IB &&
  199. dev_addr->dev_type != ARPHRD_INFINIBAND)
  200. iboe_addr_get_sgid(dev_addr, gid);
  201. else
  202. memcpy(gid, dev_addr->src_dev_addr +
  203. rdma_addr_gid_offset(dev_addr), sizeof *gid);
  204. }
  205. static inline void rdma_addr_set_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  206. {
  207. memcpy(dev_addr->src_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  208. }
  209. static inline void rdma_addr_get_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  210. {
  211. memcpy(gid, dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), sizeof *gid);
  212. }
  213. static inline void rdma_addr_set_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  214. {
  215. memcpy(dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  216. }
  217. static inline enum ib_mtu iboe_get_mtu(int mtu)
  218. {
  219. /*
  220. * Reduce IB headers from effective IBoE MTU.
  221. */
  222. mtu = mtu - (IB_GRH_BYTES + IB_UDP_BYTES + IB_BTH_BYTES +
  223. IB_EXT_XRC_BYTES + IB_EXT_ATOMICETH_BYTES +
  224. IB_ICRC_BYTES);
  225. if (mtu >= ib_mtu_enum_to_int(IB_MTU_4096))
  226. return IB_MTU_4096;
  227. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_2048))
  228. return IB_MTU_2048;
  229. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_1024))
  230. return IB_MTU_1024;
  231. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_512))
  232. return IB_MTU_512;
  233. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_256))
  234. return IB_MTU_256;
  235. else
  236. return 0;
  237. }
  238. static inline int iboe_get_rate(struct net_device *dev)
  239. {
  240. struct ethtool_link_ksettings cmd;
  241. int err;
  242. rtnl_lock();
  243. err = __ethtool_get_link_ksettings(dev, &cmd);
  244. rtnl_unlock();
  245. if (err)
  246. return IB_RATE_PORT_CURRENT;
  247. if (cmd.base.speed >= 40000)
  248. return IB_RATE_40_GBPS;
  249. else if (cmd.base.speed >= 30000)
  250. return IB_RATE_30_GBPS;
  251. else if (cmd.base.speed >= 20000)
  252. return IB_RATE_20_GBPS;
  253. else if (cmd.base.speed >= 10000)
  254. return IB_RATE_10_GBPS;
  255. else
  256. return IB_RATE_PORT_CURRENT;
  257. }
  258. static inline int rdma_link_local_addr(struct in6_addr *addr)
  259. {
  260. if (addr->s6_addr32[0] == htonl(0xfe800000) &&
  261. addr->s6_addr32[1] == 0)
  262. return 1;
  263. return 0;
  264. }
  265. static inline void rdma_get_ll_mac(struct in6_addr *addr, u8 *mac)
  266. {
  267. memcpy(mac, &addr->s6_addr[8], 3);
  268. memcpy(mac + 3, &addr->s6_addr[13], 3);
  269. mac[0] ^= 2;
  270. }
  271. static inline int rdma_is_multicast_addr(struct in6_addr *addr)
  272. {
  273. __be32 ipv4_addr;
  274. if (addr->s6_addr[0] == 0xff)
  275. return 1;
  276. ipv4_addr = addr->s6_addr32[3];
  277. return (ipv6_addr_v4mapped(addr) && ipv4_is_multicast(ipv4_addr));
  278. }
  279. static inline void rdma_get_mcast_mac(struct in6_addr *addr, u8 *mac)
  280. {
  281. int i;
  282. mac[0] = 0x33;
  283. mac[1] = 0x33;
  284. for (i = 2; i < 6; ++i)
  285. mac[i] = addr->s6_addr[i + 10];
  286. }
  287. static inline u16 rdma_get_vlan_id(union ib_gid *dgid)
  288. {
  289. u16 vid;
  290. vid = dgid->raw[11] << 8 | dgid->raw[12];
  291. return vid < 0x1000 ? vid : 0xffff;
  292. }
  293. static inline struct net_device *rdma_vlan_dev_real_dev(const struct net_device *dev)
  294. {
  295. return is_vlan_dev(dev) ? vlan_dev_real_dev(dev) : NULL;
  296. }
  297. #endif /* IB_ADDR_H */