ib_addr.h 10 KB

/*
 * Copyright (c) 2005 Voltaire Inc.  All rights reserved.
 * Copyright (c) 2005 Intel Corporation.  All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
  33. #if !defined(IB_ADDR_H)
  34. #define IB_ADDR_H
  35. #include <linux/in.h>
  36. #include <linux/in6.h>
  37. #include <linux/if_arp.h>
  38. #include <linux/netdevice.h>
  39. #include <linux/inetdevice.h>
  40. #include <linux/socket.h>
  41. #include <linux/if_vlan.h>
  42. #include <net/ipv6.h>
  43. #include <net/if_inet6.h>
  44. #include <net/ip.h>
  45. #include <rdma/ib_verbs.h>
  46. #include <rdma/ib_pack.h>
  47. #include <net/ipv6.h>
  48. #include <net/net_namespace.h>
  49. struct rdma_addr_client {
  50. atomic_t refcount;
  51. struct completion comp;
  52. };
  /**
   * rdma_addr_register_client - Register an address client.
   * @client: Client object to register.
   */
  void rdma_addr_register_client(struct rdma_addr_client *client);
  /**
   * rdma_addr_unregister_client - Deregister an address client.
   * @client: Client object to deregister; the counterpart of
   *   rdma_addr_register_client().
   */
  void rdma_addr_unregister_client(struct rdma_addr_client *client);
  62. /**
  63. * struct rdma_dev_addr - Contains resolved RDMA hardware addresses
  64. * @src_dev_addr: Source MAC address.
  65. * @dst_dev_addr: Destination MAC address.
  66. * @broadcast: Broadcast address of the device.
  67. * @dev_type: The interface hardware type of the device.
  68. * @bound_dev_if: An optional device interface index.
  69. * @transport: The transport type used.
  70. * @net: Network namespace containing the bound_dev_if net_dev.
  71. */
  72. struct rdma_dev_addr {
  73. unsigned char src_dev_addr[MAX_ADDR_LEN];
  74. unsigned char dst_dev_addr[MAX_ADDR_LEN];
  75. unsigned char broadcast[MAX_ADDR_LEN];
  76. unsigned short dev_type;
  77. int bound_dev_if;
  78. enum rdma_transport_type transport;
  79. struct net *net;
  80. enum rdma_network_type network;
  81. int hoplimit;
  82. };
  83. /**
  84. * rdma_translate_ip - Translate a local IP address to an RDMA hardware
  85. * address.
  86. *
  87. * The dev_addr->net field must be initialized.
  88. */
  89. int rdma_translate_ip(const struct sockaddr *addr,
  90. struct rdma_dev_addr *dev_addr, u16 *vlan_id);
  /**
   * rdma_resolve_ip - Resolve source and destination IP addresses to
   *   RDMA hardware addresses.
   * @client:	Address client associated with request.
   * @src_addr:	An optional source address to use in the resolution.  If a
   *		source address is not provided, a usable address will be
   *		returned via the callback.
   * @dst_addr:	The destination address to resolve.
   * @addr:	A reference to a data location that will receive the resolved
   *		addresses.  The data location must remain valid until the
   *		callback has been invoked.  The net field of the addr struct
   *		must be valid.
   * @timeout_ms: Amount of time to wait for the address resolution to
   *		complete.
   * @callback:	Call invoked once address resolution has completed, timed
   *		out, or been canceled.  A status of 0 indicates success.
   * @context:	User-specified context associated with the call.
   */
  int rdma_resolve_ip(struct rdma_addr_client *client,
  		    struct sockaddr *src_addr,
  		    struct sockaddr *dst_addr,
  		    struct rdma_dev_addr *addr,
  		    int timeout_ms,
  		    void (*callback)(int status,
  				     struct sockaddr *src_addr,
  				     struct rdma_dev_addr *addr,
  				     void *context),
  		    void *context);
  113. int rdma_resolve_ip_route(struct sockaddr *src_addr,
  114. const struct sockaddr *dst_addr,
  115. struct rdma_dev_addr *addr);
  116. void rdma_addr_cancel(struct rdma_dev_addr *addr);
  117. int rdma_copy_addr(struct rdma_dev_addr *dev_addr, struct net_device *dev,
  118. const unsigned char *dst_dev_addr);
  119. int rdma_addr_size(struct sockaddr *addr);
  120. int rdma_addr_size_in6(struct sockaddr_in6 *addr);
  121. int rdma_addr_size_kss(struct __kernel_sockaddr_storage *addr);
  122. int rdma_addr_find_smac_by_sgid(union ib_gid *sgid, u8 *smac, u16 *vlan_id);
  123. int rdma_addr_find_l2_eth_by_grh(const union ib_gid *sgid,
  124. const union ib_gid *dgid,
  125. u8 *smac, u16 *vlan_id, int *if_index,
  126. int *hoplimit);
  127. static inline u16 ib_addr_get_pkey(struct rdma_dev_addr *dev_addr)
  128. {
  129. return ((u16)dev_addr->broadcast[8] << 8) | (u16)dev_addr->broadcast[9];
  130. }
  131. static inline void ib_addr_set_pkey(struct rdma_dev_addr *dev_addr, u16 pkey)
  132. {
  133. dev_addr->broadcast[8] = pkey >> 8;
  134. dev_addr->broadcast[9] = (unsigned char) pkey;
  135. }
  136. static inline void ib_addr_get_mgid(struct rdma_dev_addr *dev_addr,
  137. union ib_gid *gid)
  138. {
  139. memcpy(gid, dev_addr->broadcast + 4, sizeof *gid);
  140. }
  141. static inline int rdma_addr_gid_offset(struct rdma_dev_addr *dev_addr)
  142. {
  143. return dev_addr->dev_type == ARPHRD_INFINIBAND ? 4 : 0;
  144. }
  145. static inline u16 rdma_vlan_dev_vlan_id(const struct net_device *dev)
  146. {
  147. return is_vlan_dev(dev) ? vlan_dev_vlan_id(dev) : 0xffff;
  148. }
  149. static inline int rdma_ip2gid(struct sockaddr *addr, union ib_gid *gid)
  150. {
  151. switch (addr->sa_family) {
  152. case AF_INET:
  153. ipv6_addr_set_v4mapped(((struct sockaddr_in *)
  154. addr)->sin_addr.s_addr,
  155. (struct in6_addr *)gid);
  156. break;
  157. case AF_INET6:
  158. *(struct in6_addr *)&gid->raw =
  159. ((struct sockaddr_in6 *)addr)->sin6_addr;
  160. break;
  161. default:
  162. return -EINVAL;
  163. }
  164. return 0;
  165. }
  166. /* Important - sockaddr should be a union of sockaddr_in and sockaddr_in6 */
  167. static inline void rdma_gid2ip(struct sockaddr *out, const union ib_gid *gid)
  168. {
  169. if (ipv6_addr_v4mapped((struct in6_addr *)gid)) {
  170. struct sockaddr_in *out_in = (struct sockaddr_in *)out;
  171. memset(out_in, 0, sizeof(*out_in));
  172. out_in->sin_family = AF_INET;
  173. memcpy(&out_in->sin_addr.s_addr, gid->raw + 12, 4);
  174. } else {
  175. struct sockaddr_in6 *out_in = (struct sockaddr_in6 *)out;
  176. memset(out_in, 0, sizeof(*out_in));
  177. out_in->sin6_family = AF_INET6;
  178. memcpy(&out_in->sin6_addr.s6_addr, gid->raw, 16);
  179. }
  180. }
  181. static inline void iboe_addr_get_sgid(struct rdma_dev_addr *dev_addr,
  182. union ib_gid *gid)
  183. {
  184. struct net_device *dev;
  185. struct in_device *ip4;
  186. dev = dev_get_by_index(&init_net, dev_addr->bound_dev_if);
  187. if (dev) {
  188. ip4 = in_dev_get(dev);
  189. if (ip4 && ip4->ifa_list && ip4->ifa_list->ifa_address)
  190. ipv6_addr_set_v4mapped(ip4->ifa_list->ifa_address,
  191. (struct in6_addr *)gid);
  192. if (ip4)
  193. in_dev_put(ip4);
  194. dev_put(dev);
  195. }
  196. }
  197. static inline void rdma_addr_get_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  198. {
  199. if (dev_addr->transport == RDMA_TRANSPORT_IB &&
  200. dev_addr->dev_type != ARPHRD_INFINIBAND)
  201. iboe_addr_get_sgid(dev_addr, gid);
  202. else
  203. memcpy(gid, dev_addr->src_dev_addr +
  204. rdma_addr_gid_offset(dev_addr), sizeof *gid);
  205. }
  206. static inline void rdma_addr_set_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  207. {
  208. memcpy(dev_addr->src_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  209. }
  210. static inline void rdma_addr_get_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  211. {
  212. memcpy(gid, dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), sizeof *gid);
  213. }
  214. static inline void rdma_addr_set_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid)
  215. {
  216. memcpy(dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid);
  217. }
  218. static inline enum ib_mtu iboe_get_mtu(int mtu)
  219. {
  220. /*
  221. * Reduce IB headers from effective IBoE MTU.
  222. */
  223. mtu = mtu - (IB_GRH_BYTES + IB_UDP_BYTES + IB_BTH_BYTES +
  224. IB_EXT_XRC_BYTES + IB_EXT_ATOMICETH_BYTES +
  225. IB_ICRC_BYTES);
  226. if (mtu >= ib_mtu_enum_to_int(IB_MTU_4096))
  227. return IB_MTU_4096;
  228. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_2048))
  229. return IB_MTU_2048;
  230. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_1024))
  231. return IB_MTU_1024;
  232. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_512))
  233. return IB_MTU_512;
  234. else if (mtu >= ib_mtu_enum_to_int(IB_MTU_256))
  235. return IB_MTU_256;
  236. else
  237. return 0;
  238. }
  239. static inline int iboe_get_rate(struct net_device *dev)
  240. {
  241. struct ethtool_link_ksettings cmd;
  242. int err;
  243. rtnl_lock();
  244. err = __ethtool_get_link_ksettings(dev, &cmd);
  245. rtnl_unlock();
  246. if (err)
  247. return IB_RATE_PORT_CURRENT;
  248. if (cmd.base.speed >= 40000)
  249. return IB_RATE_40_GBPS;
  250. else if (cmd.base.speed >= 30000)
  251. return IB_RATE_30_GBPS;
  252. else if (cmd.base.speed >= 20000)
  253. return IB_RATE_20_GBPS;
  254. else if (cmd.base.speed >= 10000)
  255. return IB_RATE_10_GBPS;
  256. else
  257. return IB_RATE_PORT_CURRENT;
  258. }
  /*
   * rdma_link_local_addr - Test whether @addr starts with fe80:0000:0000:0000.
   *
   * Returns 1 when the first eight bytes of @addr are exactly
   * fe 80 00 00 00 00 00 00, and 0 otherwise.  The remaining eight bytes are
   * not examined.
   */
  static inline int rdma_link_local_addr(struct in6_addr *addr)
  {
  	static const unsigned char ll_prefix[8] = {
  		0xfe, 0x80, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00
  	};

  	if (memcmp(addr->s6_addr, ll_prefix, sizeof(ll_prefix)) != 0)
  		return 0;

  	return 1;
  }
  266. static inline void rdma_get_ll_mac(struct in6_addr *addr, u8 *mac)
  267. {
  268. memcpy(mac, &addr->s6_addr[8], 3);
  269. memcpy(mac + 3, &addr->s6_addr[13], 3);
  270. mac[0] ^= 2;
  271. }
  272. static inline int rdma_is_multicast_addr(struct in6_addr *addr)
  273. {
  274. __be32 ipv4_addr;
  275. if (addr->s6_addr[0] == 0xff)
  276. return 1;
  277. ipv4_addr = addr->s6_addr32[3];
  278. return (ipv6_addr_v4mapped(addr) && ipv4_is_multicast(ipv4_addr));
  279. }
  280. static inline void rdma_get_mcast_mac(struct in6_addr *addr, u8 *mac)
  281. {
  282. int i;
  283. mac[0] = 0x33;
  284. mac[1] = 0x33;
  285. for (i = 2; i < 6; ++i)
  286. mac[i] = addr->s6_addr[i + 10];
  287. }
  288. static inline u16 rdma_get_vlan_id(union ib_gid *dgid)
  289. {
  290. u16 vid;
  291. vid = dgid->raw[11] << 8 | dgid->raw[12];
  292. return vid < 0x1000 ? vid : 0xffff;
  293. }
  294. static inline struct net_device *rdma_vlan_dev_real_dev(const struct net_device *dev)
  295. {
  296. return is_vlan_dev(dev) ? vlan_dev_real_dev(dev) : NULL;
  297. }
  298. #endif /* IB_ADDR_H */