]>
Commit | Line | Data |
---|---|---|
7025fcd3 SH |
1 | /* |
2 | * Copyright (c) 2005 Voltaire Inc. All rights reserved. | |
3 | * Copyright (c) 2005 Intel Corporation. All rights reserved. | |
4 | * | |
a9474917 SH |
5 | * This software is available to you under a choice of one of two |
6 | * licenses. You may choose to be licensed under the terms of the GNU | |
7 | * General Public License (GPL) Version 2, available from the file | |
8 | * COPYING in the main directory of this source tree, or the | |
9 | * OpenIB.org BSD license below: | |
10 | * | |
11 | * Redistribution and use in source and binary forms, with or | |
12 | * without modification, are permitted provided that the following | |
13 | * conditions are met: | |
14 | * | |
15 | * - Redistributions of source code must retain the above | |
16 | * copyright notice, this list of conditions and the following | |
17 | * disclaimer. | |
18 | * | |
19 | * - Redistributions in binary form must reproduce the above | |
20 | * copyright notice, this list of conditions and the following | |
21 | * disclaimer in the documentation and/or other materials | |
22 | * provided with the distribution. | |
23 | * | |
24 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, | |
25 | * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF | |
26 | * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND | |
27 | * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS | |
28 | * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN | |
29 | * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN | |
30 | * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE | |
31 | * SOFTWARE. | |
7025fcd3 SH |
32 | */ |
33 | ||
34 | #if !defined(IB_ADDR_H) | |
35 | #define IB_ADDR_H | |
36 | ||
37 | #include <linux/in.h> | |
38 | #include <linux/in6.h> | |
c4315d85 | 39 | #include <linux/if_arp.h> |
7025fcd3 | 40 | #include <linux/netdevice.h> |
7b85627b | 41 | #include <linux/inetdevice.h> |
7025fcd3 | 42 | #include <linux/socket.h> |
af7bd463 | 43 | #include <linux/if_vlan.h> |
7b85627b MS |
44 | #include <net/ipv6.h> |
45 | #include <net/if_inet6.h> | |
46 | #include <net/ip.h> | |
7025fcd3 | 47 | #include <rdma/ib_verbs.h> |
3c86aa70 | 48 | #include <rdma/ib_pack.h> |
dd5f03be | 49 | #include <net/ipv6.h> |
565edd1d | 50 | #include <net/net_namespace.h> |
7025fcd3 | 51 | |
7a118df3 SH |
52 | struct rdma_addr_client { |
53 | atomic_t refcount; | |
54 | struct completion comp; | |
55 | }; | |
56 | ||
/**
 * rdma_addr_register_client - Register an address client.
 * @client: Client object to register.
 */
void rdma_addr_register_client(struct rdma_addr_client *client);

/**
 * rdma_addr_unregister_client - Deregister an address client.
 * @client: Client object to deregister.
 */
void rdma_addr_unregister_client(struct rdma_addr_client *client);
67 | ||
565edd1d GS |
68 | /** |
69 | * struct rdma_dev_addr - Contains resolved RDMA hardware addresses | |
70 | * @src_dev_addr: Source MAC address. | |
71 | * @dst_dev_addr: Destination MAC address. | |
72 | * @broadcast: Broadcast address of the device. | |
73 | * @dev_type: The interface hardware type of the device. | |
74 | * @bound_dev_if: An optional device interface index. | |
75 | * @transport: The transport type used. | |
76 | * @net: Network namespace containing the bound_dev_if net_dev. | |
77 | */ | |
7025fcd3 SH |
78 | struct rdma_dev_addr { |
79 | unsigned char src_dev_addr[MAX_ADDR_LEN]; | |
80 | unsigned char dst_dev_addr[MAX_ADDR_LEN]; | |
81 | unsigned char broadcast[MAX_ADDR_LEN]; | |
c4315d85 | 82 | unsigned short dev_type; |
6266ed6e | 83 | int bound_dev_if; |
3c86aa70 | 84 | enum rdma_transport_type transport; |
565edd1d | 85 | struct net *net; |
c865f246 | 86 | enum rdma_network_type network; |
c3efe750 | 87 | int hoplimit; |
7025fcd3 SH |
88 | }; |
89 | ||
90 | /** | |
91 | * rdma_translate_ip - Translate a local IP address to an RDMA hardware | |
92 | * address. | |
565edd1d GS |
93 | * |
94 | * The dev_addr->net field must be initialized. | |
7025fcd3 | 95 | */ |
20029832 MB |
96 | int rdma_translate_ip(const struct sockaddr *addr, |
97 | struct rdma_dev_addr *dev_addr, u16 *vlan_id); | |
7025fcd3 SH |
98 | |
/**
 * rdma_resolve_ip - Resolve source and destination IP addresses to
 *   RDMA hardware addresses.
 * @client: Address client associated with the request.
 * @src_addr: Optional source address to use in the resolution.  When no
 *   source address is supplied, a usable one is handed back through the
 *   callback.
 * @dst_addr: Destination address to resolve.
 * @addr: Location that receives the resolved addresses.  It must stay
 *   valid until the callback has been invoked, and its net field must be
 *   valid on entry.
 * @timeout_ms: How long to wait for the address resolution to complete.
 * @callback: Invoked once address resolution has completed, timed out, or
 *   been canceled.  A status of 0 indicates success.
 * @context: User-specified context passed back with the callback.
 */
int rdma_resolve_ip(struct rdma_addr_client *client,
		    struct sockaddr *src_addr, struct sockaddr *dst_addr,
		    struct rdma_dev_addr *addr, int timeout_ms,
		    void (*callback)(int status, struct sockaddr *src_addr,
				     struct rdma_dev_addr *addr,
				     void *context),
		    void *context);
121 | ||
20029832 MB |
122 | int rdma_resolve_ip_route(struct sockaddr *src_addr, |
123 | const struct sockaddr *dst_addr, | |
124 | struct rdma_dev_addr *addr); | |
125 | ||
7025fcd3 SH |
126 | void rdma_addr_cancel(struct rdma_dev_addr *addr); |
127 | ||
e08ce2e8 YS |
128 | void rdma_copy_addr(struct rdma_dev_addr *dev_addr, |
129 | const struct net_device *dev, | |
130 | const unsigned char *dst_dev_addr); | |
07ebafba | 131 | |
ef560861 | 132 | int rdma_addr_size(struct sockaddr *addr); |
7025fcd3 | 133 | |
dd5f03be | 134 | int rdma_addr_find_smac_by_sgid(union ib_gid *sgid, u8 *smac, u16 *vlan_id); |
f7f4b23e MB |
135 | int rdma_addr_find_l2_eth_by_grh(const union ib_gid *sgid, |
136 | const union ib_gid *dgid, | |
c3efe750 MB |
137 | u8 *smac, u16 *vlan_id, int *if_index, |
138 | int *hoplimit); | |
dd5f03be | 139 | |
7025fcd3 SH |
140 | static inline u16 ib_addr_get_pkey(struct rdma_dev_addr *dev_addr) |
141 | { | |
142 | return ((u16)dev_addr->broadcast[8] << 8) | (u16)dev_addr->broadcast[9]; | |
143 | } | |
144 | ||
145 | static inline void ib_addr_set_pkey(struct rdma_dev_addr *dev_addr, u16 pkey) | |
146 | { | |
147 | dev_addr->broadcast[8] = pkey >> 8; | |
148 | dev_addr->broadcast[9] = (unsigned char) pkey; | |
149 | } | |
150 | ||
faec2f7b SH |
151 | static inline void ib_addr_get_mgid(struct rdma_dev_addr *dev_addr, |
152 | union ib_gid *gid) | |
153 | { | |
154 | memcpy(gid, dev_addr->broadcast + 4, sizeof *gid); | |
155 | } | |
156 | ||
6f8372b6 | 157 | static inline int rdma_addr_gid_offset(struct rdma_dev_addr *dev_addr) |
7025fcd3 | 158 | { |
6f8372b6 | 159 | return dev_addr->dev_type == ARPHRD_INFINIBAND ? 4 : 0; |
7025fcd3 SH |
160 | } |
161 | ||
7b85627b | 162 | static inline u16 rdma_vlan_dev_vlan_id(const struct net_device *dev) |
3c86aa70 | 163 | { |
d0d7b10b | 164 | return is_vlan_dev(dev) ? vlan_dev_vlan_id(dev) : 0xffff; |
3c86aa70 EC |
165 | } |
166 | ||
dd5f03be MB |
167 | static inline int rdma_ip2gid(struct sockaddr *addr, union ib_gid *gid) |
168 | { | |
169 | switch (addr->sa_family) { | |
170 | case AF_INET: | |
171 | ipv6_addr_set_v4mapped(((struct sockaddr_in *) | |
172 | addr)->sin_addr.s_addr, | |
173 | (struct in6_addr *)gid); | |
174 | break; | |
175 | case AF_INET6: | |
5f8a4db7 AB |
176 | *(struct in6_addr *)&gid->raw = |
177 | ((struct sockaddr_in6 *)addr)->sin6_addr; | |
dd5f03be MB |
178 | break; |
179 | default: | |
180 | return -EINVAL; | |
181 | } | |
182 | return 0; | |
183 | } | |
184 | ||
185 | /* Important - sockaddr should be a union of sockaddr_in and sockaddr_in6 */ | |
73cdaaee | 186 | static inline void rdma_gid2ip(struct sockaddr *out, const union ib_gid *gid) |
dd5f03be MB |
187 | { |
188 | if (ipv6_addr_v4mapped((struct in6_addr *)gid)) { | |
189 | struct sockaddr_in *out_in = (struct sockaddr_in *)out; | |
190 | memset(out_in, 0, sizeof(*out_in)); | |
191 | out_in->sin_family = AF_INET; | |
192 | memcpy(&out_in->sin_addr.s_addr, gid->raw + 12, 4); | |
193 | } else { | |
194 | struct sockaddr_in6 *out_in = (struct sockaddr_in6 *)out; | |
195 | memset(out_in, 0, sizeof(*out_in)); | |
196 | out_in->sin6_family = AF_INET6; | |
197 | memcpy(&out_in->sin6_addr.s6_addr, gid->raw, 16); | |
198 | } | |
dd5f03be MB |
199 | } |
200 | ||
3c86aa70 EC |
201 | static inline void iboe_addr_get_sgid(struct rdma_dev_addr *dev_addr, |
202 | union ib_gid *gid) | |
203 | { | |
af7bd463 | 204 | struct net_device *dev; |
7b85627b | 205 | struct in_device *ip4; |
af7bd463 EC |
206 | |
207 | dev = dev_get_by_index(&init_net, dev_addr->bound_dev_if); | |
208 | if (dev) { | |
fba332b0 | 209 | ip4 = in_dev_get(dev); |
963916fd | 210 | if (ip4 && ip4->ifa_list && ip4->ifa_list->ifa_address) |
7b85627b MS |
211 | ipv6_addr_set_v4mapped(ip4->ifa_list->ifa_address, |
212 | (struct in6_addr *)gid); | |
963916fd KM |
213 | |
214 | if (ip4) | |
fba332b0 | 215 | in_dev_put(ip4); |
963916fd | 216 | |
af7bd463 EC |
217 | dev_put(dev); |
218 | } | |
3c86aa70 EC |
219 | } |
220 | ||
6f8372b6 | 221 | static inline void rdma_addr_get_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid) |
7025fcd3 | 222 | { |
3c86aa70 EC |
223 | if (dev_addr->transport == RDMA_TRANSPORT_IB && |
224 | dev_addr->dev_type != ARPHRD_INFINIBAND) | |
225 | iboe_addr_get_sgid(dev_addr, gid); | |
226 | else | |
227 | memcpy(gid, dev_addr->src_dev_addr + | |
228 | rdma_addr_gid_offset(dev_addr), sizeof *gid); | |
7025fcd3 SH |
229 | } |
230 | ||
6f8372b6 | 231 | static inline void rdma_addr_set_sgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid) |
7025fcd3 | 232 | { |
6f8372b6 | 233 | memcpy(dev_addr->src_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid); |
7025fcd3 SH |
234 | } |
235 | ||
6f8372b6 | 236 | static inline void rdma_addr_get_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid) |
7025fcd3 | 237 | { |
6f8372b6 | 238 | memcpy(gid, dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), sizeof *gid); |
7025fcd3 SH |
239 | } |
240 | ||
6f8372b6 | 241 | static inline void rdma_addr_set_dgid(struct rdma_dev_addr *dev_addr, union ib_gid *gid) |
07ebafba | 242 | { |
6f8372b6 | 243 | memcpy(dev_addr->dst_dev_addr + rdma_addr_gid_offset(dev_addr), gid, sizeof *gid); |
07ebafba TT |
244 | } |
245 | ||
3c86aa70 EC |
246 | static inline enum ib_mtu iboe_get_mtu(int mtu) |
247 | { | |
248 | /* | |
99260132 | 249 | * Reduce IB headers from effective IBoE MTU. |
3c86aa70 | 250 | */ |
99260132 PP |
251 | mtu = mtu - (IB_GRH_BYTES + IB_UDP_BYTES + IB_BTH_BYTES + |
252 | IB_EXT_XRC_BYTES + IB_EXT_ATOMICETH_BYTES + | |
253 | IB_ICRC_BYTES); | |
3c86aa70 EC |
254 | |
255 | if (mtu >= ib_mtu_enum_to_int(IB_MTU_4096)) | |
256 | return IB_MTU_4096; | |
257 | else if (mtu >= ib_mtu_enum_to_int(IB_MTU_2048)) | |
258 | return IB_MTU_2048; | |
259 | else if (mtu >= ib_mtu_enum_to_int(IB_MTU_1024)) | |
260 | return IB_MTU_1024; | |
261 | else if (mtu >= ib_mtu_enum_to_int(IB_MTU_512)) | |
262 | return IB_MTU_512; | |
263 | else if (mtu >= ib_mtu_enum_to_int(IB_MTU_256)) | |
264 | return IB_MTU_256; | |
265 | else | |
266 | return 0; | |
267 | } | |
268 | ||
269 | static inline int iboe_get_rate(struct net_device *dev) | |
270 | { | |
17605b96 | 271 | struct ethtool_link_ksettings cmd; |
4bc71cb9 | 272 | int err; |
3c86aa70 | 273 | |
4bc71cb9 | 274 | rtnl_lock(); |
17605b96 | 275 | err = __ethtool_get_link_ksettings(dev, &cmd); |
4bc71cb9 JP |
276 | rtnl_unlock(); |
277 | if (err) | |
3c86aa70 EC |
278 | return IB_RATE_PORT_CURRENT; |
279 | ||
17605b96 | 280 | if (cmd.base.speed >= 40000) |
3c86aa70 | 281 | return IB_RATE_40_GBPS; |
17605b96 | 282 | else if (cmd.base.speed >= 30000) |
3c86aa70 | 283 | return IB_RATE_30_GBPS; |
17605b96 | 284 | else if (cmd.base.speed >= 20000) |
3c86aa70 | 285 | return IB_RATE_20_GBPS; |
17605b96 | 286 | else if (cmd.base.speed >= 10000) |
3c86aa70 EC |
287 | return IB_RATE_10_GBPS; |
288 | else | |
289 | return IB_RATE_PORT_CURRENT; | |
290 | } | |
291 | ||
292 | static inline int rdma_link_local_addr(struct in6_addr *addr) | |
293 | { | |
294 | if (addr->s6_addr32[0] == htonl(0xfe800000) && | |
295 | addr->s6_addr32[1] == 0) | |
296 | return 1; | |
297 | ||
298 | return 0; | |
299 | } | |
300 | ||
301 | static inline void rdma_get_ll_mac(struct in6_addr *addr, u8 *mac) | |
302 | { | |
303 | memcpy(mac, &addr->s6_addr[8], 3); | |
304 | memcpy(mac + 3, &addr->s6_addr[13], 3); | |
305 | mac[0] ^= 2; | |
306 | } | |
307 | ||
308 | static inline int rdma_is_multicast_addr(struct in6_addr *addr) | |
309 | { | |
1c3aea2b | 310 | __be32 ipv4_addr; |
be1d325a NO |
311 | |
312 | if (addr->s6_addr[0] == 0xff) | |
313 | return 1; | |
314 | ||
1c3aea2b | 315 | ipv4_addr = addr->s6_addr32[3]; |
be1d325a | 316 | return (ipv6_addr_v4mapped(addr) && ipv4_is_multicast(ipv4_addr)); |
3c86aa70 EC |
317 | } |
318 | ||
319 | static inline void rdma_get_mcast_mac(struct in6_addr *addr, u8 *mac) | |
320 | { | |
321 | int i; | |
322 | ||
323 | mac[0] = 0x33; | |
324 | mac[1] = 0x33; | |
325 | for (i = 2; i < 6; ++i) | |
326 | mac[i] = addr->s6_addr[i + 10]; | |
327 | } | |
328 | ||
af7bd463 EC |
329 | static inline u16 rdma_get_vlan_id(union ib_gid *dgid) |
330 | { | |
331 | u16 vid; | |
332 | ||
333 | vid = dgid->raw[11] << 8 | dgid->raw[12]; | |
334 | return vid < 0x1000 ? vid : 0xffff; | |
335 | } | |
336 | ||
337 | static inline struct net_device *rdma_vlan_dev_real_dev(const struct net_device *dev) | |
338 | { | |
d0d7b10b | 339 | return is_vlan_dev(dev) ? vlan_dev_real_dev(dev) : NULL; |
af7bd463 EC |
340 | } |
341 | ||
7025fcd3 | 342 | #endif /* IB_ADDR_H */ |