]> git.proxmox.com Git - mirror_ubuntu-hirsute-kernel.git/blame - net/rds/rdma_transport.c
rds: Return proper "tos" value to user-space
[mirror_ubuntu-hirsute-kernel.git] / net / rds / rdma_transport.c
CommitLineData
55b7ed0b 1/*
eee2fa6a 2 * Copyright (c) 2009, 2018 Oracle and/or its affiliates. All rights reserved.
55b7ed0b
AG
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 *
32 */
3a9a231d 33#include <linux/module.h>
55b7ed0b
AG
34#include <rdma/rdma_cm.h>
35
0cb43965 36#include "rds_single_path.h"
55b7ed0b 37#include "rdma_transport.h"
ae05368a 38#include "ib.h"
55b7ed0b 39
1e2b44e7 40/* Global IPv4 and IPv6 RDS RDMA listener cm_id */
11bc9421 41static struct rdma_cm_id *rds_rdma_listen_id;
e65d4d96 42#if IS_ENABLED(CONFIG_IPV6)
1e2b44e7 43static struct rdma_cm_id *rds6_rdma_listen_id;
e65d4d96 44#endif
55b7ed0b 45
eee2fa6a
KCP
46static int rds_rdma_cm_event_handler_cmn(struct rdma_cm_id *cm_id,
47 struct rdma_cm_event *event,
48 bool isv6)
55b7ed0b
AG
49{
50 /* this can be null in the listening path */
51 struct rds_connection *conn = cm_id->context;
52 struct rds_transport *trans;
53 int ret = 0;
d021fabf
SS
54 int *err;
55 u8 len;
55b7ed0b 56
59f740a6 57 rdsdebug("conn %p id %p handling event %u (%s)\n", conn, cm_id,
3c88f3dc 58 event->event, rdma_event_msg(event->event));
55b7ed0b 59
dcdede04 60 if (cm_id->device->node_type == RDMA_NODE_IB_CA)
55b7ed0b
AG
61 trans = &rds_ib_transport;
62
63 /* Prevent shutdown from tearing down the connection
64 * while we're executing. */
65 if (conn) {
66 mutex_lock(&conn->c_cm_lock);
67
68 /* If the connection is being shut down, bail out
69 * right away. We return 0 so cm_id doesn't get
70 * destroyed prematurely */
71 if (rds_conn_state(conn) == RDS_CONN_DISCONNECTING) {
72 /* Reject incoming connections while we're tearing
73 * down an existing one. */
74 if (event->event == RDMA_CM_EVENT_CONNECT_REQUEST)
75 ret = 1;
76 goto out;
77 }
78 }
79
80 switch (event->event) {
81 case RDMA_CM_EVENT_CONNECT_REQUEST:
eee2fa6a 82 ret = trans->cm_handle_connect(cm_id, event, isv6);
55b7ed0b
AG
83 break;
84
85 case RDMA_CM_EVENT_ADDR_RESOLVED:
fd261ce6 86 rdma_set_service_type(cm_id, conn->c_tos);
55b7ed0b
AG
87 /* XXX do we need to clean up if this fails? */
88 ret = rdma_resolve_route(cm_id,
89 RDS_RDMA_RESOLVE_TIMEOUT_MS);
90 break;
91
92 case RDMA_CM_EVENT_ROUTE_RESOLVED:
ae05368a 93 /* Connection could have been dropped so make sure the
94 * cm_id is valid before proceeding
95 */
96 if (conn) {
97 struct rds_ib_connection *ibic;
98
99 ibic = conn->c_transport_data;
100 if (ibic && ibic->i_cm_id == cm_id)
eee2fa6a 101 ret = trans->cm_initiate_connect(cm_id, isv6);
ae05368a 102 else
103 rds_conn_drop(conn);
104 }
55b7ed0b
AG
105 break;
106
107 case RDMA_CM_EVENT_ESTABLISHED:
108 trans->cm_connect_complete(conn, event);
109 break;
110
39384f04 111 case RDMA_CM_EVENT_REJECTED:
d021fabf
SS
112 if (!conn)
113 break;
114 err = (int *)rdma_consumer_reject_data(cm_id, event, &len);
8c6166cf
GR
115 if (!err ||
116 (err && len >= sizeof(*err) &&
117 ((*err) <= RDS_RDMA_REJ_INCOMPAT))) {
d021fabf
SS
118 pr_warn("RDS/RDMA: conn <%pI6c, %pI6c> rejected, dropping connection\n",
119 &conn->c_laddr, &conn->c_faddr);
120 conn->c_proposed_version = RDS_PROTOCOL_COMPAT_VERSION;
3eb45036 121 conn->c_tos = 0;
d021fabf
SS
122 rds_conn_drop(conn);
123 }
39384f04
SW
124 rdsdebug("Connection rejected: %s\n",
125 rdma_reject_msg(cm_id, event->status));
d021fabf 126 break;
55b7ed0b
AG
127 case RDMA_CM_EVENT_ADDR_ERROR:
128 case RDMA_CM_EVENT_ROUTE_ERROR:
129 case RDMA_CM_EVENT_CONNECT_ERROR:
130 case RDMA_CM_EVENT_UNREACHABLE:
55b7ed0b
AG
131 case RDMA_CM_EVENT_DEVICE_REMOVAL:
132 case RDMA_CM_EVENT_ADDR_CHANGE:
133 if (conn)
134 rds_conn_drop(conn);
135 break;
136
137 case RDMA_CM_EVENT_DISCONNECTED:
97069788 138 rdsdebug("DISCONNECT event - dropping connection "
eee2fa6a 139 "%pI6c->%pI6c\n", &conn->c_laddr,
55b7ed0b
AG
140 &conn->c_faddr);
141 rds_conn_drop(conn);
142 break;
143
37ea401e 144 case RDMA_CM_EVENT_TIMEWAIT_EXIT:
145 if (conn) {
eee2fa6a 146 pr_info("RDS: RDMA_CM_EVENT_TIMEWAIT_EXIT event: dropping connection %pI6c->%pI6c\n",
37ea401e 147 &conn->c_laddr, &conn->c_faddr);
148 rds_conn_drop(conn);
149 }
150 break;
151
55b7ed0b
AG
152 default:
153 /* things like device disconnect? */
59f740a6 154 printk(KERN_ERR "RDS: unknown event %u (%s)!\n",
3c88f3dc 155 event->event, rdma_event_msg(event->event));
55b7ed0b
AG
156 break;
157 }
158
159out:
160 if (conn)
161 mutex_unlock(&conn->c_cm_lock);
162
59f740a6 163 rdsdebug("id %p event %u (%s) handling ret %d\n", cm_id, event->event,
3c88f3dc 164 rdma_event_msg(event->event), ret);
55b7ed0b
AG
165
166 return ret;
167}
168
eee2fa6a
KCP
169int rds_rdma_cm_event_handler(struct rdma_cm_id *cm_id,
170 struct rdma_cm_event *event)
171{
172 return rds_rdma_cm_event_handler_cmn(cm_id, event, false);
173}
174
e65d4d96 175#if IS_ENABLED(CONFIG_IPV6)
1e2b44e7
KCP
176int rds6_rdma_cm_event_handler(struct rdma_cm_id *cm_id,
177 struct rdma_cm_event *event)
178{
179 return rds_rdma_cm_event_handler_cmn(cm_id, event, true);
180}
e65d4d96 181#endif
1e2b44e7 182
eee2fa6a
KCP
183static int rds_rdma_listen_init_common(rdma_cm_event_handler handler,
184 struct sockaddr *sa,
185 struct rdma_cm_id **ret_cm_id)
55b7ed0b 186{
55b7ed0b
AG
187 struct rdma_cm_id *cm_id;
188 int ret;
189
eee2fa6a 190 cm_id = rdma_create_id(&init_net, handler, NULL,
fa20105e 191 RDMA_PS_TCP, IB_QPT_RC);
55b7ed0b
AG
192 if (IS_ERR(cm_id)) {
193 ret = PTR_ERR(cm_id);
92c330b9 194 printk(KERN_ERR "RDS/RDMA: failed to setup listener, "
55b7ed0b 195 "rdma_create_id() returned %d\n", ret);
24acc689 196 return ret;
55b7ed0b
AG
197 }
198
55b7ed0b
AG
199 /*
200 * XXX I bet this binds the cm_id to a device. If we want to support
201 * fail-over we'll have to take this into consideration.
202 */
eee2fa6a 203 ret = rdma_bind_addr(cm_id, sa);
55b7ed0b 204 if (ret) {
92c330b9 205 printk(KERN_ERR "RDS/RDMA: failed to setup listener, "
55b7ed0b
AG
206 "rdma_bind_addr() returned %d\n", ret);
207 goto out;
208 }
209
210 ret = rdma_listen(cm_id, 128);
211 if (ret) {
92c330b9 212 printk(KERN_ERR "RDS/RDMA: failed to setup listener, "
55b7ed0b
AG
213 "rdma_listen() returned %d\n", ret);
214 goto out;
215 }
216
217 rdsdebug("cm %p listening on port %u\n", cm_id, RDS_PORT);
218
eee2fa6a 219 *ret_cm_id = cm_id;
55b7ed0b
AG
220 cm_id = NULL;
221out:
222 if (cm_id)
223 rdma_destroy_id(cm_id);
224 return ret;
225}
226
eee2fa6a
KCP
227/* Initialize the RDS RDMA listeners. We create two listeners for
228 * compatibility reason. The one on RDS_PORT is used for IPv4
229 * requests only. The one on RDS_CM_PORT is used for IPv6 requests
230 * only. So only IPv6 enabled RDS module will communicate using this
231 * port.
232 */
233static int rds_rdma_listen_init(void)
234{
235 int ret;
e65d4d96 236#if IS_ENABLED(CONFIG_IPV6)
1e2b44e7 237 struct sockaddr_in6 sin6;
e65d4d96 238#endif
eee2fa6a
KCP
239 struct sockaddr_in sin;
240
241 sin.sin_family = PF_INET;
242 sin.sin_addr.s_addr = htonl(INADDR_ANY);
243 sin.sin_port = htons(RDS_PORT);
244 ret = rds_rdma_listen_init_common(rds_rdma_cm_event_handler,
245 (struct sockaddr *)&sin,
246 &rds_rdma_listen_id);
1e2b44e7
KCP
247 if (ret != 0)
248 return ret;
249
e65d4d96 250#if IS_ENABLED(CONFIG_IPV6)
1e2b44e7
KCP
251 sin6.sin6_family = PF_INET6;
252 sin6.sin6_addr = in6addr_any;
253 sin6.sin6_port = htons(RDS_CM_PORT);
254 sin6.sin6_scope_id = 0;
255 sin6.sin6_flowinfo = 0;
256 ret = rds_rdma_listen_init_common(rds6_rdma_cm_event_handler,
257 (struct sockaddr *)&sin6,
258 &rds6_rdma_listen_id);
259 /* Keep going even when IPv6 is not enabled in the system. */
260 if (ret != 0)
261 rdsdebug("Cannot set up IPv6 RDMA listener\n");
e65d4d96 262#endif
1e2b44e7 263 return 0;
eee2fa6a
KCP
264}
265
55b7ed0b
AG
266static void rds_rdma_listen_stop(void)
267{
11bc9421
AG
268 if (rds_rdma_listen_id) {
269 rdsdebug("cm %p\n", rds_rdma_listen_id);
270 rdma_destroy_id(rds_rdma_listen_id);
271 rds_rdma_listen_id = NULL;
55b7ed0b 272 }
e65d4d96 273#if IS_ENABLED(CONFIG_IPV6)
1e2b44e7
KCP
274 if (rds6_rdma_listen_id) {
275 rdsdebug("cm %p\n", rds6_rdma_listen_id);
276 rdma_destroy_id(rds6_rdma_listen_id);
277 rds6_rdma_listen_id = NULL;
278 }
e65d4d96 279#endif
55b7ed0b
AG
280}
281
/*
 * Module entry point: bring up the IB transport, then the RDMA listeners.
 * If the listeners cannot be set up the IB transport is torn down again.
 * Returns 0 on success or the error from the step that failed.
 */
static int rds_rdma_init(void)
{
	int rc;

	rc = rds_ib_init();
	if (rc)
		return rc;

	rc = rds_rdma_listen_init();
	if (rc)
		rds_ib_exit();

	return rc;
}
40d86609 296module_init(rds_rdma_init);
55b7ed0b 297
/*
 * Module exit point: undo rds_rdma_init() in reverse order.
 */
static void rds_rdma_exit(void)
{
	/* Listeners go first so that no new connections are attempted
	 * while the IB transport is being shut down.
	 */
	rds_rdma_listen_stop();
	rds_ib_exit();
}
40d86609
AG
304module_exit(rds_rdma_exit);
305
306MODULE_AUTHOR("Oracle Corporation <rds-devel@oss.oracle.com>");
dcdede04 307MODULE_DESCRIPTION("RDS: IB transport");
40d86609 308MODULE_LICENSE("Dual BSD/GPL");