]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - net/smc/smc_clc.c
Merge tag 'for-linus' of git://git.kernel.org/pub/scm/virt/kvm/kvm
[mirror_ubuntu-bionic-kernel.git] / net / smc / smc_clc.c
1 /*
2 * Shared Memory Communications over RDMA (SMC-R) and RoCE
3 *
4 * CLC (connection layer control) handshake over initial TCP socket to
5 * prepare for RDMA traffic
6 *
7 * Copyright IBM Corp. 2016
8 *
9 * Author(s): Ursula Braun <ubraun@linux.vnet.ibm.com>
10 */
11
12 #include <linux/in.h>
13 #include <linux/if_ether.h>
14 #include <net/sock.h>
15 #include <net/tcp.h>
16
17 #include "smc.h"
18 #include "smc_core.h"
19 #include "smc_clc.h"
20 #include "smc_ib.h"
21
22 /* Wait for data on the tcp-socket, analyze received data
23 * Returns:
24 * 0 if success and it was not a decline that we received.
25 * SMC_CLC_DECL_REPLY if decline received for fallback w/o another decl send.
26 * clcsock error, -EINTR, -ECONNRESET, -EPROTO otherwise.
27 */
28 int smc_clc_wait_msg(struct smc_sock *smc, void *buf, int buflen,
29 u8 expected_type)
30 {
31 struct sock *clc_sk = smc->clcsock->sk;
32 struct smc_clc_msg_hdr *clcm = buf;
33 struct msghdr msg = {NULL, 0};
34 int reason_code = 0;
35 struct kvec vec;
36 int len, datlen;
37 int krflags;
38
39 /* peek the first few bytes to determine length of data to receive
40 * so we don't consume any subsequent CLC message or payload data
41 * in the TCP byte stream
42 */
43 vec.iov_base = buf;
44 vec.iov_len = buflen;
45 krflags = MSG_PEEK | MSG_WAITALL;
46 smc->clcsock->sk->sk_rcvtimeo = CLC_WAIT_TIME;
47 len = kernel_recvmsg(smc->clcsock, &msg, &vec, 1,
48 sizeof(struct smc_clc_msg_hdr), krflags);
49 if (signal_pending(current)) {
50 reason_code = -EINTR;
51 clc_sk->sk_err = EINTR;
52 smc->sk.sk_err = EINTR;
53 goto out;
54 }
55 if (clc_sk->sk_err) {
56 reason_code = -clc_sk->sk_err;
57 smc->sk.sk_err = clc_sk->sk_err;
58 goto out;
59 }
60 if (!len) { /* peer has performed orderly shutdown */
61 smc->sk.sk_err = ECONNRESET;
62 reason_code = -ECONNRESET;
63 goto out;
64 }
65 if (len < 0) {
66 smc->sk.sk_err = -len;
67 reason_code = len;
68 goto out;
69 }
70 datlen = ntohs(clcm->length);
71 if ((len < sizeof(struct smc_clc_msg_hdr)) ||
72 (datlen < sizeof(struct smc_clc_msg_decline)) ||
73 (datlen > sizeof(struct smc_clc_msg_accept_confirm)) ||
74 memcmp(clcm->eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER)) ||
75 ((clcm->type != SMC_CLC_DECLINE) &&
76 (clcm->type != expected_type))) {
77 smc->sk.sk_err = EPROTO;
78 reason_code = -EPROTO;
79 goto out;
80 }
81
82 /* receive the complete CLC message */
83 vec.iov_base = buf;
84 vec.iov_len = buflen;
85 memset(&msg, 0, sizeof(struct msghdr));
86 krflags = MSG_WAITALL;
87 smc->clcsock->sk->sk_rcvtimeo = CLC_WAIT_TIME;
88 len = kernel_recvmsg(smc->clcsock, &msg, &vec, 1, datlen, krflags);
89 if (len < datlen) {
90 smc->sk.sk_err = EPROTO;
91 reason_code = -EPROTO;
92 goto out;
93 }
94 if (clcm->type == SMC_CLC_DECLINE) {
95 reason_code = SMC_CLC_DECL_REPLY;
96 if (ntohl(((struct smc_clc_msg_decline *)buf)->peer_diagnosis)
97 == SMC_CLC_DECL_SYNCERR)
98 smc->conn.lgr->sync_err = true;
99 }
100
101 out:
102 return reason_code;
103 }
104
105 /* send CLC DECLINE message across internal TCP socket */
106 int smc_clc_send_decline(struct smc_sock *smc, u32 peer_diag_info,
107 u8 out_of_sync)
108 {
109 struct smc_clc_msg_decline dclc;
110 struct msghdr msg;
111 struct kvec vec;
112 int len;
113
114 memset(&dclc, 0, sizeof(dclc));
115 memcpy(dclc.hdr.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
116 dclc.hdr.type = SMC_CLC_DECLINE;
117 dclc.hdr.length = htons(sizeof(struct smc_clc_msg_decline));
118 dclc.hdr.version = SMC_CLC_V1;
119 dclc.hdr.flag = out_of_sync ? 1 : 0;
120 memcpy(dclc.id_for_peer, local_systemid, sizeof(local_systemid));
121 dclc.peer_diagnosis = htonl(peer_diag_info);
122 memcpy(dclc.trl.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
123
124 memset(&msg, 0, sizeof(msg));
125 vec.iov_base = &dclc;
126 vec.iov_len = sizeof(struct smc_clc_msg_decline);
127 len = kernel_sendmsg(smc->clcsock, &msg, &vec, 1,
128 sizeof(struct smc_clc_msg_decline));
129 if (len < sizeof(struct smc_clc_msg_decline))
130 smc->sk.sk_err = EPROTO;
131 if (len < 0)
132 smc->sk.sk_err = -len;
133 return len;
134 }
135
136 /* send CLC PROPOSAL message across internal TCP socket */
137 int smc_clc_send_proposal(struct smc_sock *smc,
138 struct smc_ib_device *smcibdev,
139 u8 ibport)
140 {
141 struct smc_clc_msg_proposal pclc;
142 int reason_code = 0;
143 struct msghdr msg;
144 struct kvec vec;
145 int len, rc;
146
147 /* send SMC Proposal CLC message */
148 memset(&pclc, 0, sizeof(pclc));
149 memcpy(pclc.hdr.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
150 pclc.hdr.type = SMC_CLC_PROPOSAL;
151 pclc.hdr.length = htons(sizeof(pclc));
152 pclc.hdr.version = SMC_CLC_V1; /* SMC version */
153 memcpy(pclc.lcl.id_for_peer, local_systemid, sizeof(local_systemid));
154 memcpy(&pclc.lcl.gid, &smcibdev->gid[ibport - 1], SMC_GID_SIZE);
155 memcpy(&pclc.lcl.mac, &smcibdev->mac[ibport - 1], ETH_ALEN);
156
157 /* determine subnet and mask from internal TCP socket */
158 rc = smc_netinfo_by_tcpsk(smc->clcsock, &pclc.outgoing_subnet,
159 &pclc.prefix_len);
160 if (rc)
161 return SMC_CLC_DECL_CNFERR; /* configuration error */
162 memcpy(pclc.trl.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
163 memset(&msg, 0, sizeof(msg));
164 vec.iov_base = &pclc;
165 vec.iov_len = sizeof(pclc);
166 /* due to the few bytes needed for clc-handshake this cannot block */
167 len = kernel_sendmsg(smc->clcsock, &msg, &vec, 1, sizeof(pclc));
168 if (len < sizeof(pclc)) {
169 if (len >= 0) {
170 reason_code = -ENETUNREACH;
171 smc->sk.sk_err = -reason_code;
172 } else {
173 smc->sk.sk_err = smc->clcsock->sk->sk_err;
174 reason_code = -smc->sk.sk_err;
175 }
176 }
177
178 return reason_code;
179 }
180
181 /* send CLC CONFIRM message across internal TCP socket */
182 int smc_clc_send_confirm(struct smc_sock *smc)
183 {
184 struct smc_connection *conn = &smc->conn;
185 struct smc_clc_msg_accept_confirm cclc;
186 struct smc_link *link;
187 int reason_code = 0;
188 struct msghdr msg;
189 struct kvec vec;
190 int len;
191
192 link = &conn->lgr->lnk[SMC_SINGLE_LINK];
193 /* send SMC Confirm CLC msg */
194 memset(&cclc, 0, sizeof(cclc));
195 memcpy(cclc.hdr.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
196 cclc.hdr.type = SMC_CLC_CONFIRM;
197 cclc.hdr.length = htons(sizeof(cclc));
198 cclc.hdr.version = SMC_CLC_V1; /* SMC version */
199 memcpy(cclc.lcl.id_for_peer, local_systemid, sizeof(local_systemid));
200 memcpy(&cclc.lcl.gid, &link->smcibdev->gid[link->ibport - 1],
201 SMC_GID_SIZE);
202 memcpy(&cclc.lcl.mac, &link->smcibdev->mac[link->ibport - 1], ETH_ALEN);
203 hton24(cclc.qpn, link->roce_qp->qp_num);
204 cclc.rmb_rkey =
205 htonl(conn->rmb_desc->mr_rx[SMC_SINGLE_LINK]->rkey);
206 cclc.conn_idx = 1; /* for now: 1 RMB = 1 RMBE */
207 cclc.rmbe_alert_token = htonl(conn->alert_token_local);
208 cclc.qp_mtu = min(link->path_mtu, link->peer_mtu);
209 cclc.rmbe_size = conn->rmbe_size_short;
210 cclc.rmb_dma_addr =
211 cpu_to_be64((u64)conn->rmb_desc->dma_addr[SMC_SINGLE_LINK]);
212 hton24(cclc.psn, link->psn_initial);
213
214 memcpy(cclc.trl.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
215
216 memset(&msg, 0, sizeof(msg));
217 vec.iov_base = &cclc;
218 vec.iov_len = sizeof(cclc);
219 len = kernel_sendmsg(smc->clcsock, &msg, &vec, 1, sizeof(cclc));
220 if (len < sizeof(cclc)) {
221 if (len >= 0) {
222 reason_code = -ENETUNREACH;
223 smc->sk.sk_err = -reason_code;
224 } else {
225 smc->sk.sk_err = smc->clcsock->sk->sk_err;
226 reason_code = -smc->sk.sk_err;
227 }
228 }
229 return reason_code;
230 }
231
232 /* send CLC ACCEPT message across internal TCP socket */
233 int smc_clc_send_accept(struct smc_sock *new_smc, int srv_first_contact)
234 {
235 struct smc_connection *conn = &new_smc->conn;
236 struct smc_clc_msg_accept_confirm aclc;
237 struct smc_link *link;
238 struct msghdr msg;
239 struct kvec vec;
240 int rc = 0;
241 int len;
242
243 link = &conn->lgr->lnk[SMC_SINGLE_LINK];
244 memset(&aclc, 0, sizeof(aclc));
245 memcpy(aclc.hdr.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
246 aclc.hdr.type = SMC_CLC_ACCEPT;
247 aclc.hdr.length = htons(sizeof(aclc));
248 aclc.hdr.version = SMC_CLC_V1; /* SMC version */
249 if (srv_first_contact)
250 aclc.hdr.flag = 1;
251 memcpy(aclc.lcl.id_for_peer, local_systemid, sizeof(local_systemid));
252 memcpy(&aclc.lcl.gid, &link->smcibdev->gid[link->ibport - 1],
253 SMC_GID_SIZE);
254 memcpy(&aclc.lcl.mac, link->smcibdev->mac[link->ibport - 1], ETH_ALEN);
255 hton24(aclc.qpn, link->roce_qp->qp_num);
256 aclc.rmb_rkey =
257 htonl(conn->rmb_desc->mr_rx[SMC_SINGLE_LINK]->rkey);
258 aclc.conn_idx = 1; /* as long as 1 RMB = 1 RMBE */
259 aclc.rmbe_alert_token = htonl(conn->alert_token_local);
260 aclc.qp_mtu = link->path_mtu;
261 aclc.rmbe_size = conn->rmbe_size_short,
262 aclc.rmb_dma_addr =
263 cpu_to_be64((u64)conn->rmb_desc->dma_addr[SMC_SINGLE_LINK]);
264 hton24(aclc.psn, link->psn_initial);
265 memcpy(aclc.trl.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
266
267 memset(&msg, 0, sizeof(msg));
268 vec.iov_base = &aclc;
269 vec.iov_len = sizeof(aclc);
270 len = kernel_sendmsg(new_smc->clcsock, &msg, &vec, 1, sizeof(aclc));
271 if (len < sizeof(aclc)) {
272 if (len >= 0)
273 new_smc->sk.sk_err = EPROTO;
274 else
275 new_smc->sk.sk_err = new_smc->clcsock->sk->sk_err;
276 rc = sock_error(&new_smc->sk);
277 }
278
279 return rc;
280 }