]>
Commit | Line | Data |
---|---|---|
f0cbd3ec FB |
1 | /* |
2 | * Copyright (c) 1995 Danny Gasparovski. | |
5fafdf24 TS |
3 | * |
4 | * Please read the file COPYRIGHT for the | |
f0cbd3ec FB |
5 | * terms and conditions of the copyright. |
6 | */ | |
7 | ||
7df7482b | 8 | #include "qemu/osdep.h" |
e1c5a2b3 | 9 | #include "qemu-common.h" |
f0cbd3ec FB |
10 | #include <slirp.h> |
11 | #include "ip_icmp.h" | |
ec530c81 FB |
12 | #ifdef __sun__ |
13 | #include <sys/filio.h> | |
14 | #endif | |
f0cbd3ec | 15 | |
9634d903 BS |
16 | static void sofcantrcvmore(struct socket *so); |
17 | static void sofcantsendmore(struct socket *so); | |
18 | ||
8a87f121 GS |
19 | struct socket *solookup(struct socket **last, struct socket *head, |
20 | struct sockaddr_storage *lhost, struct sockaddr_storage *fhost) | |
f0cbd3ec | 21 | { |
a5fd24aa | 22 | struct socket *so = *last; |
5fafdf24 | 23 | |
a5fd24aa | 24 | /* Optimisation */ |
8a87f121 GS |
25 | if (so != head && sockaddr_equal(&(so->lhost.ss), lhost) |
26 | && (!fhost || sockaddr_equal(&so->fhost.ss, fhost))) { | |
a5fd24aa GS |
27 | return so; |
28 | } | |
5fafdf24 | 29 | |
a5fd24aa | 30 | for (so = head->so_next; so != head; so = so->so_next) { |
8a87f121 GS |
31 | if (sockaddr_equal(&(so->lhost.ss), lhost) |
32 | && (!fhost || sockaddr_equal(&so->fhost.ss, fhost))) { | |
a5fd24aa GS |
33 | *last = so; |
34 | return so; | |
35 | } | |
36 | } | |
5fafdf24 | 37 | |
a5fd24aa | 38 | return (struct socket *)NULL; |
f0cbd3ec FB |
39 | } |
40 | ||
41 | /* | |
42 | * Create a new socket, initialise the fields | |
43 | * It is the responsibility of the caller to | |
44 | * insque() it into the correct linked-list | |
45 | */ | |
46 | struct socket * | |
460fec67 | 47 | socreate(Slirp *slirp) |
f0cbd3ec FB |
48 | { |
49 | struct socket *so; | |
5fafdf24 | 50 | |
f0cbd3ec FB |
51 | so = (struct socket *)malloc(sizeof(struct socket)); |
52 | if(so) { | |
53 | memset(so, 0, sizeof(struct socket)); | |
54 | so->so_state = SS_NOFDREF; | |
55 | so->s = -1; | |
460fec67 | 56 | so->slirp = slirp; |
7bd43ec2 | 57 | so->pollfds_idx = -1; |
f0cbd3ec FB |
58 | } |
59 | return(so); | |
60 | } | |
61 | ||
62 | /* | |
63 | * remque and free a socket, clobber cache | |
64 | */ | |
65 | void | |
511d2b14 | 66 | sofree(struct socket *so) |
f0cbd3ec | 67 | { |
460fec67 JK |
68 | Slirp *slirp = so->slirp; |
69 | ||
f0cbd3ec FB |
70 | if (so->so_emu==EMU_RSH && so->extra) { |
71 | sofree(so->extra); | |
72 | so->extra=NULL; | |
73 | } | |
460fec67 JK |
74 | if (so == slirp->tcp_last_so) { |
75 | slirp->tcp_last_so = &slirp->tcb; | |
76 | } else if (so == slirp->udp_last_so) { | |
77 | slirp->udp_last_so = &slirp->udb; | |
e6d43cfb JK |
78 | } else if (so == slirp->icmp_last_so) { |
79 | slirp->icmp_last_so = &slirp->icmp; | |
460fec67 | 80 | } |
f0cbd3ec | 81 | m_free(so->so_m); |
5fafdf24 TS |
82 | |
83 | if(so->so_next && so->so_prev) | |
f0cbd3ec FB |
84 | remque(so); /* crashes if so is not in a queue */ |
85 | ||
86 | free(so); | |
87 | } | |
88 | ||
e1c5a2b3 | 89 | size_t sopreprbuf(struct socket *so, struct iovec *iov, int *np) |
f0cbd3ec | 90 | { |
e1c5a2b3 | 91 | int n, lss, total; |
f0cbd3ec FB |
92 | struct sbuf *sb = &so->so_snd; |
93 | int len = sb->sb_datalen - sb->sb_cc; | |
f0cbd3ec | 94 | int mss = so->so_tcpcb->t_maxseg; |
5fafdf24 | 95 | |
e1c5a2b3 | 96 | DEBUG_CALL("sopreprbuf"); |
ecc804ca | 97 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 98 | |
e1c5a2b3 AL |
99 | if (len <= 0) |
100 | return 0; | |
101 | ||
f0cbd3ec | 102 | iov[0].iov_base = sb->sb_wptr; |
66029f6a BS |
103 | iov[1].iov_base = NULL; |
104 | iov[1].iov_len = 0; | |
f0cbd3ec FB |
105 | if (sb->sb_wptr < sb->sb_rptr) { |
106 | iov[0].iov_len = sb->sb_rptr - sb->sb_wptr; | |
107 | /* Should never succeed, but... */ | |
108 | if (iov[0].iov_len > len) | |
109 | iov[0].iov_len = len; | |
110 | if (iov[0].iov_len > mss) | |
111 | iov[0].iov_len -= iov[0].iov_len%mss; | |
112 | n = 1; | |
113 | } else { | |
114 | iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_wptr; | |
115 | /* Should never succeed, but... */ | |
116 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
117 | len -= iov[0].iov_len; | |
118 | if (len) { | |
119 | iov[1].iov_base = sb->sb_data; | |
120 | iov[1].iov_len = sb->sb_rptr - sb->sb_data; | |
121 | if(iov[1].iov_len > len) | |
122 | iov[1].iov_len = len; | |
123 | total = iov[0].iov_len + iov[1].iov_len; | |
124 | if (total > mss) { | |
125 | lss = total%mss; | |
126 | if (iov[1].iov_len > lss) { | |
127 | iov[1].iov_len -= lss; | |
128 | n = 2; | |
129 | } else { | |
130 | lss -= iov[1].iov_len; | |
131 | iov[0].iov_len -= lss; | |
132 | n = 1; | |
133 | } | |
134 | } else | |
135 | n = 2; | |
136 | } else { | |
137 | if (iov[0].iov_len > mss) | |
138 | iov[0].iov_len -= iov[0].iov_len%mss; | |
139 | n = 1; | |
140 | } | |
141 | } | |
e1c5a2b3 AL |
142 | if (np) |
143 | *np = n; | |
144 | ||
145 | return iov[0].iov_len + (n - 1) * iov[1].iov_len; | |
146 | } | |
147 | ||
148 | /* | |
149 | * Read from so's socket into sb_snd, updating all relevant sbuf fields | |
150 | * NOTE: This will only be called if it is select()ed for reading, so | |
151 | * a read() of 0 (or less) means it's disconnected | |
152 | */ | |
153 | int | |
511d2b14 | 154 | soread(struct socket *so) |
e1c5a2b3 AL |
155 | { |
156 | int n, nn; | |
157 | struct sbuf *sb = &so->so_snd; | |
158 | struct iovec iov[2]; | |
159 | ||
160 | DEBUG_CALL("soread"); | |
ecc804ca | 161 | DEBUG_ARG("so = %p", so); |
e1c5a2b3 AL |
162 | |
163 | /* | |
164 | * No need to check if there's enough room to read. | |
165 | * soread wouldn't have been called if there weren't | |
166 | */ | |
167 | sopreprbuf(so, iov, &n); | |
5fafdf24 | 168 | |
f0cbd3ec FB |
169 | #ifdef HAVE_READV |
170 | nn = readv(so->s, (struct iovec *)iov, n); | |
171 | DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn)); | |
172 | #else | |
00aa0040 | 173 | nn = qemu_recv(so->s, iov[0].iov_base, iov[0].iov_len,0); |
5fafdf24 | 174 | #endif |
f0cbd3ec FB |
175 | if (nn <= 0) { |
176 | if (nn < 0 && (errno == EINTR || errno == EAGAIN)) | |
177 | return 0; | |
178 | else { | |
179 | DEBUG_MISC((dfd, " --- soread() disconnected, nn = %d, errno = %d-%s\n", nn, errno,strerror(errno))); | |
180 | sofcantrcvmore(so); | |
181 | tcp_sockclosed(sototcpcb(so)); | |
182 | return -1; | |
183 | } | |
184 | } | |
5fafdf24 | 185 | |
f0cbd3ec FB |
186 | #ifndef HAVE_READV |
187 | /* | |
188 | * If there was no error, try and read the second time round | |
189 | * We read again if n = 2 (ie, there's another part of the buffer) | |
190 | * and we read as much as we could in the first read | |
191 | * We don't test for <= 0 this time, because there legitimately | |
192 | * might not be any more data (since the socket is non-blocking), | |
193 | * a close will be detected on next iteration. | |
194 | * A return of -1 wont (shouldn't) happen, since it didn't happen above | |
195 | */ | |
17444c9c FB |
196 | if (n == 2 && nn == iov[0].iov_len) { |
197 | int ret; | |
00aa0040 | 198 | ret = qemu_recv(so->s, iov[1].iov_base, iov[1].iov_len,0); |
17444c9c FB |
199 | if (ret > 0) |
200 | nn += ret; | |
201 | } | |
5fafdf24 | 202 | |
f0cbd3ec FB |
203 | DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn)); |
204 | #endif | |
5fafdf24 | 205 | |
f0cbd3ec FB |
206 | /* Update fields */ |
207 | sb->sb_cc += nn; | |
208 | sb->sb_wptr += nn; | |
209 | if (sb->sb_wptr >= (sb->sb_data + sb->sb_datalen)) | |
210 | sb->sb_wptr -= sb->sb_datalen; | |
211 | return nn; | |
212 | } | |
5fafdf24 | 213 | |
e1c5a2b3 AL |
214 | int soreadbuf(struct socket *so, const char *buf, int size) |
215 | { | |
216 | int n, nn, copy = size; | |
217 | struct sbuf *sb = &so->so_snd; | |
218 | struct iovec iov[2]; | |
219 | ||
220 | DEBUG_CALL("soreadbuf"); | |
ecc804ca | 221 | DEBUG_ARG("so = %p", so); |
e1c5a2b3 AL |
222 | |
223 | /* | |
224 | * No need to check if there's enough room to read. | |
225 | * soread wouldn't have been called if there weren't | |
226 | */ | |
227 | if (sopreprbuf(so, iov, &n) < size) | |
228 | goto err; | |
229 | ||
230 | nn = MIN(iov[0].iov_len, copy); | |
231 | memcpy(iov[0].iov_base, buf, nn); | |
232 | ||
233 | copy -= nn; | |
234 | buf += nn; | |
235 | ||
236 | if (copy == 0) | |
237 | goto done; | |
238 | ||
239 | memcpy(iov[1].iov_base, buf, copy); | |
240 | ||
241 | done: | |
242 | /* Update fields */ | |
243 | sb->sb_cc += size; | |
244 | sb->sb_wptr += size; | |
245 | if (sb->sb_wptr >= (sb->sb_data + sb->sb_datalen)) | |
246 | sb->sb_wptr -= sb->sb_datalen; | |
247 | return size; | |
248 | err: | |
249 | ||
250 | sofcantrcvmore(so); | |
251 | tcp_sockclosed(sototcpcb(so)); | |
252 | fprintf(stderr, "soreadbuf buffer to small"); | |
253 | return -1; | |
254 | } | |
255 | ||
f0cbd3ec FB |
256 | /* |
257 | * Get urgent data | |
5fafdf24 | 258 | * |
f0cbd3ec FB |
259 | * When the socket is created, we set it SO_OOBINLINE, |
260 | * so when OOB data arrives, we soread() it and everything | |
261 | * in the send buffer is sent as urgent data | |
262 | */ | |
bfb1ac14 | 263 | int |
511d2b14 | 264 | sorecvoob(struct socket *so) |
f0cbd3ec FB |
265 | { |
266 | struct tcpcb *tp = sototcpcb(so); | |
bfb1ac14 | 267 | int ret; |
f0cbd3ec FB |
268 | |
269 | DEBUG_CALL("sorecvoob"); | |
ecc804ca | 270 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 271 | |
f0cbd3ec FB |
272 | /* |
273 | * We take a guess at how much urgent data has arrived. | |
274 | * In most situations, when urgent data arrives, the next | |
275 | * read() should get all the urgent data. This guess will | |
276 | * be wrong however if more data arrives just after the | |
5fafdf24 | 277 | * urgent data, or the read() doesn't return all the |
f0cbd3ec FB |
278 | * urgent data. |
279 | */ | |
bfb1ac14 SL |
280 | ret = soread(so); |
281 | if (ret > 0) { | |
282 | tp->snd_up = tp->snd_una + so->so_snd.sb_cc; | |
283 | tp->t_force = 1; | |
284 | tcp_output(tp); | |
285 | tp->t_force = 0; | |
286 | } | |
287 | ||
288 | return ret; | |
f0cbd3ec FB |
289 | } |
290 | ||
291 | /* | |
292 | * Send urgent data | |
293 | * There's a lot duplicated code here, but... | |
294 | */ | |
295 | int | |
511d2b14 | 296 | sosendoob(struct socket *so) |
f0cbd3ec FB |
297 | { |
298 | struct sbuf *sb = &so->so_rcv; | |
299 | char buff[2048]; /* XXX Shouldn't be sending more oob data than this */ | |
5fafdf24 | 300 | |
f0cbd3ec | 301 | int n, len; |
5fafdf24 | 302 | |
f0cbd3ec | 303 | DEBUG_CALL("sosendoob"); |
ecc804ca | 304 | DEBUG_ARG("so = %p", so); |
f0cbd3ec | 305 | DEBUG_ARG("sb->sb_cc = %d", sb->sb_cc); |
5fafdf24 | 306 | |
f0cbd3ec FB |
307 | if (so->so_urgc > 2048) |
308 | so->so_urgc = 2048; /* XXXX */ | |
5fafdf24 | 309 | |
f0cbd3ec FB |
310 | if (sb->sb_rptr < sb->sb_wptr) { |
311 | /* We can send it directly */ | |
e1c5a2b3 | 312 | n = slirp_send(so, sb->sb_rptr, so->so_urgc, (MSG_OOB)); /* |MSG_DONTWAIT)); */ |
f0cbd3ec | 313 | so->so_urgc -= n; |
3b46e624 | 314 | |
f0cbd3ec FB |
315 | DEBUG_MISC((dfd, " --- sent %d bytes urgent data, %d urgent bytes left\n", n, so->so_urgc)); |
316 | } else { | |
5fafdf24 | 317 | /* |
f0cbd3ec FB |
318 | * Since there's no sendv or sendtov like writev, |
319 | * we must copy all data to a linear buffer then | |
320 | * send it all | |
321 | */ | |
322 | len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr; | |
323 | if (len > so->so_urgc) len = so->so_urgc; | |
324 | memcpy(buff, sb->sb_rptr, len); | |
325 | so->so_urgc -= len; | |
326 | if (so->so_urgc) { | |
327 | n = sb->sb_wptr - sb->sb_data; | |
328 | if (n > so->so_urgc) n = so->so_urgc; | |
329 | memcpy((buff + len), sb->sb_data, n); | |
330 | so->so_urgc -= n; | |
331 | len += n; | |
332 | } | |
e1c5a2b3 | 333 | n = slirp_send(so, buff, len, (MSG_OOB)); /* |MSG_DONTWAIT)); */ |
f0cbd3ec FB |
334 | #ifdef DEBUG |
335 | if (n != len) | |
336 | DEBUG_ERROR((dfd, "Didn't send all data urgently XXXXX\n")); | |
3b46e624 | 337 | #endif |
f0cbd3ec FB |
338 | DEBUG_MISC((dfd, " ---2 sent %d bytes urgent data, %d urgent bytes left\n", n, so->so_urgc)); |
339 | } | |
5fafdf24 | 340 | |
f0cbd3ec FB |
341 | sb->sb_cc -= n; |
342 | sb->sb_rptr += n; | |
343 | if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen)) | |
344 | sb->sb_rptr -= sb->sb_datalen; | |
5fafdf24 | 345 | |
f0cbd3ec FB |
346 | return n; |
347 | } | |
348 | ||
349 | /* | |
5fafdf24 | 350 | * Write data from so_rcv to so's socket, |
f0cbd3ec FB |
351 | * updating all sbuf field as necessary |
352 | */ | |
353 | int | |
511d2b14 | 354 | sowrite(struct socket *so) |
f0cbd3ec FB |
355 | { |
356 | int n,nn; | |
357 | struct sbuf *sb = &so->so_rcv; | |
358 | int len = sb->sb_cc; | |
359 | struct iovec iov[2]; | |
5fafdf24 | 360 | |
f0cbd3ec | 361 | DEBUG_CALL("sowrite"); |
ecc804ca | 362 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 363 | |
f0cbd3ec FB |
364 | if (so->so_urgc) { |
365 | sosendoob(so); | |
366 | if (sb->sb_cc == 0) | |
367 | return 0; | |
368 | } | |
369 | ||
370 | /* | |
371 | * No need to check if there's something to write, | |
372 | * sowrite wouldn't have been called otherwise | |
373 | */ | |
5fafdf24 | 374 | |
f0cbd3ec | 375 | iov[0].iov_base = sb->sb_rptr; |
66029f6a BS |
376 | iov[1].iov_base = NULL; |
377 | iov[1].iov_len = 0; | |
f0cbd3ec FB |
378 | if (sb->sb_rptr < sb->sb_wptr) { |
379 | iov[0].iov_len = sb->sb_wptr - sb->sb_rptr; | |
380 | /* Should never succeed, but... */ | |
381 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
382 | n = 1; | |
383 | } else { | |
384 | iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr; | |
385 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
386 | len -= iov[0].iov_len; | |
387 | if (len) { | |
388 | iov[1].iov_base = sb->sb_data; | |
389 | iov[1].iov_len = sb->sb_wptr - sb->sb_data; | |
390 | if (iov[1].iov_len > len) iov[1].iov_len = len; | |
391 | n = 2; | |
392 | } else | |
393 | n = 1; | |
394 | } | |
395 | /* Check if there's urgent data to send, and if so, send it */ | |
396 | ||
397 | #ifdef HAVE_READV | |
398 | nn = writev(so->s, (const struct iovec *)iov, n); | |
5fafdf24 | 399 | |
f0cbd3ec FB |
400 | DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn)); |
401 | #else | |
e1c5a2b3 | 402 | nn = slirp_send(so, iov[0].iov_base, iov[0].iov_len,0); |
f0cbd3ec FB |
403 | #endif |
404 | /* This should never happen, but people tell me it does *shrug* */ | |
405 | if (nn < 0 && (errno == EAGAIN || errno == EINTR)) | |
406 | return 0; | |
5fafdf24 | 407 | |
f0cbd3ec FB |
408 | if (nn <= 0) { |
409 | DEBUG_MISC((dfd, " --- sowrite disconnected, so->so_state = %x, errno = %d\n", | |
410 | so->so_state, errno)); | |
411 | sofcantsendmore(so); | |
412 | tcp_sockclosed(sototcpcb(so)); | |
413 | return -1; | |
414 | } | |
5fafdf24 | 415 | |
f0cbd3ec | 416 | #ifndef HAVE_READV |
3bc2175d FB |
417 | if (n == 2 && nn == iov[0].iov_len) { |
418 | int ret; | |
e1c5a2b3 | 419 | ret = slirp_send(so, iov[1].iov_base, iov[1].iov_len,0); |
3bc2175d FB |
420 | if (ret > 0) |
421 | nn += ret; | |
422 | } | |
f0cbd3ec FB |
423 | DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn)); |
424 | #endif | |
5fafdf24 | 425 | |
f0cbd3ec FB |
426 | /* Update sbuf */ |
427 | sb->sb_cc -= nn; | |
428 | sb->sb_rptr += nn; | |
429 | if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen)) | |
430 | sb->sb_rptr -= sb->sb_datalen; | |
5fafdf24 | 431 | |
f0cbd3ec FB |
432 | /* |
433 | * If in DRAIN mode, and there's no more data, set | |
434 | * it CANTSENDMORE | |
435 | */ | |
436 | if ((so->so_state & SS_FWDRAIN) && sb->sb_cc == 0) | |
437 | sofcantsendmore(so); | |
5fafdf24 | 438 | |
f0cbd3ec FB |
439 | return nn; |
440 | } | |
441 | ||
442 | /* | |
443 | * recvfrom() a UDP socket | |
444 | */ | |
445 | void | |
511d2b14 | 446 | sorecvfrom(struct socket *so) |
f0cbd3ec | 447 | { |
eae303ff | 448 | struct sockaddr_storage addr; |
5379229a | 449 | struct sockaddr_storage saddr, daddr; |
eae303ff | 450 | socklen_t addrlen = sizeof(struct sockaddr_storage); |
5fafdf24 | 451 | |
f0cbd3ec | 452 | DEBUG_CALL("sorecvfrom"); |
ecc804ca | 453 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 454 | |
f0cbd3ec FB |
455 | if (so->so_type == IPPROTO_ICMP) { /* This is a "ping" reply */ |
456 | char buff[256]; | |
457 | int len; | |
3b46e624 | 458 | |
5fafdf24 | 459 | len = recvfrom(so->s, buff, 256, 0, |
f0cbd3ec FB |
460 | (struct sockaddr *)&addr, &addrlen); |
461 | /* XXX Check if reply is "correct"? */ | |
3b46e624 | 462 | |
f0cbd3ec FB |
463 | if(len == -1 || len == 0) { |
464 | u_char code=ICMP_UNREACH_PORT; | |
465 | ||
466 | if(errno == EHOSTUNREACH) code=ICMP_UNREACH_HOST; | |
467 | else if(errno == ENETUNREACH) code=ICMP_UNREACH_NET; | |
3b46e624 | 468 | |
f0cbd3ec FB |
469 | DEBUG_MISC((dfd," udp icmp rx errno = %d-%s\n", |
470 | errno,strerror(errno))); | |
de40abfe | 471 | icmp_send_error(so->so_m, ICMP_UNREACH, code, 0, strerror(errno)); |
f0cbd3ec FB |
472 | } else { |
473 | icmp_reflect(so->so_m); | |
511d2b14 | 474 | so->so_m = NULL; /* Don't m_free() it again! */ |
f0cbd3ec FB |
475 | } |
476 | /* No need for this socket anymore, udp_detach it */ | |
477 | udp_detach(so); | |
478 | } else { /* A "normal" UDP packet */ | |
479 | struct mbuf *m; | |
c5b76b38 BS |
480 | int len; |
481 | #ifdef _WIN32 | |
482 | unsigned long n; | |
483 | #else | |
484 | int n; | |
485 | #endif | |
f0cbd3ec | 486 | |
460fec67 JK |
487 | m = m_get(so->slirp); |
488 | if (!m) { | |
489 | return; | |
490 | } | |
98c63057 GS |
491 | switch (so->so_ffamily) { |
492 | case AF_INET: | |
493 | m->m_data += IF_MAXLINKHDR + sizeof(struct udpiphdr); | |
494 | break; | |
495 | case AF_INET6: | |
496 | m->m_data += IF_MAXLINKHDR + sizeof(struct ip6) | |
497 | + sizeof(struct udphdr); | |
498 | break; | |
499 | default: | |
500 | g_assert_not_reached(); | |
501 | break; | |
502 | } | |
3b46e624 | 503 | |
5fafdf24 | 504 | /* |
f0cbd3ec FB |
505 | * XXX Shouldn't FIONREAD packets destined for port 53, |
506 | * but I don't know the max packet size for DNS lookups | |
507 | */ | |
508 | len = M_FREEROOM(m); | |
509 | /* if (so->so_fport != htons(53)) { */ | |
379ff53d | 510 | ioctlsocket(so->s, FIONREAD, &n); |
3b46e624 | 511 | |
f0cbd3ec FB |
512 | if (n > len) { |
513 | n = (m->m_data - m->m_dat) + m->m_len + n + 1; | |
514 | m_inc(m, n); | |
515 | len = M_FREEROOM(m); | |
516 | } | |
517 | /* } */ | |
3b46e624 | 518 | |
f0cbd3ec FB |
519 | m->m_len = recvfrom(so->s, m->m_data, len, 0, |
520 | (struct sockaddr *)&addr, &addrlen); | |
5fafdf24 | 521 | DEBUG_MISC((dfd, " did recvfrom %d, errno = %d-%s\n", |
f0cbd3ec FB |
522 | m->m_len, errno,strerror(errno))); |
523 | if(m->m_len<0) { | |
15d62af4 GS |
524 | /* Report error as ICMP */ |
525 | switch (so->so_lfamily) { | |
526 | uint8_t code; | |
527 | case AF_INET: | |
528 | code = ICMP_UNREACH_PORT; | |
529 | ||
530 | if (errno == EHOSTUNREACH) { | |
531 | code = ICMP_UNREACH_HOST; | |
532 | } else if (errno == ENETUNREACH) { | |
533 | code = ICMP_UNREACH_NET; | |
534 | } | |
535 | ||
536 | DEBUG_MISC((dfd, " rx error, tx icmp ICMP_UNREACH:%i\n", code)); | |
537 | icmp_send_error(so->so_m, ICMP_UNREACH, code, 0, strerror(errno)); | |
538 | break; | |
539 | case AF_INET6: | |
540 | code = ICMP6_UNREACH_PORT; | |
541 | ||
542 | if (errno == EHOSTUNREACH) { | |
543 | code = ICMP6_UNREACH_ADDRESS; | |
544 | } else if (errno == ENETUNREACH) { | |
545 | code = ICMP6_UNREACH_NO_ROUTE; | |
546 | } | |
547 | ||
548 | DEBUG_MISC((dfd, " rx error, tx icmp6 ICMP_UNREACH:%i\n", code)); | |
549 | icmp6_send_error(so->so_m, ICMP6_UNREACH, code); | |
550 | break; | |
551 | default: | |
552 | g_assert_not_reached(); | |
553 | break; | |
554 | } | |
f0cbd3ec FB |
555 | m_free(m); |
556 | } else { | |
557 | /* | |
558 | * Hack: domain name lookup will be used the most for UDP, | |
559 | * and since they'll only be used once there's no need | |
560 | * for the 4 minute (or whatever) timeout... So we time them | |
561 | * out much quicker (10 seconds for now...) | |
562 | */ | |
563 | if (so->so_expire) { | |
564 | if (so->so_fport == htons(53)) | |
565 | so->so_expire = curtime + SO_EXPIREFAST; | |
566 | else | |
567 | so->so_expire = curtime + SO_EXPIRE; | |
568 | } | |
569 | ||
5fafdf24 | 570 | /* |
f0cbd3ec | 571 | * If this packet was destined for CTL_ADDR, |
5379229a | 572 | * make it look like that's where it came from |
f0cbd3ec | 573 | */ |
5379229a GS |
574 | saddr = addr; |
575 | sotranslate_in(so, &saddr); | |
576 | daddr = so->lhost.ss; | |
577 | ||
eae303ff GS |
578 | switch (so->so_ffamily) { |
579 | case AF_INET: | |
5379229a GS |
580 | udp_output(so, m, (struct sockaddr_in *) &saddr, |
581 | (struct sockaddr_in *) &daddr, | |
582 | so->so_iptos); | |
eae303ff | 583 | break; |
15d62af4 GS |
584 | case AF_INET6: |
585 | udp6_output(so, m, (struct sockaddr_in6 *) &saddr, | |
586 | (struct sockaddr_in6 *) &daddr); | |
587 | break; | |
eae303ff | 588 | default: |
15d62af4 | 589 | g_assert_not_reached(); |
eae303ff GS |
590 | break; |
591 | } | |
f0cbd3ec FB |
592 | } /* rx error */ |
593 | } /* if ping packet */ | |
594 | } | |
595 | ||
596 | /* | |
597 | * sendto() a socket | |
598 | */ | |
599 | int | |
511d2b14 | 600 | sosendto(struct socket *so, struct mbuf *m) |
f0cbd3ec FB |
601 | { |
602 | int ret; | |
5379229a | 603 | struct sockaddr_storage addr; |
f0cbd3ec FB |
604 | |
605 | DEBUG_CALL("sosendto"); | |
ecc804ca SW |
606 | DEBUG_ARG("so = %p", so); |
607 | DEBUG_ARG("m = %p", m); | |
5fafdf24 | 608 | |
5379229a GS |
609 | addr = so->fhost.ss; |
610 | DEBUG_CALL(" sendto()ing)"); | |
611 | sotranslate_out(so, &addr); | |
5fafdf24 | 612 | |
f0cbd3ec FB |
613 | /* Don't care what port we get */ |
614 | ret = sendto(so->s, m->m_data, m->m_len, 0, | |
5379229a | 615 | (struct sockaddr *)&addr, sizeof(addr)); |
f0cbd3ec FB |
616 | if (ret < 0) |
617 | return -1; | |
5fafdf24 | 618 | |
f0cbd3ec FB |
619 | /* |
620 | * Kill the socket if there's no reply in 4 minutes, | |
621 | * but only if it's an expirable socket | |
622 | */ | |
623 | if (so->so_expire) | |
624 | so->so_expire = curtime + SO_EXPIRE; | |
f932b6ce JK |
625 | so->so_state &= SS_PERSISTENT_MASK; |
626 | so->so_state |= SS_ISFCONNECTED; /* So that it gets select()ed */ | |
f0cbd3ec FB |
627 | return 0; |
628 | } | |
629 | ||
630 | /* | |
3c6a0580 | 631 | * Listen for incoming TCP connections |
f0cbd3ec FB |
632 | */ |
633 | struct socket * | |
b6dce92e | 634 | tcp_listen(Slirp *slirp, uint32_t haddr, u_int hport, uint32_t laddr, |
460fec67 | 635 | u_int lport, int flags) |
f0cbd3ec FB |
636 | { |
637 | struct sockaddr_in addr; | |
638 | struct socket *so; | |
242acf3a AZ |
639 | int s, opt = 1; |
640 | socklen_t addrlen = sizeof(addr); | |
ab07b980 | 641 | memset(&addr, 0, addrlen); |
f0cbd3ec | 642 | |
3c6a0580 | 643 | DEBUG_CALL("tcp_listen"); |
9f349498 JK |
644 | DEBUG_ARG("haddr = %x", haddr); |
645 | DEBUG_ARG("hport = %d", hport); | |
f0cbd3ec FB |
646 | DEBUG_ARG("laddr = %x", laddr); |
647 | DEBUG_ARG("lport = %d", lport); | |
648 | DEBUG_ARG("flags = %x", flags); | |
5fafdf24 | 649 | |
460fec67 JK |
650 | so = socreate(slirp); |
651 | if (!so) { | |
f0cbd3ec FB |
652 | return NULL; |
653 | } | |
5fafdf24 | 654 | |
f0cbd3ec FB |
655 | /* Don't tcp_attach... we don't need so_snd nor so_rcv */ |
656 | if ((so->so_tcpcb = tcp_newtcpcb(so)) == NULL) { | |
657 | free(so); | |
658 | return NULL; | |
659 | } | |
460fec67 | 660 | insque(so, &slirp->tcb); |
5fafdf24 TS |
661 | |
662 | /* | |
f0cbd3ec FB |
663 | * SS_FACCEPTONCE sockets must time out. |
664 | */ | |
665 | if (flags & SS_FACCEPTONCE) | |
666 | so->so_tcpcb->t_timer[TCPT_KEEP] = TCPTV_KEEP_INIT*2; | |
5fafdf24 | 667 | |
f932b6ce JK |
668 | so->so_state &= SS_PERSISTENT_MASK; |
669 | so->so_state |= (SS_FACCEPTCONN | flags); | |
eae303ff | 670 | so->so_lfamily = AF_INET; |
f0cbd3ec FB |
671 | so->so_lport = lport; /* Kept in network format */ |
672 | so->so_laddr.s_addr = laddr; /* Ditto */ | |
5fafdf24 | 673 | |
f0cbd3ec | 674 | addr.sin_family = AF_INET; |
3c6a0580 JK |
675 | addr.sin_addr.s_addr = haddr; |
676 | addr.sin_port = hport; | |
5fafdf24 | 677 | |
40ff6d7e | 678 | if (((s = qemu_socket(AF_INET,SOCK_STREAM,0)) < 0) || |
aad1239a | 679 | (socket_set_fast_reuse(s) < 0) || |
f0cbd3ec FB |
680 | (bind(s,(struct sockaddr *)&addr, sizeof(addr)) < 0) || |
681 | (listen(s,1) < 0)) { | |
682 | int tmperrno = errno; /* Don't clobber the real reason we failed */ | |
3b46e624 | 683 | |
f0cbd3ec FB |
684 | close(s); |
685 | sofree(so); | |
686 | /* Restore the real errno */ | |
02d2c54c FB |
687 | #ifdef _WIN32 |
688 | WSASetLastError(tmperrno); | |
689 | #else | |
f0cbd3ec | 690 | errno = tmperrno; |
02d2c54c | 691 | #endif |
f0cbd3ec FB |
692 | return NULL; |
693 | } | |
9957fc7f | 694 | qemu_setsockopt(s, SOL_SOCKET, SO_OOBINLINE, &opt, sizeof(int)); |
5fafdf24 | 695 | |
f0cbd3ec | 696 | getsockname(s,(struct sockaddr *)&addr,&addrlen); |
eae303ff | 697 | so->so_ffamily = AF_INET; |
f0cbd3ec FB |
698 | so->so_fport = addr.sin_port; |
699 | if (addr.sin_addr.s_addr == 0 || addr.sin_addr.s_addr == loopback_addr.s_addr) | |
460fec67 | 700 | so->so_faddr = slirp->vhost_addr; |
f0cbd3ec FB |
701 | else |
702 | so->so_faddr = addr.sin_addr; | |
703 | ||
704 | so->s = s; | |
705 | return so; | |
706 | } | |
707 | ||
f0cbd3ec FB |
708 | /* |
709 | * Various session state calls | |
710 | * XXX Should be #define's | |
711 | * The socket state stuff needs work, these often get called 2 or 3 | |
712 | * times each when only 1 was needed | |
713 | */ | |
714 | void | |
511d2b14 | 715 | soisfconnecting(struct socket *so) |
f0cbd3ec FB |
716 | { |
717 | so->so_state &= ~(SS_NOFDREF|SS_ISFCONNECTED|SS_FCANTRCVMORE| | |
718 | SS_FCANTSENDMORE|SS_FWDRAIN); | |
719 | so->so_state |= SS_ISFCONNECTING; /* Clobber other states */ | |
720 | } | |
721 | ||
722 | void | |
511d2b14 | 723 | soisfconnected(struct socket *so) |
f0cbd3ec FB |
724 | { |
725 | so->so_state &= ~(SS_ISFCONNECTING|SS_FWDRAIN|SS_NOFDREF); | |
726 | so->so_state |= SS_ISFCONNECTED; /* Clobber other states */ | |
727 | } | |
728 | ||
9634d903 BS |
729 | static void |
730 | sofcantrcvmore(struct socket *so) | |
f0cbd3ec FB |
731 | { |
732 | if ((so->so_state & SS_NOFDREF) == 0) { | |
733 | shutdown(so->s,0); | |
f0cbd3ec FB |
734 | } |
735 | so->so_state &= ~(SS_ISFCONNECTING); | |
f932b6ce JK |
736 | if (so->so_state & SS_FCANTSENDMORE) { |
737 | so->so_state &= SS_PERSISTENT_MASK; | |
738 | so->so_state |= SS_NOFDREF; /* Don't select it */ | |
739 | } else { | |
f0cbd3ec | 740 | so->so_state |= SS_FCANTRCVMORE; |
f932b6ce | 741 | } |
f0cbd3ec FB |
742 | } |
743 | ||
9634d903 BS |
744 | static void |
745 | sofcantsendmore(struct socket *so) | |
f0cbd3ec FB |
746 | { |
747 | if ((so->so_state & SS_NOFDREF) == 0) { | |
02d2c54c | 748 | shutdown(so->s,1); /* send FIN to fhost */ |
f0cbd3ec FB |
749 | } |
750 | so->so_state &= ~(SS_ISFCONNECTING); | |
f932b6ce JK |
751 | if (so->so_state & SS_FCANTRCVMORE) { |
752 | so->so_state &= SS_PERSISTENT_MASK; | |
753 | so->so_state |= SS_NOFDREF; /* as above */ | |
754 | } else { | |
f0cbd3ec | 755 | so->so_state |= SS_FCANTSENDMORE; |
f932b6ce | 756 | } |
f0cbd3ec FB |
757 | } |
758 | ||
f0cbd3ec FB |
759 | /* |
760 | * Set write drain mode | |
761 | * Set CANTSENDMORE once all data has been write()n | |
762 | */ | |
763 | void | |
511d2b14 | 764 | sofwdrain(struct socket *so) |
f0cbd3ec FB |
765 | { |
766 | if (so->so_rcv.sb_cc) | |
767 | so->so_state |= SS_FWDRAIN; | |
768 | else | |
769 | sofcantsendmore(so); | |
770 | } | |
5379229a GS |
771 | |
772 | /* | |
773 | * Translate addr in host addr when it is a virtual address | |
774 | */ | |
775 | void sotranslate_out(struct socket *so, struct sockaddr_storage *addr) | |
776 | { | |
777 | Slirp *slirp = so->slirp; | |
778 | struct sockaddr_in *sin = (struct sockaddr_in *)addr; | |
05061d85 | 779 | struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr; |
5379229a GS |
780 | |
781 | switch (addr->ss_family) { | |
782 | case AF_INET: | |
783 | if ((so->so_faddr.s_addr & slirp->vnetwork_mask.s_addr) == | |
784 | slirp->vnetwork_addr.s_addr) { | |
785 | /* It's an alias */ | |
786 | if (so->so_faddr.s_addr == slirp->vnameserver_addr.s_addr) { | |
787 | if (get_dns_addr(&sin->sin_addr) < 0) { | |
788 | sin->sin_addr = loopback_addr; | |
789 | } | |
790 | } else { | |
791 | sin->sin_addr = loopback_addr; | |
792 | } | |
793 | } | |
794 | ||
795 | DEBUG_MISC((dfd, " addr.sin_port=%d, " | |
796 | "addr.sin_addr.s_addr=%.16s\n", | |
797 | ntohs(sin->sin_port), inet_ntoa(sin->sin_addr))); | |
798 | break; | |
799 | ||
05061d85 GS |
800 | case AF_INET6: |
801 | if (in6_equal_net(&so->so_faddr6, &slirp->vprefix_addr6, | |
802 | slirp->vprefix_len)) { | |
803 | if (in6_equal(&so->so_faddr6, &slirp->vnameserver_addr6)) { | |
804 | /*if (get_dns_addr(&addr) < 0) {*/ /* TODO */ | |
805 | sin6->sin6_addr = in6addr_loopback; | |
806 | /*}*/ | |
807 | } else { | |
808 | sin6->sin6_addr = in6addr_loopback; | |
809 | } | |
810 | } | |
811 | break; | |
812 | ||
5379229a GS |
813 | default: |
814 | break; | |
815 | } | |
816 | } | |
817 | ||
818 | void sotranslate_in(struct socket *so, struct sockaddr_storage *addr) | |
819 | { | |
820 | Slirp *slirp = so->slirp; | |
821 | struct sockaddr_in *sin = (struct sockaddr_in *)addr; | |
05061d85 | 822 | struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr; |
5379229a GS |
823 | |
824 | switch (addr->ss_family) { | |
825 | case AF_INET: | |
826 | if ((so->so_faddr.s_addr & slirp->vnetwork_mask.s_addr) == | |
827 | slirp->vnetwork_addr.s_addr) { | |
828 | uint32_t inv_mask = ~slirp->vnetwork_mask.s_addr; | |
829 | ||
830 | if ((so->so_faddr.s_addr & inv_mask) == inv_mask) { | |
831 | sin->sin_addr = slirp->vhost_addr; | |
832 | } else if (sin->sin_addr.s_addr == loopback_addr.s_addr || | |
833 | so->so_faddr.s_addr != slirp->vhost_addr.s_addr) { | |
834 | sin->sin_addr = so->so_faddr; | |
835 | } | |
836 | } | |
837 | break; | |
838 | ||
05061d85 GS |
839 | case AF_INET6: |
840 | if (in6_equal_net(&so->so_faddr6, &slirp->vprefix_addr6, | |
841 | slirp->vprefix_len)) { | |
842 | if (in6_equal(&sin6->sin6_addr, &in6addr_loopback) | |
843 | || !in6_equal(&so->so_faddr6, &slirp->vhost_addr6)) { | |
844 | sin6->sin6_addr = so->so_faddr6; | |
845 | } | |
846 | } | |
847 | break; | |
848 | ||
5379229a GS |
849 | default: |
850 | break; | |
851 | } | |
852 | } | |
853 | ||
854 | /* | |
855 | * Translate connections from localhost to the real hostname | |
856 | */ | |
857 | void sotranslate_accept(struct socket *so) | |
858 | { | |
859 | Slirp *slirp = so->slirp; | |
860 | ||
861 | switch (so->so_ffamily) { | |
862 | case AF_INET: | |
863 | if (so->so_faddr.s_addr == INADDR_ANY || | |
864 | (so->so_faddr.s_addr & loopback_mask) == | |
865 | (loopback_addr.s_addr & loopback_mask)) { | |
866 | so->so_faddr = slirp->vhost_addr; | |
867 | } | |
868 | break; | |
869 | ||
05061d85 GS |
870 | case AF_INET6: |
871 | if (in6_equal(&so->so_faddr6, &in6addr_any) || | |
872 | in6_equal(&so->so_faddr6, &in6addr_loopback)) { | |
873 | so->so_faddr6 = slirp->vhost_addr6; | |
874 | } | |
875 | break; | |
876 | ||
5379229a GS |
877 | default: |
878 | break; | |
879 | } | |
880 | } |