]>
Commit | Line | Data |
---|---|---|
f0cbd3ec FB |
1 | /* |
2 | * Copyright (c) 1995 Danny Gasparovski. | |
5fafdf24 TS |
3 | * |
4 | * Please read the file COPYRIGHT for the | |
f0cbd3ec FB |
5 | * terms and conditions of the copyright. |
6 | */ | |
7 | ||
7df7482b | 8 | #include "qemu/osdep.h" |
e1c5a2b3 | 9 | #include "qemu-common.h" |
a9c94277 | 10 | #include "slirp.h" |
f0cbd3ec | 11 | #include "ip_icmp.h" |
ec530c81 FB |
12 | #ifdef __sun__ |
13 | #include <sys/filio.h> | |
14 | #endif | |
f0cbd3ec | 15 | |
9634d903 BS |
16 | static void sofcantrcvmore(struct socket *so); |
17 | static void sofcantsendmore(struct socket *so); | |
18 | ||
8a87f121 GS |
19 | struct socket *solookup(struct socket **last, struct socket *head, |
20 | struct sockaddr_storage *lhost, struct sockaddr_storage *fhost) | |
f0cbd3ec | 21 | { |
a5fd24aa | 22 | struct socket *so = *last; |
5fafdf24 | 23 | |
a5fd24aa | 24 | /* Optimisation */ |
8a87f121 GS |
25 | if (so != head && sockaddr_equal(&(so->lhost.ss), lhost) |
26 | && (!fhost || sockaddr_equal(&so->fhost.ss, fhost))) { | |
a5fd24aa GS |
27 | return so; |
28 | } | |
5fafdf24 | 29 | |
a5fd24aa | 30 | for (so = head->so_next; so != head; so = so->so_next) { |
8a87f121 GS |
31 | if (sockaddr_equal(&(so->lhost.ss), lhost) |
32 | && (!fhost || sockaddr_equal(&so->fhost.ss, fhost))) { | |
a5fd24aa GS |
33 | *last = so; |
34 | return so; | |
35 | } | |
36 | } | |
5fafdf24 | 37 | |
a5fd24aa | 38 | return (struct socket *)NULL; |
f0cbd3ec FB |
39 | } |
40 | ||
41 | /* | |
42 | * Create a new socket, initialise the fields | |
43 | * It is the responsibility of the caller to | |
44 | * insque() it into the correct linked-list | |
45 | */ | |
46 | struct socket * | |
460fec67 | 47 | socreate(Slirp *slirp) |
f0cbd3ec FB |
48 | { |
49 | struct socket *so; | |
5fafdf24 | 50 | |
f0cbd3ec FB |
51 | so = (struct socket *)malloc(sizeof(struct socket)); |
52 | if(so) { | |
53 | memset(so, 0, sizeof(struct socket)); | |
54 | so->so_state = SS_NOFDREF; | |
55 | so->s = -1; | |
460fec67 | 56 | so->slirp = slirp; |
7bd43ec2 | 57 | so->pollfds_idx = -1; |
f0cbd3ec FB |
58 | } |
59 | return(so); | |
60 | } | |
61 | ||
62 | /* | |
63 | * remque and free a socket, clobber cache | |
64 | */ | |
65 | void | |
511d2b14 | 66 | sofree(struct socket *so) |
f0cbd3ec | 67 | { |
460fec67 | 68 | Slirp *slirp = so->slirp; |
ea64d5f0 ST |
69 | struct mbuf *ifm; |
70 | ||
71 | for (ifm = (struct mbuf *) slirp->if_fastq.qh_link; | |
72 | (struct quehead *) ifm != &slirp->if_fastq; | |
73 | ifm = ifm->ifq_next) { | |
74 | if (ifm->ifq_so == so) { | |
75 | ifm->ifq_so = NULL; | |
76 | } | |
77 | } | |
78 | ||
79 | for (ifm = (struct mbuf *) slirp->if_batchq.qh_link; | |
80 | (struct quehead *) ifm != &slirp->if_batchq; | |
81 | ifm = ifm->ifq_next) { | |
82 | if (ifm->ifq_so == so) { | |
83 | ifm->ifq_so = NULL; | |
84 | } | |
85 | } | |
460fec67 | 86 | |
f0cbd3ec FB |
87 | if (so->so_emu==EMU_RSH && so->extra) { |
88 | sofree(so->extra); | |
89 | so->extra=NULL; | |
90 | } | |
460fec67 JK |
91 | if (so == slirp->tcp_last_so) { |
92 | slirp->tcp_last_so = &slirp->tcb; | |
93 | } else if (so == slirp->udp_last_so) { | |
94 | slirp->udp_last_so = &slirp->udb; | |
e6d43cfb JK |
95 | } else if (so == slirp->icmp_last_so) { |
96 | slirp->icmp_last_so = &slirp->icmp; | |
460fec67 | 97 | } |
f0cbd3ec | 98 | m_free(so->so_m); |
5fafdf24 TS |
99 | |
100 | if(so->so_next && so->so_prev) | |
f0cbd3ec FB |
101 | remque(so); /* crashes if so is not in a queue */ |
102 | ||
103 | free(so); | |
104 | } | |
105 | ||
e1c5a2b3 | 106 | size_t sopreprbuf(struct socket *so, struct iovec *iov, int *np) |
f0cbd3ec | 107 | { |
e1c5a2b3 | 108 | int n, lss, total; |
f0cbd3ec FB |
109 | struct sbuf *sb = &so->so_snd; |
110 | int len = sb->sb_datalen - sb->sb_cc; | |
f0cbd3ec | 111 | int mss = so->so_tcpcb->t_maxseg; |
5fafdf24 | 112 | |
e1c5a2b3 | 113 | DEBUG_CALL("sopreprbuf"); |
ecc804ca | 114 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 115 | |
e1c5a2b3 AL |
116 | if (len <= 0) |
117 | return 0; | |
118 | ||
f0cbd3ec | 119 | iov[0].iov_base = sb->sb_wptr; |
66029f6a BS |
120 | iov[1].iov_base = NULL; |
121 | iov[1].iov_len = 0; | |
f0cbd3ec FB |
122 | if (sb->sb_wptr < sb->sb_rptr) { |
123 | iov[0].iov_len = sb->sb_rptr - sb->sb_wptr; | |
124 | /* Should never succeed, but... */ | |
125 | if (iov[0].iov_len > len) | |
126 | iov[0].iov_len = len; | |
127 | if (iov[0].iov_len > mss) | |
128 | iov[0].iov_len -= iov[0].iov_len%mss; | |
129 | n = 1; | |
130 | } else { | |
131 | iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_wptr; | |
132 | /* Should never succeed, but... */ | |
133 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
134 | len -= iov[0].iov_len; | |
135 | if (len) { | |
136 | iov[1].iov_base = sb->sb_data; | |
137 | iov[1].iov_len = sb->sb_rptr - sb->sb_data; | |
138 | if(iov[1].iov_len > len) | |
139 | iov[1].iov_len = len; | |
140 | total = iov[0].iov_len + iov[1].iov_len; | |
141 | if (total > mss) { | |
142 | lss = total%mss; | |
143 | if (iov[1].iov_len > lss) { | |
144 | iov[1].iov_len -= lss; | |
145 | n = 2; | |
146 | } else { | |
147 | lss -= iov[1].iov_len; | |
148 | iov[0].iov_len -= lss; | |
149 | n = 1; | |
150 | } | |
151 | } else | |
152 | n = 2; | |
153 | } else { | |
154 | if (iov[0].iov_len > mss) | |
155 | iov[0].iov_len -= iov[0].iov_len%mss; | |
156 | n = 1; | |
157 | } | |
158 | } | |
e1c5a2b3 AL |
159 | if (np) |
160 | *np = n; | |
161 | ||
162 | return iov[0].iov_len + (n - 1) * iov[1].iov_len; | |
163 | } | |
164 | ||
165 | /* | |
166 | * Read from so's socket into sb_snd, updating all relevant sbuf fields | |
167 | * NOTE: This will only be called if it is select()ed for reading, so | |
168 | * a read() of 0 (or less) means it's disconnected | |
169 | */ | |
170 | int | |
511d2b14 | 171 | soread(struct socket *so) |
e1c5a2b3 AL |
172 | { |
173 | int n, nn; | |
174 | struct sbuf *sb = &so->so_snd; | |
175 | struct iovec iov[2]; | |
176 | ||
177 | DEBUG_CALL("soread"); | |
ecc804ca | 178 | DEBUG_ARG("so = %p", so); |
e1c5a2b3 AL |
179 | |
180 | /* | |
181 | * No need to check if there's enough room to read. | |
182 | * soread wouldn't have been called if there weren't | |
183 | */ | |
184 | sopreprbuf(so, iov, &n); | |
5fafdf24 | 185 | |
f0cbd3ec FB |
186 | #ifdef HAVE_READV |
187 | nn = readv(so->s, (struct iovec *)iov, n); | |
188 | DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn)); | |
189 | #else | |
00aa0040 | 190 | nn = qemu_recv(so->s, iov[0].iov_base, iov[0].iov_len,0); |
5fafdf24 | 191 | #endif |
f0cbd3ec FB |
192 | if (nn <= 0) { |
193 | if (nn < 0 && (errno == EINTR || errno == EAGAIN)) | |
194 | return 0; | |
195 | else { | |
27d92ebc EI |
196 | int err; |
197 | socklen_t slen = sizeof err; | |
198 | ||
199 | err = errno; | |
200 | if (nn == 0) { | |
201 | getsockopt(so->s, SOL_SOCKET, SO_ERROR, | |
202 | &err, &slen); | |
203 | } | |
204 | ||
f0cbd3ec FB |
205 | DEBUG_MISC((dfd, " --- soread() disconnected, nn = %d, errno = %d-%s\n", nn, errno,strerror(errno))); |
206 | sofcantrcvmore(so); | |
27d92ebc | 207 | |
6625d83a | 208 | if (err == ECONNRESET || err == ECONNREFUSED |
27d92ebc EI |
209 | || err == ENOTCONN || err == EPIPE) { |
210 | tcp_drop(sototcpcb(so), err); | |
211 | } else { | |
212 | tcp_sockclosed(sototcpcb(so)); | |
213 | } | |
f0cbd3ec FB |
214 | return -1; |
215 | } | |
216 | } | |
5fafdf24 | 217 | |
f0cbd3ec FB |
218 | #ifndef HAVE_READV |
219 | /* | |
220 | * If there was no error, try and read the second time round | |
221 | * We read again if n = 2 (ie, there's another part of the buffer) | |
222 | * and we read as much as we could in the first read | |
223 | * We don't test for <= 0 this time, because there legitimately | |
224 | * might not be any more data (since the socket is non-blocking), | |
225 | * a close will be detected on next iteration. | |
cb8d4c8f | 226 | * A return of -1 won't (shouldn't) happen, since it didn't happen above |
f0cbd3ec | 227 | */ |
17444c9c FB |
228 | if (n == 2 && nn == iov[0].iov_len) { |
229 | int ret; | |
00aa0040 | 230 | ret = qemu_recv(so->s, iov[1].iov_base, iov[1].iov_len,0); |
17444c9c FB |
231 | if (ret > 0) |
232 | nn += ret; | |
233 | } | |
5fafdf24 | 234 | |
f0cbd3ec FB |
235 | DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn)); |
236 | #endif | |
5fafdf24 | 237 | |
f0cbd3ec FB |
238 | /* Update fields */ |
239 | sb->sb_cc += nn; | |
240 | sb->sb_wptr += nn; | |
241 | if (sb->sb_wptr >= (sb->sb_data + sb->sb_datalen)) | |
242 | sb->sb_wptr -= sb->sb_datalen; | |
243 | return nn; | |
244 | } | |
5fafdf24 | 245 | |
e1c5a2b3 AL |
246 | int soreadbuf(struct socket *so, const char *buf, int size) |
247 | { | |
248 | int n, nn, copy = size; | |
249 | struct sbuf *sb = &so->so_snd; | |
250 | struct iovec iov[2]; | |
251 | ||
252 | DEBUG_CALL("soreadbuf"); | |
ecc804ca | 253 | DEBUG_ARG("so = %p", so); |
e1c5a2b3 AL |
254 | |
255 | /* | |
256 | * No need to check if there's enough room to read. | |
257 | * soread wouldn't have been called if there weren't | |
258 | */ | |
259 | if (sopreprbuf(so, iov, &n) < size) | |
260 | goto err; | |
261 | ||
262 | nn = MIN(iov[0].iov_len, copy); | |
263 | memcpy(iov[0].iov_base, buf, nn); | |
264 | ||
265 | copy -= nn; | |
266 | buf += nn; | |
267 | ||
268 | if (copy == 0) | |
269 | goto done; | |
270 | ||
271 | memcpy(iov[1].iov_base, buf, copy); | |
272 | ||
273 | done: | |
274 | /* Update fields */ | |
275 | sb->sb_cc += size; | |
276 | sb->sb_wptr += size; | |
277 | if (sb->sb_wptr >= (sb->sb_data + sb->sb_datalen)) | |
278 | sb->sb_wptr -= sb->sb_datalen; | |
279 | return size; | |
280 | err: | |
281 | ||
282 | sofcantrcvmore(so); | |
283 | tcp_sockclosed(sototcpcb(so)); | |
284 | fprintf(stderr, "soreadbuf buffer to small"); | |
285 | return -1; | |
286 | } | |
287 | ||
f0cbd3ec FB |
288 | /* |
289 | * Get urgent data | |
5fafdf24 | 290 | * |
f0cbd3ec FB |
291 | * When the socket is created, we set it SO_OOBINLINE, |
292 | * so when OOB data arrives, we soread() it and everything | |
293 | * in the send buffer is sent as urgent data | |
294 | */ | |
bfb1ac14 | 295 | int |
511d2b14 | 296 | sorecvoob(struct socket *so) |
f0cbd3ec FB |
297 | { |
298 | struct tcpcb *tp = sototcpcb(so); | |
bfb1ac14 | 299 | int ret; |
f0cbd3ec FB |
300 | |
301 | DEBUG_CALL("sorecvoob"); | |
ecc804ca | 302 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 303 | |
f0cbd3ec FB |
304 | /* |
305 | * We take a guess at how much urgent data has arrived. | |
306 | * In most situations, when urgent data arrives, the next | |
307 | * read() should get all the urgent data. This guess will | |
308 | * be wrong however if more data arrives just after the | |
5fafdf24 | 309 | * urgent data, or the read() doesn't return all the |
f0cbd3ec FB |
310 | * urgent data. |
311 | */ | |
bfb1ac14 SL |
312 | ret = soread(so); |
313 | if (ret > 0) { | |
314 | tp->snd_up = tp->snd_una + so->so_snd.sb_cc; | |
315 | tp->t_force = 1; | |
316 | tcp_output(tp); | |
317 | tp->t_force = 0; | |
318 | } | |
319 | ||
320 | return ret; | |
f0cbd3ec FB |
321 | } |
322 | ||
323 | /* | |
324 | * Send urgent data | |
325 | * There's a lot duplicated code here, but... | |
326 | */ | |
327 | int | |
511d2b14 | 328 | sosendoob(struct socket *so) |
f0cbd3ec FB |
329 | { |
330 | struct sbuf *sb = &so->so_rcv; | |
331 | char buff[2048]; /* XXX Shouldn't be sending more oob data than this */ | |
5fafdf24 | 332 | |
f0cbd3ec | 333 | int n, len; |
5fafdf24 | 334 | |
f0cbd3ec | 335 | DEBUG_CALL("sosendoob"); |
ecc804ca | 336 | DEBUG_ARG("so = %p", so); |
f0cbd3ec | 337 | DEBUG_ARG("sb->sb_cc = %d", sb->sb_cc); |
5fafdf24 | 338 | |
f0cbd3ec FB |
339 | if (so->so_urgc > 2048) |
340 | so->so_urgc = 2048; /* XXXX */ | |
5fafdf24 | 341 | |
f0cbd3ec FB |
342 | if (sb->sb_rptr < sb->sb_wptr) { |
343 | /* We can send it directly */ | |
e1c5a2b3 | 344 | n = slirp_send(so, sb->sb_rptr, so->so_urgc, (MSG_OOB)); /* |MSG_DONTWAIT)); */ |
f0cbd3ec | 345 | so->so_urgc -= n; |
3b46e624 | 346 | |
f0cbd3ec FB |
347 | DEBUG_MISC((dfd, " --- sent %d bytes urgent data, %d urgent bytes left\n", n, so->so_urgc)); |
348 | } else { | |
5fafdf24 | 349 | /* |
f0cbd3ec FB |
350 | * Since there's no sendv or sendtov like writev, |
351 | * we must copy all data to a linear buffer then | |
352 | * send it all | |
353 | */ | |
354 | len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr; | |
355 | if (len > so->so_urgc) len = so->so_urgc; | |
356 | memcpy(buff, sb->sb_rptr, len); | |
357 | so->so_urgc -= len; | |
358 | if (so->so_urgc) { | |
359 | n = sb->sb_wptr - sb->sb_data; | |
360 | if (n > so->so_urgc) n = so->so_urgc; | |
361 | memcpy((buff + len), sb->sb_data, n); | |
362 | so->so_urgc -= n; | |
363 | len += n; | |
364 | } | |
e1c5a2b3 | 365 | n = slirp_send(so, buff, len, (MSG_OOB)); /* |MSG_DONTWAIT)); */ |
f0cbd3ec FB |
366 | #ifdef DEBUG |
367 | if (n != len) | |
368 | DEBUG_ERROR((dfd, "Didn't send all data urgently XXXXX\n")); | |
3b46e624 | 369 | #endif |
f0cbd3ec FB |
370 | DEBUG_MISC((dfd, " ---2 sent %d bytes urgent data, %d urgent bytes left\n", n, so->so_urgc)); |
371 | } | |
5fafdf24 | 372 | |
f0cbd3ec FB |
373 | sb->sb_cc -= n; |
374 | sb->sb_rptr += n; | |
375 | if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen)) | |
376 | sb->sb_rptr -= sb->sb_datalen; | |
5fafdf24 | 377 | |
f0cbd3ec FB |
378 | return n; |
379 | } | |
380 | ||
381 | /* | |
5fafdf24 | 382 | * Write data from so_rcv to so's socket, |
f0cbd3ec FB |
383 | * updating all sbuf field as necessary |
384 | */ | |
385 | int | |
511d2b14 | 386 | sowrite(struct socket *so) |
f0cbd3ec FB |
387 | { |
388 | int n,nn; | |
389 | struct sbuf *sb = &so->so_rcv; | |
390 | int len = sb->sb_cc; | |
391 | struct iovec iov[2]; | |
5fafdf24 | 392 | |
f0cbd3ec | 393 | DEBUG_CALL("sowrite"); |
ecc804ca | 394 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 395 | |
f0cbd3ec FB |
396 | if (so->so_urgc) { |
397 | sosendoob(so); | |
398 | if (sb->sb_cc == 0) | |
399 | return 0; | |
400 | } | |
401 | ||
402 | /* | |
403 | * No need to check if there's something to write, | |
404 | * sowrite wouldn't have been called otherwise | |
405 | */ | |
5fafdf24 | 406 | |
f0cbd3ec | 407 | iov[0].iov_base = sb->sb_rptr; |
66029f6a BS |
408 | iov[1].iov_base = NULL; |
409 | iov[1].iov_len = 0; | |
f0cbd3ec FB |
410 | if (sb->sb_rptr < sb->sb_wptr) { |
411 | iov[0].iov_len = sb->sb_wptr - sb->sb_rptr; | |
412 | /* Should never succeed, but... */ | |
413 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
414 | n = 1; | |
415 | } else { | |
416 | iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr; | |
417 | if (iov[0].iov_len > len) iov[0].iov_len = len; | |
418 | len -= iov[0].iov_len; | |
419 | if (len) { | |
420 | iov[1].iov_base = sb->sb_data; | |
421 | iov[1].iov_len = sb->sb_wptr - sb->sb_data; | |
422 | if (iov[1].iov_len > len) iov[1].iov_len = len; | |
423 | n = 2; | |
424 | } else | |
425 | n = 1; | |
426 | } | |
427 | /* Check if there's urgent data to send, and if so, send it */ | |
428 | ||
429 | #ifdef HAVE_READV | |
430 | nn = writev(so->s, (const struct iovec *)iov, n); | |
5fafdf24 | 431 | |
f0cbd3ec FB |
432 | DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn)); |
433 | #else | |
e1c5a2b3 | 434 | nn = slirp_send(so, iov[0].iov_base, iov[0].iov_len,0); |
f0cbd3ec FB |
435 | #endif |
436 | /* This should never happen, but people tell me it does *shrug* */ | |
437 | if (nn < 0 && (errno == EAGAIN || errno == EINTR)) | |
438 | return 0; | |
5fafdf24 | 439 | |
f0cbd3ec FB |
440 | if (nn <= 0) { |
441 | DEBUG_MISC((dfd, " --- sowrite disconnected, so->so_state = %x, errno = %d\n", | |
442 | so->so_state, errno)); | |
443 | sofcantsendmore(so); | |
444 | tcp_sockclosed(sototcpcb(so)); | |
445 | return -1; | |
446 | } | |
5fafdf24 | 447 | |
f0cbd3ec | 448 | #ifndef HAVE_READV |
3bc2175d FB |
449 | if (n == 2 && nn == iov[0].iov_len) { |
450 | int ret; | |
e1c5a2b3 | 451 | ret = slirp_send(so, iov[1].iov_base, iov[1].iov_len,0); |
3bc2175d FB |
452 | if (ret > 0) |
453 | nn += ret; | |
454 | } | |
f0cbd3ec FB |
455 | DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn)); |
456 | #endif | |
5fafdf24 | 457 | |
f0cbd3ec FB |
458 | /* Update sbuf */ |
459 | sb->sb_cc -= nn; | |
460 | sb->sb_rptr += nn; | |
461 | if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen)) | |
462 | sb->sb_rptr -= sb->sb_datalen; | |
5fafdf24 | 463 | |
f0cbd3ec FB |
464 | /* |
465 | * If in DRAIN mode, and there's no more data, set | |
466 | * it CANTSENDMORE | |
467 | */ | |
468 | if ((so->so_state & SS_FWDRAIN) && sb->sb_cc == 0) | |
469 | sofcantsendmore(so); | |
5fafdf24 | 470 | |
f0cbd3ec FB |
471 | return nn; |
472 | } | |
473 | ||
474 | /* | |
475 | * recvfrom() a UDP socket | |
476 | */ | |
477 | void | |
511d2b14 | 478 | sorecvfrom(struct socket *so) |
f0cbd3ec | 479 | { |
eae303ff | 480 | struct sockaddr_storage addr; |
5379229a | 481 | struct sockaddr_storage saddr, daddr; |
eae303ff | 482 | socklen_t addrlen = sizeof(struct sockaddr_storage); |
5fafdf24 | 483 | |
f0cbd3ec | 484 | DEBUG_CALL("sorecvfrom"); |
ecc804ca | 485 | DEBUG_ARG("so = %p", so); |
5fafdf24 | 486 | |
f0cbd3ec FB |
487 | if (so->so_type == IPPROTO_ICMP) { /* This is a "ping" reply */ |
488 | char buff[256]; | |
489 | int len; | |
3b46e624 | 490 | |
5fafdf24 | 491 | len = recvfrom(so->s, buff, 256, 0, |
f0cbd3ec FB |
492 | (struct sockaddr *)&addr, &addrlen); |
493 | /* XXX Check if reply is "correct"? */ | |
3b46e624 | 494 | |
f0cbd3ec FB |
495 | if(len == -1 || len == 0) { |
496 | u_char code=ICMP_UNREACH_PORT; | |
497 | ||
498 | if(errno == EHOSTUNREACH) code=ICMP_UNREACH_HOST; | |
499 | else if(errno == ENETUNREACH) code=ICMP_UNREACH_NET; | |
3b46e624 | 500 | |
f0cbd3ec FB |
501 | DEBUG_MISC((dfd," udp icmp rx errno = %d-%s\n", |
502 | errno,strerror(errno))); | |
de40abfe | 503 | icmp_send_error(so->so_m, ICMP_UNREACH, code, 0, strerror(errno)); |
f0cbd3ec FB |
504 | } else { |
505 | icmp_reflect(so->so_m); | |
511d2b14 | 506 | so->so_m = NULL; /* Don't m_free() it again! */ |
f0cbd3ec FB |
507 | } |
508 | /* No need for this socket anymore, udp_detach it */ | |
509 | udp_detach(so); | |
510 | } else { /* A "normal" UDP packet */ | |
511 | struct mbuf *m; | |
c5b76b38 BS |
512 | int len; |
513 | #ifdef _WIN32 | |
514 | unsigned long n; | |
515 | #else | |
516 | int n; | |
517 | #endif | |
f0cbd3ec | 518 | |
460fec67 JK |
519 | m = m_get(so->slirp); |
520 | if (!m) { | |
521 | return; | |
522 | } | |
98c63057 GS |
523 | switch (so->so_ffamily) { |
524 | case AF_INET: | |
525 | m->m_data += IF_MAXLINKHDR + sizeof(struct udpiphdr); | |
526 | break; | |
527 | case AF_INET6: | |
528 | m->m_data += IF_MAXLINKHDR + sizeof(struct ip6) | |
529 | + sizeof(struct udphdr); | |
530 | break; | |
531 | default: | |
532 | g_assert_not_reached(); | |
533 | break; | |
534 | } | |
3b46e624 | 535 | |
5fafdf24 | 536 | /* |
f0cbd3ec FB |
537 | * XXX Shouldn't FIONREAD packets destined for port 53, |
538 | * but I don't know the max packet size for DNS lookups | |
539 | */ | |
540 | len = M_FREEROOM(m); | |
541 | /* if (so->so_fport != htons(53)) { */ | |
379ff53d | 542 | ioctlsocket(so->s, FIONREAD, &n); |
3b46e624 | 543 | |
f0cbd3ec FB |
544 | if (n > len) { |
545 | n = (m->m_data - m->m_dat) + m->m_len + n + 1; | |
546 | m_inc(m, n); | |
547 | len = M_FREEROOM(m); | |
548 | } | |
549 | /* } */ | |
3b46e624 | 550 | |
f0cbd3ec FB |
551 | m->m_len = recvfrom(so->s, m->m_data, len, 0, |
552 | (struct sockaddr *)&addr, &addrlen); | |
5fafdf24 | 553 | DEBUG_MISC((dfd, " did recvfrom %d, errno = %d-%s\n", |
f0cbd3ec FB |
554 | m->m_len, errno,strerror(errno))); |
555 | if(m->m_len<0) { | |
15d62af4 GS |
556 | /* Report error as ICMP */ |
557 | switch (so->so_lfamily) { | |
558 | uint8_t code; | |
559 | case AF_INET: | |
560 | code = ICMP_UNREACH_PORT; | |
561 | ||
562 | if (errno == EHOSTUNREACH) { | |
563 | code = ICMP_UNREACH_HOST; | |
564 | } else if (errno == ENETUNREACH) { | |
565 | code = ICMP_UNREACH_NET; | |
566 | } | |
567 | ||
568 | DEBUG_MISC((dfd, " rx error, tx icmp ICMP_UNREACH:%i\n", code)); | |
569 | icmp_send_error(so->so_m, ICMP_UNREACH, code, 0, strerror(errno)); | |
570 | break; | |
571 | case AF_INET6: | |
572 | code = ICMP6_UNREACH_PORT; | |
573 | ||
574 | if (errno == EHOSTUNREACH) { | |
575 | code = ICMP6_UNREACH_ADDRESS; | |
576 | } else if (errno == ENETUNREACH) { | |
577 | code = ICMP6_UNREACH_NO_ROUTE; | |
578 | } | |
579 | ||
580 | DEBUG_MISC((dfd, " rx error, tx icmp6 ICMP_UNREACH:%i\n", code)); | |
581 | icmp6_send_error(so->so_m, ICMP6_UNREACH, code); | |
582 | break; | |
583 | default: | |
584 | g_assert_not_reached(); | |
585 | break; | |
586 | } | |
f0cbd3ec FB |
587 | m_free(m); |
588 | } else { | |
589 | /* | |
590 | * Hack: domain name lookup will be used the most for UDP, | |
591 | * and since they'll only be used once there's no need | |
592 | * for the 4 minute (or whatever) timeout... So we time them | |
593 | * out much quicker (10 seconds for now...) | |
594 | */ | |
595 | if (so->so_expire) { | |
596 | if (so->so_fport == htons(53)) | |
597 | so->so_expire = curtime + SO_EXPIREFAST; | |
598 | else | |
599 | so->so_expire = curtime + SO_EXPIRE; | |
600 | } | |
601 | ||
5fafdf24 | 602 | /* |
f0cbd3ec | 603 | * If this packet was destined for CTL_ADDR, |
5379229a | 604 | * make it look like that's where it came from |
f0cbd3ec | 605 | */ |
5379229a GS |
606 | saddr = addr; |
607 | sotranslate_in(so, &saddr); | |
608 | daddr = so->lhost.ss; | |
609 | ||
eae303ff GS |
610 | switch (so->so_ffamily) { |
611 | case AF_INET: | |
5379229a GS |
612 | udp_output(so, m, (struct sockaddr_in *) &saddr, |
613 | (struct sockaddr_in *) &daddr, | |
614 | so->so_iptos); | |
eae303ff | 615 | break; |
15d62af4 GS |
616 | case AF_INET6: |
617 | udp6_output(so, m, (struct sockaddr_in6 *) &saddr, | |
618 | (struct sockaddr_in6 *) &daddr); | |
619 | break; | |
eae303ff | 620 | default: |
15d62af4 | 621 | g_assert_not_reached(); |
eae303ff GS |
622 | break; |
623 | } | |
f0cbd3ec FB |
624 | } /* rx error */ |
625 | } /* if ping packet */ | |
626 | } | |
627 | ||
628 | /* | |
629 | * sendto() a socket | |
630 | */ | |
631 | int | |
511d2b14 | 632 | sosendto(struct socket *so, struct mbuf *m) |
f0cbd3ec FB |
633 | { |
634 | int ret; | |
5379229a | 635 | struct sockaddr_storage addr; |
f0cbd3ec FB |
636 | |
637 | DEBUG_CALL("sosendto"); | |
ecc804ca SW |
638 | DEBUG_ARG("so = %p", so); |
639 | DEBUG_ARG("m = %p", m); | |
5fafdf24 | 640 | |
5379229a GS |
641 | addr = so->fhost.ss; |
642 | DEBUG_CALL(" sendto()ing)"); | |
643 | sotranslate_out(so, &addr); | |
5fafdf24 | 644 | |
f0cbd3ec FB |
645 | /* Don't care what port we get */ |
646 | ret = sendto(so->s, m->m_data, m->m_len, 0, | |
0d48dfed | 647 | (struct sockaddr *)&addr, sockaddr_size(&addr)); |
f0cbd3ec FB |
648 | if (ret < 0) |
649 | return -1; | |
5fafdf24 | 650 | |
f0cbd3ec FB |
651 | /* |
652 | * Kill the socket if there's no reply in 4 minutes, | |
653 | * but only if it's an expirable socket | |
654 | */ | |
655 | if (so->so_expire) | |
656 | so->so_expire = curtime + SO_EXPIRE; | |
f932b6ce JK |
657 | so->so_state &= SS_PERSISTENT_MASK; |
658 | so->so_state |= SS_ISFCONNECTED; /* So that it gets select()ed */ | |
f0cbd3ec FB |
659 | return 0; |
660 | } | |
661 | ||
662 | /* | |
3c6a0580 | 663 | * Listen for incoming TCP connections |
f0cbd3ec FB |
664 | */ |
665 | struct socket * | |
b6dce92e | 666 | tcp_listen(Slirp *slirp, uint32_t haddr, u_int hport, uint32_t laddr, |
460fec67 | 667 | u_int lport, int flags) |
f0cbd3ec FB |
668 | { |
669 | struct sockaddr_in addr; | |
670 | struct socket *so; | |
242acf3a AZ |
671 | int s, opt = 1; |
672 | socklen_t addrlen = sizeof(addr); | |
ab07b980 | 673 | memset(&addr, 0, addrlen); |
f0cbd3ec | 674 | |
3c6a0580 | 675 | DEBUG_CALL("tcp_listen"); |
9f349498 JK |
676 | DEBUG_ARG("haddr = %x", haddr); |
677 | DEBUG_ARG("hport = %d", hport); | |
f0cbd3ec FB |
678 | DEBUG_ARG("laddr = %x", laddr); |
679 | DEBUG_ARG("lport = %d", lport); | |
680 | DEBUG_ARG("flags = %x", flags); | |
5fafdf24 | 681 | |
460fec67 JK |
682 | so = socreate(slirp); |
683 | if (!so) { | |
f0cbd3ec FB |
684 | return NULL; |
685 | } | |
5fafdf24 | 686 | |
f0cbd3ec FB |
687 | /* Don't tcp_attach... we don't need so_snd nor so_rcv */ |
688 | if ((so->so_tcpcb = tcp_newtcpcb(so)) == NULL) { | |
689 | free(so); | |
690 | return NULL; | |
691 | } | |
460fec67 | 692 | insque(so, &slirp->tcb); |
5fafdf24 TS |
693 | |
694 | /* | |
f0cbd3ec FB |
695 | * SS_FACCEPTONCE sockets must time out. |
696 | */ | |
697 | if (flags & SS_FACCEPTONCE) | |
698 | so->so_tcpcb->t_timer[TCPT_KEEP] = TCPTV_KEEP_INIT*2; | |
5fafdf24 | 699 | |
f932b6ce JK |
700 | so->so_state &= SS_PERSISTENT_MASK; |
701 | so->so_state |= (SS_FACCEPTCONN | flags); | |
eae303ff | 702 | so->so_lfamily = AF_INET; |
f0cbd3ec FB |
703 | so->so_lport = lport; /* Kept in network format */ |
704 | so->so_laddr.s_addr = laddr; /* Ditto */ | |
5fafdf24 | 705 | |
f0cbd3ec | 706 | addr.sin_family = AF_INET; |
3c6a0580 JK |
707 | addr.sin_addr.s_addr = haddr; |
708 | addr.sin_port = hport; | |
5fafdf24 | 709 | |
40ff6d7e | 710 | if (((s = qemu_socket(AF_INET,SOCK_STREAM,0)) < 0) || |
aad1239a | 711 | (socket_set_fast_reuse(s) < 0) || |
f0cbd3ec FB |
712 | (bind(s,(struct sockaddr *)&addr, sizeof(addr)) < 0) || |
713 | (listen(s,1) < 0)) { | |
714 | int tmperrno = errno; /* Don't clobber the real reason we failed */ | |
3b46e624 | 715 | |
f0cbd3ec FB |
716 | close(s); |
717 | sofree(so); | |
718 | /* Restore the real errno */ | |
02d2c54c FB |
719 | #ifdef _WIN32 |
720 | WSASetLastError(tmperrno); | |
721 | #else | |
f0cbd3ec | 722 | errno = tmperrno; |
02d2c54c | 723 | #endif |
f0cbd3ec FB |
724 | return NULL; |
725 | } | |
9957fc7f | 726 | qemu_setsockopt(s, SOL_SOCKET, SO_OOBINLINE, &opt, sizeof(int)); |
5fafdf24 | 727 | |
f0cbd3ec | 728 | getsockname(s,(struct sockaddr *)&addr,&addrlen); |
eae303ff | 729 | so->so_ffamily = AF_INET; |
f0cbd3ec FB |
730 | so->so_fport = addr.sin_port; |
731 | if (addr.sin_addr.s_addr == 0 || addr.sin_addr.s_addr == loopback_addr.s_addr) | |
460fec67 | 732 | so->so_faddr = slirp->vhost_addr; |
f0cbd3ec FB |
733 | else |
734 | so->so_faddr = addr.sin_addr; | |
735 | ||
736 | so->s = s; | |
737 | return so; | |
738 | } | |
739 | ||
f0cbd3ec FB |
740 | /* |
741 | * Various session state calls | |
742 | * XXX Should be #define's | |
743 | * The socket state stuff needs work, these often get call 2 or 3 | |
744 | * times each when only 1 was needed | |
745 | */ | |
746 | void | |
511d2b14 | 747 | soisfconnecting(struct socket *so) |
f0cbd3ec FB |
748 | { |
749 | so->so_state &= ~(SS_NOFDREF|SS_ISFCONNECTED|SS_FCANTRCVMORE| | |
750 | SS_FCANTSENDMORE|SS_FWDRAIN); | |
751 | so->so_state |= SS_ISFCONNECTING; /* Clobber other states */ | |
752 | } | |
753 | ||
754 | void | |
511d2b14 | 755 | soisfconnected(struct socket *so) |
f0cbd3ec FB |
756 | { |
757 | so->so_state &= ~(SS_ISFCONNECTING|SS_FWDRAIN|SS_NOFDREF); | |
758 | so->so_state |= SS_ISFCONNECTED; /* Clobber other states */ | |
759 | } | |
760 | ||
9634d903 BS |
761 | static void |
762 | sofcantrcvmore(struct socket *so) | |
f0cbd3ec FB |
763 | { |
764 | if ((so->so_state & SS_NOFDREF) == 0) { | |
765 | shutdown(so->s,0); | |
f0cbd3ec FB |
766 | } |
767 | so->so_state &= ~(SS_ISFCONNECTING); | |
f932b6ce JK |
768 | if (so->so_state & SS_FCANTSENDMORE) { |
769 | so->so_state &= SS_PERSISTENT_MASK; | |
770 | so->so_state |= SS_NOFDREF; /* Don't select it */ | |
771 | } else { | |
f0cbd3ec | 772 | so->so_state |= SS_FCANTRCVMORE; |
f932b6ce | 773 | } |
f0cbd3ec FB |
774 | } |
775 | ||
9634d903 BS |
776 | static void |
777 | sofcantsendmore(struct socket *so) | |
f0cbd3ec FB |
778 | { |
779 | if ((so->so_state & SS_NOFDREF) == 0) { | |
02d2c54c | 780 | shutdown(so->s,1); /* send FIN to fhost */ |
f0cbd3ec FB |
781 | } |
782 | so->so_state &= ~(SS_ISFCONNECTING); | |
f932b6ce JK |
783 | if (so->so_state & SS_FCANTRCVMORE) { |
784 | so->so_state &= SS_PERSISTENT_MASK; | |
785 | so->so_state |= SS_NOFDREF; /* as above */ | |
786 | } else { | |
f0cbd3ec | 787 | so->so_state |= SS_FCANTSENDMORE; |
f932b6ce | 788 | } |
f0cbd3ec FB |
789 | } |
790 | ||
f0cbd3ec FB |
791 | /* |
792 | * Set write drain mode | |
793 | * Set CANTSENDMORE once all data has been write()n | |
794 | */ | |
795 | void | |
511d2b14 | 796 | sofwdrain(struct socket *so) |
f0cbd3ec FB |
797 | { |
798 | if (so->so_rcv.sb_cc) | |
799 | so->so_state |= SS_FWDRAIN; | |
800 | else | |
801 | sofcantsendmore(so); | |
802 | } | |
5379229a GS |
803 | |
804 | /* | |
805 | * Translate addr in host addr when it is a virtual address | |
806 | */ | |
807 | void sotranslate_out(struct socket *so, struct sockaddr_storage *addr) | |
808 | { | |
809 | Slirp *slirp = so->slirp; | |
810 | struct sockaddr_in *sin = (struct sockaddr_in *)addr; | |
05061d85 | 811 | struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr; |
5379229a GS |
812 | |
813 | switch (addr->ss_family) { | |
814 | case AF_INET: | |
815 | if ((so->so_faddr.s_addr & slirp->vnetwork_mask.s_addr) == | |
816 | slirp->vnetwork_addr.s_addr) { | |
817 | /* It's an alias */ | |
818 | if (so->so_faddr.s_addr == slirp->vnameserver_addr.s_addr) { | |
819 | if (get_dns_addr(&sin->sin_addr) < 0) { | |
820 | sin->sin_addr = loopback_addr; | |
821 | } | |
822 | } else { | |
823 | sin->sin_addr = loopback_addr; | |
824 | } | |
825 | } | |
826 | ||
827 | DEBUG_MISC((dfd, " addr.sin_port=%d, " | |
828 | "addr.sin_addr.s_addr=%.16s\n", | |
829 | ntohs(sin->sin_port), inet_ntoa(sin->sin_addr))); | |
830 | break; | |
831 | ||
05061d85 GS |
832 | case AF_INET6: |
833 | if (in6_equal_net(&so->so_faddr6, &slirp->vprefix_addr6, | |
834 | slirp->vprefix_len)) { | |
835 | if (in6_equal(&so->so_faddr6, &slirp->vnameserver_addr6)) { | |
ef763fa4 ST |
836 | uint32_t scope_id; |
837 | if (get_dns6_addr(&sin6->sin6_addr, &scope_id) >= 0) { | |
838 | sin6->sin6_scope_id = scope_id; | |
839 | } else { | |
05061d85 | 840 | sin6->sin6_addr = in6addr_loopback; |
1d17654e | 841 | } |
05061d85 GS |
842 | } else { |
843 | sin6->sin6_addr = in6addr_loopback; | |
844 | } | |
845 | } | |
846 | break; | |
847 | ||
5379229a GS |
848 | default: |
849 | break; | |
850 | } | |
851 | } | |
852 | ||
853 | void sotranslate_in(struct socket *so, struct sockaddr_storage *addr) | |
854 | { | |
855 | Slirp *slirp = so->slirp; | |
856 | struct sockaddr_in *sin = (struct sockaddr_in *)addr; | |
05061d85 | 857 | struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)addr; |
5379229a GS |
858 | |
859 | switch (addr->ss_family) { | |
860 | case AF_INET: | |
861 | if ((so->so_faddr.s_addr & slirp->vnetwork_mask.s_addr) == | |
862 | slirp->vnetwork_addr.s_addr) { | |
863 | uint32_t inv_mask = ~slirp->vnetwork_mask.s_addr; | |
864 | ||
865 | if ((so->so_faddr.s_addr & inv_mask) == inv_mask) { | |
866 | sin->sin_addr = slirp->vhost_addr; | |
867 | } else if (sin->sin_addr.s_addr == loopback_addr.s_addr || | |
868 | so->so_faddr.s_addr != slirp->vhost_addr.s_addr) { | |
869 | sin->sin_addr = so->so_faddr; | |
870 | } | |
871 | } | |
872 | break; | |
873 | ||
05061d85 GS |
874 | case AF_INET6: |
875 | if (in6_equal_net(&so->so_faddr6, &slirp->vprefix_addr6, | |
876 | slirp->vprefix_len)) { | |
877 | if (in6_equal(&sin6->sin6_addr, &in6addr_loopback) | |
878 | || !in6_equal(&so->so_faddr6, &slirp->vhost_addr6)) { | |
879 | sin6->sin6_addr = so->so_faddr6; | |
880 | } | |
881 | } | |
882 | break; | |
883 | ||
5379229a GS |
884 | default: |
885 | break; | |
886 | } | |
887 | } | |
888 | ||
889 | /* | |
890 | * Translate connections from localhost to the real hostname | |
891 | */ | |
892 | void sotranslate_accept(struct socket *so) | |
893 | { | |
894 | Slirp *slirp = so->slirp; | |
895 | ||
896 | switch (so->so_ffamily) { | |
897 | case AF_INET: | |
898 | if (so->so_faddr.s_addr == INADDR_ANY || | |
899 | (so->so_faddr.s_addr & loopback_mask) == | |
900 | (loopback_addr.s_addr & loopback_mask)) { | |
901 | so->so_faddr = slirp->vhost_addr; | |
902 | } | |
903 | break; | |
904 | ||
05061d85 GS |
905 | case AF_INET6: |
906 | if (in6_equal(&so->so_faddr6, &in6addr_any) || | |
907 | in6_equal(&so->so_faddr6, &in6addr_loopback)) { | |
908 | so->so_faddr6 = slirp->vhost_addr6; | |
909 | } | |
910 | break; | |
911 | ||
5379229a GS |
912 | default: |
913 | break; | |
914 | } | |
915 | } |