VirtualBox

source: vbox/trunk/src/VBox/Devices/Network/slirp/socket.c@ 15355

最後變更 在這個檔案從15355是 15355,由 vboxsync 提交於 16 年 前

slirp:icmp: enabling UDP traceroute on Unix

  • 屬性 svn:eol-style 設為 native
檔案大小: 27.2 KB
 
1/*
2 * Copyright (c) 1995 Danny Gasparovski.
3 *
4 * Please read the file COPYRIGHT for the
5 * terms and conditions of the copyright.
6 */
7
8#define WANT_SYS_IOCTL_H
9#include <slirp.h>
10#include "ip_icmp.h"
11#include "main.h"
12#ifdef __sun__
13#include <sys/filio.h>
14#endif
15#if defined(VBOX_WITH_SLIRP_ICMP) && defined (RT_OS_WINDOWS)
16#include <iphlpapi.h>
17#include <icmpapi.h>
18#endif
19
20#ifdef VBOX_WITH_SLIRP_ICMP
21static void send_icmp_to_guest(PNATState, char *, size_t, struct socket *, const struct sockaddr_in *);
22static void sorecvfrom_icmp_win(PNATState, struct socket *);
23#endif
24static void sorecvfrom_icmp_unix(PNATState, struct socket *);
25
/*
 * Socket-layer initialisation hook.  Nothing needs setting up at present.
 */
void
so_init()
{
    return;
}
30
31
32struct socket *
33solookup(struct socket *head, struct in_addr laddr,
34 u_int lport, struct in_addr faddr, u_int fport)
35{
36 struct socket *so;
37
38 for (so = head->so_next; so != head; so = so->so_next)
39 {
40 if ( so->so_lport == lport
41 && so->so_laddr.s_addr == laddr.s_addr
42 && so->so_faddr.s_addr == faddr.s_addr
43 && so->so_fport == fport)
44 return so;
45 }
46
47 return (struct socket *)NULL;
48}
49
50/*
51 * Create a new socket, initialise the fields
52 * It is the responsibility of the caller to
53 * insque() it into the correct linked-list
54 */
55struct socket *
56socreate()
57{
58 struct socket *so;
59
60 so = (struct socket *)malloc(sizeof(struct socket));
61 if(so)
62 {
63 memset(so, 0, sizeof(struct socket));
64 so->so_state = SS_NOFDREF;
65 so->s = -1;
66 }
67 return so;
68}
69
70/*
71 * remque and free a socket, clobber cache
72 */
73void
74sofree(PNATState pData, struct socket *so)
75{
76 if (so == tcp_last_so)
77 tcp_last_so = &tcb;
78 else if (so == udp_last_so)
79 udp_last_so = &udb;
80
81 m_free(pData, so->so_m);
82
83 if(so->so_next && so->so_prev)
84 remque(pData, so); /* crashes if so is not in a queue */
85
86 free(so);
87}
88
89/*
90 * Read from so's socket into sb_snd, updating all relevant sbuf fields
91 * NOTE: This will only be called if it is select()ed for reading, so
92 * a read() of 0 (or less) means it's disconnected
93 */
94int
95soread(PNATState pData, struct socket *so, int fCloseIfNothingRead)
96{
97 int n, nn, lss, total;
98 struct sbuf *sb = &so->so_snd;
99 size_t len = sb->sb_datalen - sb->sb_cc;
100 struct iovec iov[2];
101 int mss = so->so_tcpcb->t_maxseg;
102
103 DEBUG_CALL("soread");
104 DEBUG_ARG("so = %lx", (long )so);
105
106 /*
107 * No need to check if there's enough room to read.
108 * soread wouldn't have been called if there weren't
109 */
110
111 len = sb->sb_datalen - sb->sb_cc;
112
113 iov[0].iov_base = sb->sb_wptr;
114 iov[1].iov_base = 0;
115 iov[1].iov_len = 0;
116 if (sb->sb_wptr < sb->sb_rptr)
117 {
118 iov[0].iov_len = sb->sb_rptr - sb->sb_wptr;
119 /* Should never succeed, but... */
120 if (iov[0].iov_len > len)
121 iov[0].iov_len = len;
122 if (iov[0].iov_len > mss)
123 iov[0].iov_len -= iov[0].iov_len%mss;
124 n = 1;
125 }
126 else
127 {
128 iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_wptr;
129 /* Should never succeed, but... */
130 if (iov[0].iov_len > len)
131 iov[0].iov_len = len;
132 len -= iov[0].iov_len;
133 if (len)
134 {
135 iov[1].iov_base = sb->sb_data;
136 iov[1].iov_len = sb->sb_rptr - sb->sb_data;
137 if(iov[1].iov_len > len)
138 iov[1].iov_len = len;
139 total = iov[0].iov_len + iov[1].iov_len;
140 if (total > mss)
141 {
142 lss = total % mss;
143 if (iov[1].iov_len > lss)
144 {
145 iov[1].iov_len -= lss;
146 n = 2;
147 }
148 else
149 {
150 lss -= iov[1].iov_len;
151 iov[0].iov_len -= lss;
152 n = 1;
153 }
154 }
155 else
156 n = 2;
157 }
158 else
159 {
160 if (iov[0].iov_len > mss)
161 iov[0].iov_len -= iov[0].iov_len%mss;
162 n = 1;
163 }
164 }
165
166#ifdef HAVE_READV
167 nn = readv(so->s, (struct iovec *)iov, n);
168 DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn));
169#else
170 nn = recv(so->s, iov[0].iov_base, iov[0].iov_len,0);
171#endif
172 if (nn <= 0)
173 {
174#if defined(VBOX_WITH_SIMPLIFIED_SLIRP_SYNC) && defined(RT_OS_WINDOWS)
175 /*
176 * Special case for WSAEnumNetworkEvents: If we receive 0 bytes that
177 * _could_ mean that the connection is closed. But we will receive an
178 * FD_CLOSE event later if the connection was _really_ closed. With
179 * www.youtube.com I see this very often. Closing the socket too early
180 * would be dangerous.
181 */
182 if (nn == 0 && !fCloseIfNothingRead)
183 return 0;
184#endif
185 if (nn < 0 && (errno == EINTR || errno == EAGAIN || errno == EWOULDBLOCK))
186 return 0;
187 else
188 {
189 /* nn == 0 means peer has performed an orderly shutdown */
190 DEBUG_MISC((dfd, " --- soread() disconnected, nn = %d, errno = %d-%s\n",
191 nn, errno,strerror(errno)));
192 sofcantrcvmore(so);
193 tcp_sockclosed(pData, sototcpcb(so));
194 return -1;
195 }
196 }
197
198#ifndef HAVE_READV
199 /*
200 * If there was no error, try and read the second time round
201 * We read again if n = 2 (ie, there's another part of the buffer)
202 * and we read as much as we could in the first read
203 * We don't test for <= 0 this time, because there legitimately
204 * might not be any more data (since the socket is non-blocking),
205 * a close will be detected on next iteration.
206 * A return of -1 wont (shouldn't) happen, since it didn't happen above
207 */
208 if (n == 2 && nn == iov[0].iov_len)
209 {
210 int ret;
211 ret = recv(so->s, iov[1].iov_base, iov[1].iov_len,0);
212 if (ret > 0)
213 nn += ret;
214 }
215
216 DEBUG_MISC((dfd, " ... read nn = %d bytes\n", nn));
217#endif
218
219 /* Update fields */
220 sb->sb_cc += nn;
221 sb->sb_wptr += nn;
222 if (sb->sb_wptr >= (sb->sb_data + sb->sb_datalen))
223 sb->sb_wptr -= sb->sb_datalen;
224 return nn;
225}
226
227/*
228 * Get urgent data
229 *
230 * When the socket is created, we set it SO_OOBINLINE,
231 * so when OOB data arrives, we soread() it and everything
232 * in the send buffer is sent as urgent data
233 */
234void
235sorecvoob(PNATState pData, struct socket *so)
236{
237 struct tcpcb *tp = sototcpcb(so);
238
239 DEBUG_CALL("sorecvoob");
240 DEBUG_ARG("so = %lx", (long)so);
241
242 /*
243 * We take a guess at how much urgent data has arrived.
244 * In most situations, when urgent data arrives, the next
245 * read() should get all the urgent data. This guess will
246 * be wrong however if more data arrives just after the
247 * urgent data, or the read() doesn't return all the
248 * urgent data.
249 */
250 soread(pData, so, /*fCloseIfNothingRead=*/false);
251 tp->snd_up = tp->snd_una + so->so_snd.sb_cc;
252 tp->t_force = 1;
253 tcp_output(pData, tp);
254 tp->t_force = 0;
255}
256
257/*
258 * Send urgent data
259 * There's a lot duplicated code here, but...
260 */
261int
262sosendoob(struct socket *so)
263{
264 struct sbuf *sb = &so->so_rcv;
265 char buff[2048]; /* XXX Shouldn't be sending more oob data than this */
266
267 int n, len;
268
269 DEBUG_CALL("sosendoob");
270 DEBUG_ARG("so = %lx", (long)so);
271 DEBUG_ARG("sb->sb_cc = %d", sb->sb_cc);
272
273 if (so->so_urgc > sizeof(buff))
274 so->so_urgc = sizeof(buff); /* XXX */
275
276 if (sb->sb_rptr < sb->sb_wptr)
277 {
278 /* We can send it directly */
279 n = send(so->s, sb->sb_rptr, so->so_urgc, (MSG_OOB)); /* |MSG_DONTWAIT)); */
280 so->so_urgc -= n;
281
282 DEBUG_MISC((dfd, " --- sent %d bytes urgent data, %d urgent bytes left\n",
283 n, so->so_urgc));
284 }
285 else
286 {
287 /*
288 * Since there's no sendv or sendtov like writev,
289 * we must copy all data to a linear buffer then
290 * send it all
291 */
292 len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr;
293 if (len > so->so_urgc)
294 len = so->so_urgc;
295 memcpy(buff, sb->sb_rptr, len);
296 so->so_urgc -= len;
297 if (so->so_urgc)
298 {
299 n = sb->sb_wptr - sb->sb_data;
300 if (n > so->so_urgc)
301 n = so->so_urgc;
302 memcpy(buff + len, sb->sb_data, n);
303 so->so_urgc -= n;
304 len += n;
305 }
306 n = send(so->s, buff, len, (MSG_OOB)); /* |MSG_DONTWAIT)); */
307#ifdef DEBUG
308 if (n != len)
309 DEBUG_ERROR((dfd, "Didn't send all data urgently XXXXX\n"));
310#endif
311 DEBUG_MISC((dfd, " ---2 sent %d bytes urgent data, %d urgent bytes left\n",
312 n, so->so_urgc));
313 }
314
315 sb->sb_cc -= n;
316 sb->sb_rptr += n;
317 if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen))
318 sb->sb_rptr -= sb->sb_datalen;
319
320 return n;
321}
322
323/*
324 * Write data from so_rcv to so's socket,
325 * updating all sbuf field as necessary
326 */
327int
328sowrite(PNATState pData, struct socket *so)
329{
330 int n,nn;
331 struct sbuf *sb = &so->so_rcv;
332 size_t len = sb->sb_cc;
333 struct iovec iov[2];
334
335 DEBUG_CALL("sowrite");
336 DEBUG_ARG("so = %lx", (long)so);
337
338 if (so->so_urgc)
339 {
340 sosendoob(so);
341 if (sb->sb_cc == 0)
342 return 0;
343 }
344
345 /*
346 * No need to check if there's something to write,
347 * sowrite wouldn't have been called otherwise
348 */
349
350 len = sb->sb_cc;
351
352 iov[0].iov_base = sb->sb_rptr;
353 iov[1].iov_base = 0;
354 iov[1].iov_len = 0;
355 if (sb->sb_rptr < sb->sb_wptr)
356 {
357 iov[0].iov_len = sb->sb_wptr - sb->sb_rptr;
358 /* Should never succeed, but... */
359 if (iov[0].iov_len > len)
360 iov[0].iov_len = len;
361 n = 1;
362 }
363 else
364 {
365 iov[0].iov_len = (sb->sb_data + sb->sb_datalen) - sb->sb_rptr;
366 if (iov[0].iov_len > len)
367 iov[0].iov_len = len;
368 len -= iov[0].iov_len;
369 if (len)
370 {
371 iov[1].iov_base = sb->sb_data;
372 iov[1].iov_len = sb->sb_wptr - sb->sb_data;
373 if (iov[1].iov_len > len)
374 iov[1].iov_len = len;
375 n = 2;
376 }
377 else
378 n = 1;
379 }
380 /* Check if there's urgent data to send, and if so, send it */
381#ifdef HAVE_READV
382 nn = writev(so->s, (const struct iovec *)iov, n);
383 DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn));
384#else
385 nn = send(so->s, iov[0].iov_base, iov[0].iov_len, 0);
386#endif
387 /* This should never happen, but people tell me it does *shrug* */
388 if (nn < 0 && (errno == EAGAIN || errno == EINTR || errno == EWOULDBLOCK))
389 return 0;
390
391 if (nn < 0 || (nn == 0 && iov[0].iov_len > 0))
392 {
393 DEBUG_MISC((dfd, " --- sowrite disconnected, so->so_state = %x, errno = %d\n",
394 so->so_state, errno));
395 sofcantsendmore(so);
396 tcp_sockclosed(pData, sototcpcb(so));
397 return -1;
398 }
399
400#ifndef HAVE_READV
401 if (n == 2 && nn == iov[0].iov_len)
402 {
403 int ret;
404 ret = send(so->s, iov[1].iov_base, iov[1].iov_len,0);
405 if (ret > 0)
406 nn += ret;
407 }
408 DEBUG_MISC((dfd, " ... wrote nn = %d bytes\n", nn));
409#endif
410
411 /* Update sbuf */
412 sb->sb_cc -= nn;
413 sb->sb_rptr += nn;
414 if (sb->sb_rptr >= (sb->sb_data + sb->sb_datalen))
415 sb->sb_rptr -= sb->sb_datalen;
416
417 /*
418 * If in DRAIN mode, and there's no more data, set
419 * it CANTSENDMORE
420 */
421 if ((so->so_state & SS_FWDRAIN) && sb->sb_cc == 0)
422 sofcantsendmore(so);
423
424 return nn;
425}
426
427/*
428 * recvfrom() a UDP socket
429 */
430void
431sorecvfrom(PNATState pData, struct socket *so)
432{
433 struct sockaddr_in addr;
434 socklen_t addrlen = sizeof(struct sockaddr_in);
435
436 DEBUG_CALL("sorecvfrom");
437 DEBUG_ARG("so = %lx", (long)so);
438
439 if (so->so_type == IPPROTO_ICMP)
440 {
441 /* This is a "ping" reply */
442#if !defined(VBOX_WITH_SLIRP_ICMP) || (defined(VBOX_WITH_SLIRP_ICMP) && !defined(RT_OS_WINDOWS))
443 sorecvfrom_icmp_unix(pData, so);
444#endif
445#if defined(VBOX_WITH_SLIRP_ICMP) && defined(RT_OS_WINDOWS)
446 sorecvfrom_icmp_win(pData, so);
447#endif
448 udp_detach(pData, so);
449 }
450 else
451 {
452 /* A "normal" UDP packet */
453 struct mbuf *m;
454 size_t len;
455 u_long n;
456
457 if (!(m = m_get(pData)))
458 return;
459 m->m_data += if_maxlinkhdr;
460
461 /*
462 * XXX Shouldn't FIONREAD packets destined for port 53,
463 * but I don't know the max packet size for DNS lookups
464 */
465 len = M_FREEROOM(m);
466 /* if (so->so_fport != htons(53)) */
467 {
468 ioctlsocket(so->s, FIONREAD, &n);
469
470 if (n > len)
471 {
472 n = (m->m_data - m->m_dat) + m->m_len + n + 1;
473 m_inc(m, n);
474 len = M_FREEROOM(m);
475 }
476 }
477
478 m->m_len = recvfrom(so->s, m->m_data, len, 0,
479 (struct sockaddr *)&addr, &addrlen);
480 DEBUG_MISC((dfd, " did recvfrom %d, errno = %d-%s\n",
481 m->m_len, errno,strerror(errno)));
482 if(m->m_len < 0)
483 {
484 u_char code = ICMP_UNREACH_PORT;
485
486 if (errno == EHOSTUNREACH)
487 code = ICMP_UNREACH_HOST;
488 else if(errno == ENETUNREACH)
489 code = ICMP_UNREACH_NET;
490
491 DEBUG_MISC((dfd," rx error, tx icmp ICMP_UNREACH:%i\n", code));
492 icmp_error(pData, so->so_m, ICMP_UNREACH,code, 0,strerror(errno));
493 m_free(pData, m);
494 }
495 else
496 {
497 /*
498 * Hack: domain name lookup will be used the most for UDP,
499 * and since they'll only be used once there's no need
500 * for the 4 minute (or whatever) timeout... So we time them
501 * out much quicker (10 seconds for now...)
502 */
503 if (so->so_expire)
504 {
505 if (so->so_fport == htons(53))
506 so->so_expire = curtime + SO_EXPIREFAST;
507 else
508 so->so_expire = curtime + SO_EXPIRE;
509 }
510
511#if 0
512 if (m->m_len == len)
513 {
514 m_inc(m, MINCSIZE);
515 m->m_len = 0;
516 }
517#endif
518
519 /*
520 * If this packet was destined for CTL_ADDR,
521 * make it look like that's where it came from, done by udp_output
522 */
523 udp_output(pData, so, m, &addr);
524 } /* rx error */
525 } /* if ping packet */
526}
527
528/*
529 * sendto() a socket
530 */
531int
532sosendto(PNATState pData, struct socket *so, struct mbuf *m)
533{
534 int ret;
535 struct sockaddr_in addr;
536#if 0
537 struct sockaddr_in host_addr;
538#endif
539
540 DEBUG_CALL("sosendto");
541 DEBUG_ARG("so = %lx", (long)so);
542 DEBUG_ARG("m = %lx", (long)m);
543
544 addr.sin_family = AF_INET;
545 if ((so->so_faddr.s_addr & htonl(pData->netmask)) == special_addr.s_addr)
546 {
547 /* It's an alias */
548 uint32_t last_byte = ntohl(so->so_faddr.s_addr) & ~pData->netmask;
549 switch(last_byte)
550 {
551#if 0
552 /* handle this case at 'default:' */
553 case CTL_BROADCAST:
554 addr.sin_addr.s_addr = INADDR_BROADCAST;
555 /* Send the packet to host to fully emulate broadcast */
556 /** @todo r=klaus: on Linux host this causes the host to receive
557 * the packet twice for some reason. And I cannot find any place
558 * in the man pages which states that sending a broadcast does not
559 * reach the host itself. */
560 host_addr.sin_family = AF_INET;
561 host_addr.sin_port = so->so_fport;
562 host_addr.sin_addr = our_addr;
563 sendto(so->s, m->m_data, m->m_len, 0,
564 (struct sockaddr *)&host_addr, sizeof (struct sockaddr));
565 break;
566#endif
567 case CTL_DNS:
568 if (!get_dns_addr(pData, &dns_addr))
569 addr.sin_addr = dns_addr;
570 else
571 addr.sin_addr = loopback_addr;
572 break;
573 case CTL_ALIAS:
574 default:
575 if (last_byte == ~pData->netmask)
576 addr.sin_addr.s_addr = INADDR_BROADCAST;
577 else
578 addr.sin_addr = loopback_addr;
579 break;
580 }
581 }
582 else
583 addr.sin_addr = so->so_faddr;
584 addr.sin_port = so->so_fport;
585
586 DEBUG_MISC((dfd, " sendto()ing, addr.sin_port=%d, addr.sin_addr.s_addr=%.16s\n",
587 ntohs(addr.sin_port), inet_ntoa(addr.sin_addr)));
588
589 /* Don't care what port we get */
590 ret = sendto(so->s, m->m_data, m->m_len, 0,
591 (struct sockaddr *)&addr, sizeof (struct sockaddr));
592 if (ret < 0)
593 {
594 LogRel(("UDP: sendto fails (%s)\n", strerror(errno)));
595 return -1;
596 }
597
598 /*
599 * Kill the socket if there's no reply in 4 minutes,
600 * but only if it's an expirable socket
601 */
602 if (so->so_expire)
603 so->so_expire = curtime + SO_EXPIRE;
604 so->so_state = SS_ISFCONNECTED; /* So that it gets select()ed */
605 return 0;
606}
607
608/*
609 * XXX This should really be tcp_listen
610 */
611struct socket *
612solisten(PNATState pData, u_int port, u_int32_t laddr, u_int lport, int flags)
613{
614 struct sockaddr_in addr;
615 struct socket *so;
616 socklen_t addrlen = sizeof(addr);
617 int s, opt = 1;
618
619 DEBUG_CALL("solisten");
620 DEBUG_ARG("port = %d", port);
621 DEBUG_ARG("laddr = %x", laddr);
622 DEBUG_ARG("lport = %d", lport);
623 DEBUG_ARG("flags = %x", flags);
624
625 if ((so = socreate()) == NULL)
626 {
627 /* free(so); Not sofree() ??? free(NULL) == NOP */
628 return NULL;
629 }
630
631 /* Don't tcp_attach... we don't need so_snd nor so_rcv */
632 if ((so->so_tcpcb = tcp_newtcpcb(pData, so)) == NULL)
633 {
634 free(so);
635 return NULL;
636 }
637 insque(pData, so,&tcb);
638
639 /*
640 * SS_FACCEPTONCE sockets must time out.
641 */
642 if (flags & SS_FACCEPTONCE)
643 so->so_tcpcb->t_timer[TCPT_KEEP] = TCPTV_KEEP_INIT*2;
644
645 so->so_state = (SS_FACCEPTCONN|flags);
646 so->so_lport = lport; /* Kept in network format */
647 so->so_laddr.s_addr = laddr; /* Ditto */
648
649 addr.sin_family = AF_INET;
650 addr.sin_addr.s_addr = INADDR_ANY;
651 addr.sin_port = port;
652
653 if ( ((s = socket(AF_INET,SOCK_STREAM,0)) < 0)
654 || (setsockopt(s,SOL_SOCKET,SO_REUSEADDR,(char *)&opt,sizeof(int)) < 0)
655 || (bind(s,(struct sockaddr *)&addr, sizeof(addr)) < 0)
656 || (listen(s,1) < 0))
657 {
658#ifdef RT_OS_WINDOWS
659 int tmperrno = WSAGetLastError(); /* Don't clobber the real reason we failed */
660 closesocket(s);
661 sofree(pData, so);
662 /* Restore the real errno */
663 WSASetLastError(tmperrno);
664#else
665 int tmperrno = errno; /* Don't clobber the real reason we failed */
666 close(s);
667 sofree(pData, so);
668 /* Restore the real errno */
669 errno = tmperrno;
670#endif
671 return NULL;
672 }
673 setsockopt(s,SOL_SOCKET,SO_OOBINLINE,(char *)&opt,sizeof(int));
674
675 getsockname(s,(struct sockaddr *)&addr,&addrlen);
676 so->so_fport = addr.sin_port;
677 if (addr.sin_addr.s_addr == 0 || addr.sin_addr.s_addr == loopback_addr.s_addr)
678 so->so_faddr = alias_addr;
679 else
680 so->so_faddr = addr.sin_addr;
681
682 so->s = s;
683 return so;
684}
685
/*
 * Data is available in so_rcv.
 *
 * Intentionally a no-op for now.  The idea was to write() the data to the
 * socket right away (sowrite() followed by clearing the descriptor from
 * writefds), but that is not enabled yet.
 */
void
sorwakeup(struct socket *so)
{
    (void)so;
}
699
/*
 * Data has been freed in so_snd, so there is room for a read() if wanted.
 *
 * Intentionally a no-op: the read is left to the main loop.
 */
void
sowwakeup(struct socket *so)
{
    (void)so;
}
709
710/*
711 * Various session state calls
712 * XXX Should be #define's
713 * The socket state stuff needs work, these often get call 2 or 3
714 * times each when only 1 was needed
715 */
716void
717soisfconnecting(struct socket *so)
718{
719 so->so_state &= ~(SS_NOFDREF|SS_ISFCONNECTED|SS_FCANTRCVMORE|
720 SS_FCANTSENDMORE|SS_FWDRAIN);
721 so->so_state |= SS_ISFCONNECTING; /* Clobber other states */
722}
723
724void
725soisfconnected(struct socket *so)
726{
727 so->so_state &= ~(SS_ISFCONNECTING|SS_FWDRAIN|SS_NOFDREF);
728 so->so_state |= SS_ISFCONNECTED; /* Clobber other states */
729}
730
731void
732sofcantrcvmore(struct socket *so)
733{
734 if ((so->so_state & SS_NOFDREF) == 0)
735 {
736 shutdown(so->s,0);
737 }
738 so->so_state &= ~(SS_ISFCONNECTING);
739 if (so->so_state & SS_FCANTSENDMORE)
740 so->so_state = SS_NOFDREF; /* Don't select it */
741 /* XXX close() here as well? */
742 else
743 so->so_state |= SS_FCANTRCVMORE;
744}
745
746void
747sofcantsendmore(struct socket *so)
748{
749 if ((so->so_state & SS_NOFDREF) == 0)
750 shutdown(so->s, 1); /* send FIN to fhost */
751
752 so->so_state &= ~(SS_ISFCONNECTING);
753 if (so->so_state & SS_FCANTRCVMORE)
754 so->so_state = SS_NOFDREF; /* as above */
755 else
756 so->so_state |= SS_FCANTSENDMORE;
757}
758
/*
 * Foreign host disconnected.
 *
 * Intentionally a no-op.  An earlier, disabled implementation cleared the
 * connecting/connected flags, close()d the descriptor and set the state to
 * SS_ISFDISCONNECTED.
 * XXX Do nothing ... ?
 */
void
soisfdisconnected(struct socket *so)
{
    (void)so;
}
771
772/*
773 * Set write drain mode
774 * Set CANTSENDMORE once all data has been write()n
775 */
776void
777sofwdrain(struct socket *so)
778{
779 if (so->so_rcv.sb_cc)
780 so->so_state |= SS_FWDRAIN;
781 else
782 sofcantsendmore(so);
783}
784
785#ifdef VBOX_WITH_SLIRP_ICMP
786static void
787send_icmp_to_guest(PNATState pData, char *buff, size_t len, struct socket *so, const struct sockaddr_in *addr)
788{
789 struct ip *ip;
790 uint32_t dst,src;
791 char ip_copy[256];
792 struct icmp *icp;
793 int old_ip_len;
794 struct mbuf *m;
795 struct icmp_msg *icm;
796
797 ip = (struct ip *)buff;
798 icp = (struct icmp *)((char *)ip + (ip->ip_hl << 2));
799
800 LogRel(("ICMP:received msg(t:%d, c:%d)\n", icp->icmp_type, icp->icmp_code));
801 if (icp->icmp_type != ICMP_ECHOREPLY && icp->icmp_type != ICMP_TIMXCEED)
802 {
803 return;
804 }
805
806 if (icp->icmp_type == ICMP_TIMXCEED)
807 ip = &icp->icmp_ip;
808
809 icm = icmp_find_original_mbuf(pData, ip);
810
811 if (icm == NULL)
812 {
813 LogRel(("NAT: Can't find the corresponding packet for the received ICMP\n"));
814 return;
815 }
816
817 m = icm->im_m;
818 Assert(m != NULL);
819
820 src = addr->sin_addr.s_addr;
821
822 ip = mtod(m, struct ip *);
823 /* Now ip is pointing on header we've sent from guest */
824 if (icp->icmp_type == ICMP_TIMXCEED)
825 {
826 old_ip_len = (ip->ip_hl << 2) + 64;
827 memcpy(ip_copy, ip, old_ip_len);
828 }
829
830 /* source address from original IP packet*/
831 dst = ip->ip_src.s_addr;
832
833 /* overide ther tail of old packet */
834 memcpy(m->m_data, buff, len);
835 m->m_len = len;
836 ip = mtod(m, struct ip *); /* ip is from mbuf we've overrided */
837
838 icp = (struct icmp *)((char *)ip + (ip->ip_hl << 2));
839 if (icp->icmp_type == ICMP_TIMXCEED)
840 {
841 /* according RFC 793 error messages required copy of initial IP header + 64 bit */
842 memcpy(&icp->icmp_ip, ip_copy, old_ip_len);
843 ip->ip_tos = ((ip->ip_tos & 0x1E) | 0xC0); /* high priority for errors */
844 }
845
846 /* the low level expects fields to be in host format so let's convert them*/
847 NTOHS(ip->ip_len);
848 NTOHS(ip->ip_off);
849 NTOHS(ip->ip_id);
850 ip->ip_src.s_addr = src;
851 ip->ip_dst.s_addr = dst;
852 icmp_reflect(pData, m);
853 LIST_REMOVE(icm, im_list);
854 /* Don't call m_free here*/
855 free(icm);
856}
857
858# ifdef RT_OS_WINDOWS
859static void
860sorecvfrom_icmp_win(PNATState pData, struct socket *so)
861{
862 int len;
863 int i;
864 struct ip *ip;
865 struct mbuf *m;
866 struct icmp *icp;
867 struct icmp_msg *icm;
868 struct ip *ip_broken; /* ICMP returns header + 64 bit of packet */
869 uint32_t src;
870 ICMP_ECHO_REPLY *icr;
871 u_char code = ~0;
872 len = pData->pfIcmpParseReplies(pData->pvIcmpBuffer, pData->szIcmpBuffer);
873 if (len < 0)
874 {
875 LogRel(("NAT: Error (%d) occurred on ICMP receiving\n", GetLastError()));
876 return;
877 }
878 if (len == 0)
879 return; /* no error */
880 LogRel(("IcmpParseReplies returns %ld\n", len));
881 icr = (ICMP_ECHO_REPLY *)pData->pvIcmpBuffer;
882 for (i = 0; i < len; ++i)
883 {
884 switch(icr[i].Status)
885 {
886 case IP_DEST_HOST_UNREACHABLE:
887 code = (code != ~0 ? code : ICMP_UNREACH_HOST);
888 case IP_DEST_NET_UNREACHABLE:
889 code = (code != ~0 ? code : ICMP_UNREACH_NET);
890 case IP_DEST_PROT_UNREACHABLE:
891 code = (code != ~0 ? code : ICMP_UNREACH_PROTOCOL);
892 /* UNREACH error inject here */
893 case IP_DEST_PORT_UNREACHABLE:
894 code = (code != ~0 ? code : ICMP_UNREACH_PORT);
895 icmp_error(pData, so->so_m, ICMP_UNREACH, code, 0, "Error occurred!!!");
896 break;
897 case IP_SUCCESS: /* echo replied */
898 m = m_get(pData);
899 ip = mtod(m, struct ip *);
900 ip->ip_src.s_addr = icr[i].Address;
901 ip->ip_p = IPPROTO_ICMP;
902 ip->ip_dst.s_addr = so->so_laddr.s_addr; /*XXX: still the hack*/
903 ip->ip_hl = sizeof(struct ip) >> 2; /* requiered for icmp_reflect, no IP options */
904 ip->ip_ttl = icr[i].Options.Ttl;
905
906 icp = (struct icmp *)&ip[1]; /* no options */
907 icp->icmp_type = ICMP_ECHOREPLY;
908 icp->icmp_code = 0;
909 icp->icmp_id = so->so_icmp_id;
910 icp->icmp_seq = so->so_icmp_seq;
911 memcpy(icp->icmp_data, icr[i].Data, icr[i].DataSize);
912
913 ip->ip_len = sizeof(struct ip) + ICMP_MINLEN + icr[i].DataSize;
914 m->m_len = ip->ip_len;
915
916 icmp_reflect(pData, m);
917 case IP_TTL_EXPIRED_TRANSIT: /* TTL expired */
918
919 ip_broken = icr[i].Data;
920 icm = icmp_find_original_mbuf(pData, ip_broken);
921 if (icm == NULL) {
922 LogRel(("ICMP: can't find original package (first double word %x)\n", *(uint32_t *)ip_broken));
923 return;
924 }
925 m = icm->im_m;
926 ip = mtod(m, struct ip *);
927 ip->ip_ttl = icr[i].Options.Ttl;
928 src = ip->ip_src.s_addr;
929 ip->ip_dst.s_addr = src;
930 ip->ip_dst.s_addr = icr[i].Address;
931 icp = (struct icmp *)((char *)ip + (ip->ip_hl << 2));
932 ip_broken->ip_src.s_addr = src; /*it packet sent from host not from guest*/
933 memcpy(icp->icmp_data, ip_broken, (ip_broken->ip_hl << 2) + 64);
934 icmp_reflect(pData, m);
935 break;
936 default:
937 LogRel(("ICMP(default): message with Status: %x was received from %x\n", icr[i].Status, icr[i].Address));
938 break;
939 }
940 }
941}
942# endif /* RT_OS_WINDOWS */
943#endif /* VBOX_WITH_SLIRP_ICMP */
944
945static void sorecvfrom_icmp_unix(PNATState pData, struct socket *so)
946{
947 struct sockaddr_in addr;
948 socklen_t addrlen = sizeof(struct sockaddr_in);
949 char buff[1500];
950 int len;
951 len = recvfrom(so->s, buff, 1500, 0,
952 (struct sockaddr *)&addr, &addrlen);
953 /* XXX Check if reply is "correct"? */
954
955 if (len == -1 || len == 0)
956 {
957 u_char code = ICMP_UNREACH_PORT;
958
959 if (errno == EHOSTUNREACH)
960 code = ICMP_UNREACH_HOST;
961 else if(errno == ENETUNREACH)
962 code = ICMP_UNREACH_NET;
963
964 DEBUG_MISC((dfd," udp icmp rx errno = %d-%s\n",
965 errno,strerror(errno)));
966 icmp_error(pData, so->so_m, ICMP_UNREACH,code, 0,strerror(errno));
967 }
968 else
969 {
970#ifdef VBOX_WITH_SLIRP_ICMP
971 send_icmp_to_guest(pData, buff, len, so, &addr);
972#else
973 icmp_reflect(pData, so->so_m);
974 so->so_m = 0; /* Don't m_free() it again! */
975#endif
976 }
977}
978
注意: 瀏覽 TracBrowser 來幫助您使用儲存庫瀏覽器

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette