VirtualBox

source: vbox/trunk/src/VBox/NetworkServices/NAT/proxy.c@ 54895

Last change on this file since 54895 was 54895, checked in by vboxsync, 10 years ago

NAT/Network: group windows and unix code to make socket non-blocking
into one #if/#elif.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 17.1 KB
Line 
1/* $Id: proxy.c 54895 2015-03-21 21:39:24Z vboxsync $ */
2/** @file
3 * NAT Network - proxy setup and utilities.
4 */
5
6/*
7 * Copyright (C) 2013-2014 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18#define LOG_GROUP LOG_GROUP_NAT_SERVICE
19
20#include "winutils.h"
21
22#include "proxy.h"
23#include "proxy_pollmgr.h"
24#include "portfwd.h"
25
26#include "lwip/opt.h"
27
28#include "lwip/sys.h"
29#include "lwip/tcpip.h"
30
31#ifndef RT_OS_WINDOWS
32#include <sys/poll.h>
33#include <sys/socket.h>
34#include <netinet/in.h>
35#include <arpa/inet.h>
36#include <fcntl.h>
37#include <stdio.h>
38#include <iprt/string.h>
39#include <unistd.h>
40#include <err.h>
41#else
42# include <iprt/string.h>
43#endif
44
45#if defined(SOCK_NONBLOCK) && defined(RT_OS_NETBSD) /* XXX: PR kern/47569 */
46# undef SOCK_NONBLOCK
47#endif
48
/*
 * Number of elements in a true array (not a pointer).  Only defined
 * here when the platform headers have not already provided it.  The
 * argument is parenthesized so that non-trivial array expressions
 * index correctly.
 */
#ifndef __arraycount
# define __arraycount(a) (sizeof(a) / sizeof((a)[0]))
#endif
52
/* Formatter callback registered for the "sockerr" format type in proxy_init(). */
53static FNRTSTRFORMATTYPE proxy_sockerr_rtstrfmt;
54
/* Common socket factory used by proxy_connected_socket() and proxy_bound_socket(). */
55static SOCKET proxy_create_socket(int, int);
56
/* Proxy options; assigned once in proxy_init() from its "opts" argument. */
57volatile struct proxy_options *g_proxy_options;
/* Handle of the poll manager thread created at the end of proxy_init(). */
58static sys_thread_t pollmgr_tid;
59
60/* XXX: for mapping loopbacks to addresses in our network (ip4) */
/* Assigned in proxy_init() from its "proxy_netif" argument. */
61struct netif *g_proxy_netif;
62
63
64/*
65 * Called on the lwip thread (aka tcpip thread) from tcpip_init() via
66 * its "tcpip_init_done" callback. Raw API is ok to use here
67 * (e.g. rtadvd), but netconn API is not.
68 */
69void
70proxy_init(struct netif *proxy_netif, struct proxy_options *opts)
71{
72 int status;
73
74 LWIP_ASSERT1(opts != NULL);
75 LWIP_UNUSED_ARG(proxy_netif);
76
77 status = RTStrFormatTypeRegister("sockerr", proxy_sockerr_rtstrfmt, NULL);
78 AssertRC(status);
79
80 g_proxy_options = opts;
81 g_proxy_netif = proxy_netif;
82
83#if 1
84 proxy_rtadvd_start(proxy_netif);
85#endif
86
87 /*
88 * XXX: We use stateless DHCPv6 only to report IPv6 address(es) of
89 * nameserver(s). Since we don't yet support IPv6 addresses in
90 * HostDnsService, there's no point in running DHCPv6.
91 */
92#if 0
93 dhcp6ds_init(proxy_netif);
94#endif
95
96 if (opts->tftp_root != NULL) {
97 tftpd_init(proxy_netif, opts->tftp_root);
98 }
99
100 status = pollmgr_init();
101 if (status < 0) {
102 errx(EXIT_FAILURE, "failed to initialize poll manager");
103 /* NOTREACHED */
104 }
105
106 pxtcp_init();
107 pxudp_init();
108
109 portfwd_init();
110
111 pxdns_init(proxy_netif);
112
113 pxping_init(proxy_netif, opts->icmpsock4, opts->icmpsock6);
114
115 pollmgr_tid = sys_thread_new("pollmgr_thread",
116 pollmgr_thread, NULL,
117 DEFAULT_THREAD_STACKSIZE,
118 DEFAULT_THREAD_PRIO);
119 if (!pollmgr_tid) {
120 errx(EXIT_FAILURE, "failed to create poll manager thread");
121 /* NOTREACHED */
122 }
123}
124
125
126#if !defined(RT_OS_WINDOWS)
127/**
128 * Formatter for %R[sockerr] - unix strerror_r() version.
129 */
130static DECLCALLBACK(size_t)
131proxy_sockerr_rtstrfmt(PFNRTSTROUTPUT pfnOutput, void *pvArgOutput,
132 const char *pszType, const void *pvValue,
133 int cchWidth, int cchPrecision, unsigned int fFlags,
134 void *pvUser)
135{
136 const int error = (int)(intptr_t)pvValue;
137 size_t cb = 0;
138
139 const char *msg = NULL;
140 char buf[128];
141
142 NOREF(cchWidth);
143 NOREF(cchPrecision);
144 NOREF(fFlags);
145 NOREF(pvUser);
146
147 AssertReturn(strcmp(pszType, "sockerr") == 0, 0);
148
149 /* make sure return type mismatch is caught */
150#if defined(RT_OS_LINUX) && defined(_GNU_SOURCE)
151 msg = strerror_r(error, buf, sizeof(buf));
152#else
153 {
154 int status = strerror_r(error, buf, sizeof(buf));
155 msg = buf;
156 }
157#endif
158 return RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL, "%s", msg);
159}
160
161#else /* RT_OS_WINDOWS */
162
163/**
164 * Formatter for %R[sockerr] - windows FormatMessage() version.
165 */
166static DECLCALLBACK(size_t)
167proxy_sockerr_rtstrfmt(PFNRTSTROUTPUT pfnOutput, void *pvArgOutput,
168 const char *pszType, const void *pvValue,
169 int cchWidth, int cchPrecision, unsigned int fFlags,
170 void *pvUser)
171{
172 const int error = (int)(intptr_t)pvValue;
173 size_t cb = 0;
174
175 NOREF(cchWidth);
176 NOREF(cchPrecision);
177 NOREF(fFlags);
178 NOREF(pvUser);
179
180 AssertReturn(strcmp(pszType, "sockerr") == 0, 0);
181
182 /*
183 * XXX: Windows strerror() doesn't handle posix error codes, but
184 * since winsock uses its own, it shouldn't be much of a problem.
185 * If you see a strange error message, it's probably from
186 * FormatMessage() for an error from <WinError.h> that has the
187 * same numeric value.
188 */
189 if (error < _sys_nerr) {
190 char buf[128] = "";
191 int status;
192
193 status = strerror_s(buf, sizeof(buf), error);
194 if (status == 0) {
195 if (strcmp(buf, "Unknown error") == 0) {
196 /* windows strerror() doesn't add the numeric value */
197 cb += RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL,
198 "Unknown error: %d", error);
199 }
200 else {
201 cb += RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL,
202 "%s", buf);
203 }
204 }
205 else {
206 cb += RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL,
207 "Unknown error: %d", error);
208 }
209 }
210 else {
211 DWORD nchars;
212 char *msg = NULL;
213
214 nchars = FormatMessageA(FORMAT_MESSAGE_FROM_SYSTEM
215 | FORMAT_MESSAGE_ALLOCATE_BUFFER,
216 NULL, error, LANG_NEUTRAL,
217 (LPSTR)&msg, 0,
218 NULL);
219 if (nchars == 0 || msg == NULL) {
220 cb += RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL,
221 "Unknown error: %d", error);
222 }
223 else {
224 /* FormatMessage() "helpfully" adds newline; get rid of it */
225 char *crpos = strchr(msg, '\r');
226 if (crpos != NULL) {
227 *crpos = '\0';
228 }
229
230 cb += RTStrFormat(pfnOutput, pvArgOutput, NULL, NULL,
231 "%s", msg);
232 }
233
234 if (msg != NULL) {
235 LocalFree(msg);
236 }
237 }
238
239 return cb;
240}
241#endif /* RT_OS_WINDOWS */
242
243
244/**
245 * Send static callback message from poll manager thread to lwip
246 * thread, scheduling a function call in lwip thread context.
247 *
248 * XXX: Existing lwip api only provides non-blocking version for this.
249 * It may fail when lwip thread is not running (mbox invalid) or if
250 * post failed (mbox full). How to handle these?
251 */
252void
253proxy_lwip_post(struct tcpip_msg *msg)
254{
255 struct tcpip_callback_msg *m;
256 err_t error;
257
258 LWIP_ASSERT1(msg != NULL);
259
260 /*
261 * lwip plays games with fake incomplete struct tag to enforce API
262 */
263 m = (struct tcpip_callback_msg *)msg;
264 error = tcpip_callbackmsg(m);
265
266 if (error == ERR_VAL) {
267 /* XXX: lwip thread is not running (mbox invalid) */
268 LWIP_ASSERT1(error != ERR_VAL);
269 }
270
271 LWIP_ASSERT1(error == ERR_OK);
272}
273
274
275/**
276 * Create a non-blocking socket. Disable SIGPIPE for TCP sockets if
277 * possible. On Linux it's not possible and should be disabled for
278 * each send(2) individually.
279 */
280static SOCKET
281proxy_create_socket(int sdom, int stype)
282{
283 SOCKET s;
284 int stype_and_flags;
285 int status;
286
287 LWIP_UNUSED_ARG(status); /* depends on ifdefs */
288
289
290 stype_and_flags = stype;
291
292#if defined(SOCK_NONBLOCK)
293 stype_and_flags |= SOCK_NONBLOCK;
294#endif
295
296 /*
297 * Disable SIGPIPE on disconnected socket. It might be easier to
298 * forgo it and just use MSG_NOSIGNAL on each send*(2), since we
299 * have to do it for Linux anyway, but Darwin does NOT have that
300 * flag (but has SO_NOSIGPIPE socket option).
301 */
302#if !defined(SOCK_NOSIGPIPE) && !defined(SO_NOSIGPIPE) && !defined(MSG_NOSIGNAL)
303#if 0 /* XXX: Solaris has neither, the program should ignore SIGPIPE globally */
304#error Need a way to disable SIGPIPE on connection oriented sockets!
305#endif
306#endif
307
308#if defined(SOCK_NOSIGPIPE)
309 if (stype == SOCK_STREAM) {
310 stype_and_flags |= SOCK_NOSIGPIPE;
311 }
312#endif
313
314 s = socket(sdom, stype_and_flags, 0);
315 if (s == INVALID_SOCKET) {
316 DPRINTF(("socket: %R[sockerr]\n", SOCKERRNO()));
317 return INVALID_SOCKET;
318 }
319
320#if defined(RT_OS_WINDOWS)
321 {
322 u_long mode = 1;
323 status = ioctlsocket(s, FIONBIO, &mode);
324 if (status == SOCKET_ERROR) {
325 DPRINTF(("FIONBIO: %R[sockerr]\n", SOCKERRNO()));
326 closesocket(s);
327 return INVALID_SOCKET;
328 }
329 }
330#elif !defined(SOCK_NONBLOCK)
331 {
332 int sflags;
333
334 sflags = fcntl(s, F_GETFL, 0);
335 if (sflags < 0) {
336 DPRINTF(("F_GETFL: %R[sockerr]\n", SOCKERRNO()));
337 closesocket(s);
338 return INVALID_SOCKET;
339 }
340
341 status = fcntl(s, F_SETFL, sflags | O_NONBLOCK);
342 if (status < 0) {
343 DPRINTF(("O_NONBLOCK: %R[sockerr]\n", SOCKERRNO()));
344 closesocket(s);
345 return INVALID_SOCKET;
346 }
347 }
348#endif
349
350#if !defined(SOCK_NOSIGPIPE) && defined(SO_NOSIGPIPE)
351 if (stype == SOCK_STREAM) {
352 int on = 1;
353 const socklen_t onlen = sizeof(on);
354
355 status = setsockopt(s, SOL_SOCKET, SO_NOSIGPIPE, &on, onlen);
356 if (status < 0) {
357 DPRINTF(("SO_NOSIGPIPE: %R[sockerr]\n", SOCKERRNO()));
358 closesocket(s);
359 return INVALID_SOCKET;
360 }
361 }
362#endif
363
364 return s;
365}
366
367
368/**
369 * Create a socket for outbound connection to dst_addr:dst_port.
370 *
371 * The socket is non-blocking and TCP sockets has SIGPIPE disabled if
372 * possible. On Linux it's not possible and should be disabled for
373 * each send(2) individually.
374 */
375SOCKET
376proxy_connected_socket(int sdom, int stype,
377 ipX_addr_t *dst_addr, u16_t dst_port)
378{
379 struct sockaddr_in6 dst_sin6;
380 struct sockaddr_in dst_sin;
381 struct sockaddr *pdst_sa;
382 socklen_t dst_sa_len;
383 void *pdst_addr;
384 const struct sockaddr *psrc_sa;
385 socklen_t src_sa_len;
386 int status;
387 int sockerr;
388 SOCKET s;
389
390 LWIP_ASSERT1(sdom == PF_INET || sdom == PF_INET6);
391 LWIP_ASSERT1(stype == SOCK_STREAM || stype == SOCK_DGRAM);
392
393 DPRINTF(("---> %s ", stype == SOCK_STREAM ? "TCP" : "UDP"));
394 if (sdom == PF_INET6) {
395 pdst_sa = (struct sockaddr *)&dst_sin6;
396 pdst_addr = (void *)&dst_sin6.sin6_addr;
397
398 memset(&dst_sin6, 0, sizeof(dst_sin6));
399#if HAVE_SA_LEN
400 dst_sin6.sin6_len =
401#endif
402 dst_sa_len = sizeof(dst_sin6);
403 dst_sin6.sin6_family = AF_INET6;
404 memcpy(&dst_sin6.sin6_addr, &dst_addr->ip6, sizeof(ip6_addr_t));
405 dst_sin6.sin6_port = htons(dst_port);
406
407 DPRINTF(("[%RTnaipv6]:%d ", &dst_sin6.sin6_addr, dst_port));
408 }
409 else { /* sdom = PF_INET */
410 pdst_sa = (struct sockaddr *)&dst_sin;
411 pdst_addr = (void *)&dst_sin.sin_addr;
412
413 memset(&dst_sin, 0, sizeof(dst_sin));
414#if HAVE_SA_LEN
415 dst_sin.sin_len =
416#endif
417 dst_sa_len = sizeof(dst_sin);
418 dst_sin.sin_family = AF_INET;
419 dst_sin.sin_addr.s_addr = dst_addr->ip4.addr; /* byte-order? */
420 dst_sin.sin_port = htons(dst_port);
421
422 DPRINTF(("%RTnaipv4:%d ", dst_sin.sin_addr.s_addr, dst_port));
423 }
424
425 s = proxy_create_socket(sdom, stype);
426 if (s == INVALID_SOCKET) {
427 return INVALID_SOCKET;
428 }
429 DPRINTF(("socket %d\n", s));
430
431 /* TODO: needs locking if dynamic modifyvm is allowed */
432 if (sdom == PF_INET6) {
433 psrc_sa = (const struct sockaddr *)g_proxy_options->src6;
434 src_sa_len = sizeof(struct sockaddr_in6);
435 }
436 else {
437 psrc_sa = (const struct sockaddr *)g_proxy_options->src4;
438 src_sa_len = sizeof(struct sockaddr_in);
439 }
440 if (psrc_sa != NULL) {
441 status = bind(s, psrc_sa, src_sa_len);
442 if (status == SOCKET_ERROR) {
443 sockerr = SOCKERRNO();
444 DPRINTF(("socket %d: bind: %R[sockerr]\n", s, sockerr));
445 closesocket(s);
446 SET_SOCKERRNO(sockerr);
447 return INVALID_SOCKET;
448 }
449 }
450
451 status = connect(s, pdst_sa, dst_sa_len);
452 if (status == SOCKET_ERROR
453#if !defined(RT_OS_WINDOWS)
454 && SOCKERRNO() != EINPROGRESS
455#else
456 && SOCKERRNO() != EWOULDBLOCK
457#endif
458 )
459 {
460 sockerr = SOCKERRNO();
461 DPRINTF(("socket %d: connect: %R[sockerr]\n", s, sockerr));
462 closesocket(s);
463 SET_SOCKERRNO(sockerr);
464 return INVALID_SOCKET;
465 }
466
467 return s;
468}
469
470
471/**
472 * Create a socket for inbound (port-forwarded) connections to
473 * src_addr (port is part of sockaddr, so not a separate argument).
474 *
475 * The socket is non-blocking and TCP sockets has SIGPIPE disabled if
476 * possible. On Linux it's not possible and should be disabled for
477 * each send(2) individually.
478 *
479 * TODO?: Support v6-mapped v4 so that user can specify she wants
480 * "udp" and get both versions?
481 */
482SOCKET
483proxy_bound_socket(int sdom, int stype, struct sockaddr *src_addr)
484{
485 SOCKET s;
486 int on;
487 const socklen_t onlen = sizeof(on);
488 int status;
489 int sockerr;
490
491 s = proxy_create_socket(sdom, stype);
492 if (s == INVALID_SOCKET) {
493 return INVALID_SOCKET;
494 }
495 DPRINTF(("socket %d\n", s));
496
497 on = 1;
498 status = setsockopt(s, SOL_SOCKET, SO_REUSEADDR, (char *)&on, onlen);
499 if (status < 0) { /* not good, but not fatal */
500 DPRINTF(("SO_REUSEADDR: %R[sockerr]\n", SOCKERRNO()));
501 }
502
503 status = bind(s, src_addr,
504 sdom == PF_INET ?
505 sizeof(struct sockaddr_in)
506 : sizeof(struct sockaddr_in6));
507 if (status == SOCKET_ERROR) {
508 sockerr = SOCKERRNO();
509 DPRINTF(("bind: %R[sockerr]\n", sockerr));
510 closesocket(s);
511 SET_SOCKERRNO(sockerr);
512 return INVALID_SOCKET;
513 }
514
515 if (stype == SOCK_STREAM) {
516 status = listen(s, 5);
517 if (status == SOCKET_ERROR) {
518 sockerr = SOCKERRNO();
519 DPRINTF(("listen: %R[sockerr]\n", sockerr));
520 closesocket(s);
521 SET_SOCKERRNO(sockerr);
522 return INVALID_SOCKET;
523 }
524 }
525
526 return s;
527}
528
529
530void
531proxy_reset_socket(SOCKET s)
532{
533 struct linger linger;
534
535 linger.l_onoff = 1;
536 linger.l_linger = 0;
537
538 /* On Windows we can run into issue here, perhaps SO_LINGER isn't enough, and
539 * we should use WSA{Send,Recv}Disconnect instead.
540 *
541 * Links for the reference:
542 * http://msdn.microsoft.com/en-us/library/windows/desktop/ms738547%28v=vs.85%29.aspx
543 * http://bugs.sun.com/bugdatabase/view_bug.do?bug_id=4468997
544 */
545 setsockopt(s, SOL_SOCKET, SO_LINGER, (char *)&linger, sizeof(linger));
546
547 closesocket(s);
548}
549
550
551int
552proxy_sendto(SOCKET sock, struct pbuf *p, void *name, size_t namelen)
553{
554 struct pbuf *q;
555 size_t i, clen;
556#ifndef RT_OS_WINDOWS
557 struct msghdr mh;
558 ssize_t nsent;
559#else
560 DWORD nsent;
561#endif
562 int rc;
563 IOVEC fixiov[8]; /* fixed size (typical case) */
564 const size_t fixiovsize = sizeof(fixiov)/sizeof(fixiov[0]);
565 IOVEC *dyniov; /* dynamically sized */
566 IOVEC *iov;
567 int error = 0;
568
569 /*
570 * Static iov[] is usually enough since UDP protocols use small
571 * datagrams to avoid fragmentation, but be prepared.
572 */
573 clen = pbuf_clen(p);
574 if (clen > fixiovsize) {
575 /*
576 * XXX: TODO: check that clen is shorter than IOV_MAX
577 */
578 dyniov = (IOVEC *)malloc(clen * sizeof(*dyniov));
579 if (dyniov == NULL) {
580 error = -errno; /* sic: not a socket error */
581 goto out;
582 }
583 iov = dyniov;
584 }
585 else {
586 dyniov = NULL;
587 iov = fixiov;
588 }
589
590
591 for (q = p, i = 0; i < clen; q = q->next, ++i) {
592 LWIP_ASSERT1(q != NULL);
593
594 IOVEC_SET_BASE(iov[i], q->payload);
595 IOVEC_SET_LEN(iov[i], q->len);
596 }
597
598#ifndef RT_OS_WINDOWS
599 memset(&mh, 0, sizeof(mh));
600 mh.msg_name = name;
601 mh.msg_namelen = namelen;
602 mh.msg_iov = iov;
603 mh.msg_iovlen = clen;
604
605 nsent = sendmsg(sock, &mh, 0);
606 rc = (nsent >= 0) ? 0 : SOCKET_ERROR;
607#else
608 rc = WSASendTo(sock, iov, (DWORD)clen, &nsent, 0,
609 name, (int)namelen, NULL, NULL);
610#endif
611 if (rc == SOCKET_ERROR) {
612 error = SOCKERRNO();
613 DPRINTF(("%s: socket %d: sendmsg: %R[sockerr]\n",
614 __func__, sock, error));
615 error = -error;
616 }
617
618 out:
619 if (dyniov != NULL) {
620 free(dyniov);
621 }
622 return error;
623}
624
625
/*
 * Symbolic names of lwip error codes, looked up by proxy_lwip_strerr()
 * using the negated error value as index.  Both the strings and the
 * table itself are read-only.
 */
static const char * const lwiperr[] = {
    "ERR_OK",
    "ERR_MEM",
    "ERR_BUF",
    "ERR_TIMEOUT",
    "ERR_RTE",
    "ERR_INPROGRESS",
    "ERR_VAL",
    "ERR_WOULDBLOCK",
    "ERR_USE",
    "ERR_ISCONN",
    "ERR_ABRT",
    "ERR_RST",
    "ERR_CLSD",
    "ERR_CONN",
    "ERR_ARG",
    "ERR_IF"
};
644
645
646const char *
647proxy_lwip_strerr(err_t error)
648{
649 static char buf[32];
650 int e = -error;
651
652 if (0 <= e && e < (int)__arraycount(lwiperr)) {
653 return lwiperr[e];
654 }
655 else {
656 RTStrPrintf(buf, sizeof(buf), "unknown error %d", error);
657 return buf;
658 }
659}
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette