wget/src/connect.c

551 lines
13 KiB
C
Raw Normal View History

/* Establishing and handling network connections.
   Copyright (C) 1995, 1996, 1997, 2001, 2002 Free Software Foundation, Inc.

This file is part of GNU Wget.

GNU Wget is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.

GNU Wget is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Wget; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.  */
#include <config.h>
#include <stdio.h>
#include <sys/types.h>
#ifdef HAVE_UNISTD_H
# include <unistd.h>
#endif
#include <assert.h>
1999-12-02 15:42:23 +08:00
#ifdef WINDOWS
# include <winsock.h>
#else
# include <sys/socket.h>
# include <netdb.h>
# include <netinet/in.h>
#ifndef __BEOS__
1999-12-02 15:42:23 +08:00
# include <arpa/inet.h>
#endif
1999-12-02 15:42:23 +08:00
#endif /* WINDOWS */
#include <errno.h>
#ifdef HAVE_STRING_H
# include <string.h>
#else
# include <strings.h>
#endif /* HAVE_STRING_H */
#ifdef HAVE_SYS_SELECT_H
# include <sys/select.h>
#endif /* HAVE_SYS_SELECT_H */
/* To implement connect with timeout, we need signal and either
sigsetjmp or sigblock. */
#undef UNIX_CONNECT_TIMEOUT
#ifdef HAVE_SIGNAL_H
# include <signal.h>
#endif
#ifdef HAVE_SETJMP_H
# include <setjmp.h>
#endif
/* If sigsetjmp is a macro, configure won't pick it up. */
#ifdef sigsetjmp
# define HAVE_SIGSETJMP
#endif
#ifdef HAVE_SIGNAL
# ifdef HAVE_SIGSETJMP
# define UNIX_CONNECT_TIMEOUT
# endif
# ifdef HAVE_SIGBLOCK
# define UNIX_CONNECT_TIMEOUT
# endif
#endif
1999-12-02 15:42:23 +08:00
#include "wget.h"
#include "host.h"
#include "connect.h"
1999-12-02 15:42:23 +08:00
#ifndef errno
extern int errno;
#endif
/* Variables shared by bindport and acceptport: */
/* Master (listening) socket created by bindport(); -1 while no such
   socket is open.  closeport() closes it and resets it to -1.  */
static int msock = -1;
/* Handed to accept() in acceptport() as the peer-address buffer.
   NOTE(review): no assignment to ADDR is visible in this part of the
   file, so it appears to stay NULL -- confirm.  */
static struct sockaddr *addr;
/* Local address to bind sockets to, filled in from opt.bind_address by
   resolve_bind_address().  Only meaningful while
   bind_address_resolved is non-zero.  */
static ip_address bind_address;
/* Non-zero once resolve_bind_address() has stored a result in
   bind_address.  */
static int bind_address_resolved;
/* Translate opt.bind_address into BIND_ADDRESS, caching the result.

   Does nothing when no bind address is configured (opt.bind_address
   is NULL) or when an earlier call already succeeded.  On a failed
   lookup a message is logged and bind_address_resolved stays zero, so
   callers carry on without a specific local address.  */
static void
resolve_bind_address (void)
{
  struct address_list *resolved;

  if (opt.bind_address == NULL || bind_address_resolved)
    return;

  resolved = lookup_host (opt.bind_address, 1);
  if (resolved == NULL)
    {
      logprintf (LOG_NOTQUIET,
                 _("Unable to convert `%s' to a bind address. Reverting to ANY.\n"),
                 opt.bind_address);
      return;
    }

  /* Keep only the first address of the list; the list itself is no
     longer needed afterwards.  */
  address_list_copy_one (resolved, 0, &bind_address);
  address_list_release (resolved);
  bind_address_resolved = 1;
}
#ifndef UNIX_CONNECT_TIMEOUT
/* Fallback used when UNIX_CONNECT_TIMEOUT is not defined: TIMEOUT
   cannot be enforced, so this is a plain connect().  Returns whatever
   connect() returns.  */
static int
connect_with_timeout (int fd, const struct sockaddr *addr, int addrlen,
                      int timeout)
{
  int status = connect (fd, addr, addrlen);

  (void) timeout;               /* Accepted for interface parity only.  */
  return status;
}
#else /* UNIX_CONNECT_TIMEOUT */
/* Implementation of connect with timeout. */
#ifdef HAVE_SIGSETJMP
/* Save the jump target together with the current signal mask (second
   argument 1), so that siglongjmp restores the mask when the handler
   below jumps out.  */
#define SETJMP(env) sigsetjmp (env, 1)
/* Jump target established by connect_with_timeout via SETJMP.  */
static sigjmp_buf abort_connect_env;
/* SIGALRM handler installed by connect_with_timeout: abandons the
   pending connect() by jumping back to the SETJMP point, which then
   sees the value -1.  The signal number argument is unused.  */
RETSIGTYPE
abort_connect (int ignored)
{
siglongjmp (abort_connect_env, -1);
}
#else /* not HAVE_SIGSETJMP */
#define SETJMP(env) setjmp (env)

/* Jump target established by connect_with_timeout via SETJMP.  */
static jmp_buf abort_connect_env;

/* SIGALRM handler for systems without sigsetjmp/siglongjmp.  Plain
   longjmp does not restore the set of blocked signals, so SIGALRM
   would stay blocked once we jump out of the handler.  Clear it from
   the mask by hand first, then jump back to the SETJMP point with the
   value -1.  The signal number argument is unused.  */
RETSIGTYPE
abort_connect (int ignored)
{
  sigsetmask (siggetmask () & ~sigmask (SIGALRM));
  longjmp (abort_connect_env, -1);
}
#endif /* not HAVE_SIGSETJMP */
/* Like connect, but specifies a timeout. If connecting takes longer
than TIMEOUT seconds, -1 is returned and errno is set to
ETIMEDOUT.

A TIMEOUT of 0 means no timeout: connect() is called directly.
Otherwise the timeout is implemented with alarm() and the SIGALRM
handler abort_connect, which jumps back to the SETJMP point below.
The SIGALRM disposition is reset to SIG_DFL on every return path that
installed the handler.  On a normal return, the result and errno are
those of connect().  */
static int
connect_with_timeout (int fd, const struct sockaddr *addr, int addrlen,
int timeout)
{
int result, saved_errno;
/* No timeout requested; skip the signal machinery entirely.  */
if (timeout == 0)
return connect (fd, addr, addrlen);
/* The handler must be installed and the jump target recorded before
the alarm is armed, so that a firing alarm always has somewhere to
jump to.  */
signal (SIGALRM, abort_connect);
if (SETJMP (abort_connect_env) != 0)
{
/* Longjumped out of connect with a timeout. */
signal (SIGALRM, SIG_DFL);
errno = ETIMEDOUT;
return -1;
}
alarm (timeout);
result = connect (fd, addr, addrlen);
saved_errno = errno; /* In case alarm() or signal() change
errno. */
/* connect() returned on its own: cancel the pending alarm before
removing the handler.  */
alarm (0);
signal (SIGALRM, SIG_DFL);
errno = saved_errno;
return result;
}
#endif /* UNIX_CONNECT_TIMEOUT */
/* A kludge, but still better than passing the host name all the way
   to connect_to_one.  */
static const char *connection_host_name;

/* Record HOST as the name connect_to_one shows next to the numeric
   address in its "Connecting to ..." message, or clear the recorded
   name when HOST is NULL.

   The pointer is stored as-is, not copied.  Calls must alternate:
   setting a name while one is already set, or clearing when none is
   set, trips an assertion.  */
void
set_connection_host_name (const char *host)
{
  if (host)
    assert (connection_host_name == NULL);
  else
    assert (connection_host_name != NULL);

  connection_host_name = host;
}
/* Connect to a remote host whose address has been resolved.

   Creates a stream socket in ip_default_family, binds its local end
   to the address obtained from opt.bind_address when one could be
   resolved, and connects it to ADDR:PORT via connect_with_timeout
   using opt.timeout.  Unless SILENT is non-zero, progress and the
   outcome are reported with logprintf.

   Returns the connected socket descriptor, or -1 on failure.  On
   failure errno is that of the call that failed (socket, bind or
   connect); it is saved before the socket is closed and before
   logging so that neither can overwrite it.  */
int
connect_to_one (ip_address *addr, unsigned short port, int silent)
{
  wget_sockaddr sa;
  int sock, save_errno;

  /* Set port and protocol */
  wget_sockaddr_set_address (&sa, ip_default_family, port, addr);

  if (!silent)
    {
      char *pretty_addr = pretty_print_address (addr);
      /* Show the host name too, unless it is just the numeric address
         spelled out.  */
      if (connection_host_name
          && 0 != strcmp (connection_host_name, pretty_addr))
        logprintf (LOG_VERBOSE, _("Connecting to %s[%s]:%hu... "),
                   connection_host_name, pretty_addr, port);
      else
        logprintf (LOG_VERBOSE, _("Connecting to %s:%hu... "),
                   pretty_addr, port);
    }

  /* Make an internet socket, stream type.  */
  sock = socket (ip_default_family, SOCK_STREAM, 0);
  if (sock < 0)
    goto fail;

  resolve_bind_address ();
  if (bind_address_resolved)
    {
      /* Bind the client side to the requested address.  */
      wget_sockaddr bsa;
      wget_sockaddr_set_address (&bsa, ip_default_family, 0, &bind_address);
      if (bind (sock, &bsa.sa, sockaddr_len ()))
        goto fail;
    }

  /* Connect the socket to the remote host.  */
  if (connect_with_timeout (sock, &sa.sa, sockaddr_len (), opt.timeout) < 0)
    goto fail;

  /* Success.  */
  if (!silent)
    logprintf (LOG_VERBOSE, _("connected.\n"));
  DEBUGP (("Created socket %d.\n", sock));
  return sock;

 fail:
  /* Capture errno first: closing the socket and logging may both
     change it, and the caller needs the original cause.  */
  save_errno = errno;
  if (sock >= 0)
    CLOSE (sock);               /* Same close macro as the rest of the file.  */
  if (!silent)
    logprintf (LOG_VERBOSE, "failed: %s.\n", strerror (save_errno));
  errno = save_errno;
  return -1;
}
/* Connect to the first reachable address in AL.

   Walks the index range reported by address_list_get_bounds and tries
   connect_to_one on each address in turn, passing PORT and SILENT
   through.  Every address that fails is marked with
   address_list_set_faulty.

   Returns the socket of the first successful connection, or -1 if no
   address could be connected to (including when the range is
   empty).  */
int
connect_to_many (struct address_list *al, unsigned short port, int silent)
{
  int i, start, end;

  address_list_get_bounds (al, &start, &end);
  for (i = start; i < end; i++)
    {
      ip_address addr;
      int sock;

      address_list_copy_one (al, i, &addr);
      sock = connect_to_one (&addr, port, silent);
      if (sock >= 0)
        /* Success.  */
        return sock;

      /* The attempt to connect has failed.  Remember that, continue
         with the loop and try the next address.  */
      address_list_set_faulty (al, i);
    }

  return -1;
}
/* Report whether the connection on SOCK still looks usable.

   With select() available, SOCK is polled for readability with a
   one-microsecond timeout.  A timeout (select returning 0) means the
   peer has neither sent data nor closed the connection, which is
   taken as "still open" and yields 1.  Any other select result
   yields 0.  The technique comes from Andrew Maholski's code in the
   Unix Socket FAQ.

   Without select() the function cannot tell and returns 1.  */
int
test_socket_open (int sock)
{
#ifdef HAVE_SELECT
  struct timeval tmout;
  fd_set readable;
  int ready;

  FD_ZERO (&readable);
  FD_SET (sock, &readable);

  /* Wait one microsecond.  */
  tmout.tv_sec = 0;
  tmout.tv_usec = 1;

  ready = select (sock + 1, &readable, NULL, NULL, &tmout);

  /* Only a timeout counts as a live (non-EOF) connection.  */
  return ready == 0;
#else
  /* Without select, it's hard to know for sure.  */
  return 1;
#endif
}
1999-12-02 15:42:23 +08:00
/* Bind the local port PORT. This does all the necessary work, which
is creating a socket, setting SO_REUSEADDR option on it, then
calling bind() and listen(). If *PORT is 0, a random port is
chosen by the system, and its value is stored to *PORT. The
internal variable MPORT is set to the value of the ensuing master
socket. Call acceptport() to block for and accept a connection. */
uerr_t
bindport (unsigned short *port, int family)
1999-12-02 15:42:23 +08:00
{
int optval = 1;
wget_sockaddr srv;
memset (&srv, 0, sizeof (wget_sockaddr));
1999-12-02 15:42:23 +08:00
msock = -1;
if ((msock = socket (family, SOCK_STREAM, 0)) < 0)
1999-12-02 15:42:23 +08:00
return CONSOCKERR;
if (setsockopt (msock, SOL_SOCKET, SO_REUSEADDR,
(char *)&optval, sizeof (optval)) < 0)
return CONSOCKERR;
resolve_bind_address ();
wget_sockaddr_set_address (&srv, ip_default_family, htons (*port),
bind_address_resolved ? &bind_address : NULL);
if (bind (msock, &srv.sa, sockaddr_len ()) < 0)
1999-12-02 15:42:23 +08:00
{
CLOSE (msock);
msock = -1;
return BINDERR;
}
DEBUGP (("Master socket fd %d bound.\n", msock));
if (!*port)
{
/* #### addrlen should be a 32-bit type, which int is not
guaranteed to be. Oh, and don't try to make it a size_t,
because that can be 64-bit. */
int sa_len = sockaddr_len ();
if (getsockname (msock, &srv.sa, &sa_len) < 0)
1999-12-02 15:42:23 +08:00
{
CLOSE (msock);
msock = -1;
return CONPORTERR;
}
*port = wget_sockaddr_get_port (&srv);
DEBUGP (("using port %i.\n", *port));
1999-12-02 15:42:23 +08:00
}
if (listen (msock, 1) < 0)
{
CLOSE (msock);
msock = -1;
return LISTENERR;
}
return BINDOK;
}
#ifdef HAVE_SELECT
/* Wait for file descriptor FD to be readable, MAXTIME being the
   timeout in seconds.  If WRITEP is non-zero, checks for FD being
   writable instead.  FD is also watched for exceptional conditions in
   both modes.

   Returns select()'s result unchanged: a positive count if FD is
   accessible, 0 for timeout and -1 for error in select().  A MAXTIME
   of 0 makes this a non-blocking poll.  */
int
select_fd (int fd, int maxtime, int writep)
{
  fd_set fds, exceptfds;
  struct timeval timeout;

  FD_ZERO (&fds);
  FD_SET (fd, &fds);
  FD_ZERO (&exceptfds);
  FD_SET (fd, &exceptfds);

  timeout.tv_sec = maxtime;
  timeout.tv_usec = 0;

  /* HPUX reportedly warns here.  What is the correct incantation?  */
  return select (fd + 1, writep ? NULL : &fds, writep ? &fds : NULL,
                 &exceptfds, &timeout);
}
#endif /* HAVE_SELECT */
/* Call accept() on MSOCK and store the result to *SOCK. This assumes
that bindport() has been used to initialize MSOCK to a correct
value. It blocks the caller until a connection is established. If
no connection is established for OPT.TIMEOUT seconds, the function
exits with an error status. */
uerr_t
acceptport (int *sock)
{
int addrlen = sockaddr_len ();
1999-12-02 15:42:23 +08:00
#ifdef HAVE_SELECT
if (select_fd (msock, opt.timeout, 0) <= 0)
return ACCEPTERR;
#endif
if ((*sock = accept (msock, addr, &addrlen)) < 0)
return ACCEPTERR;
DEBUGP (("Created socket fd %d.\n", *sock));
return ACCEPTOK;
}
/* Close SOCK together with the master socket MSOCK remembered from
   bindport().  Pass -1 as SOCK to close MSOCK only.  MSOCK is -1 when
   this returns.  No shutdown() is performed on either socket.  */
void
closeport (int sock)
{
  if (sock != -1)
    CLOSE (sock);

  if (msock != -1)
    {
      CLOSE (msock);
      msock = -1;
    }
}
/* Return the local IP address associated with the connection on FD.

   The address is fetched with getsockname() and stored in *IP.  An
   IPv4 address is converted with map_ipv4_to_ip.  With INET6 defined,
   an IPv6 address is copied verbatim.

   Returns 1 on success and 0 if getsockname() fails.  An address
   family other than the ones handled here is treated as a programming
   error and aborts.  */
int
conaddr (int fd, ip_address *ip)
{
  wget_sockaddr mysrv;

  /* see bindport() for discussion of using `int' here. */
  int addrlen = sizeof (mysrv);

  if (getsockname (fd, &mysrv.sa, &addrlen) < 0)
    return 0;

  switch (mysrv.sa.sa_family)
    {
#ifdef INET6
    case AF_INET6:
      memcpy (ip, &mysrv.sin6.sin6_addr, sizeof (mysrv.sin6.sin6_addr));
      return 1;
#endif
    case AF_INET:
      map_ipv4_to_ip ((ip4_address *)&mysrv.sin.sin_addr, ip);
      return 1;
    default:
      abort ();
    }

  /* Not reached; keeps compilers that don't know abort() never
     returns from complaining.  */
  return 0;
}
/* Read at most LEN bytes from FD into BUF.  Behaves like read(),
   except that reads interrupted by a signal (EINTR) are retried and,
   when select() is available and OPT.TIMEOUT is non-zero, each
   attempt first waits up to OPT.TIMEOUT seconds for FD to become
   readable so that stale connections time out.

   Returns the result of the read, or -1 on error.  When the wait
   times out, -1 is returned with errno set to ETIMEDOUT.  */
int
iread (int fd, char *buf, int len)
{
  int nread;

  for (;;)
    {
#ifdef HAVE_SELECT
      if (opt.timeout)
        {
          int ready;

          /* An interrupted select is simply restarted.  */
          do
            ready = select_fd (fd, opt.timeout, 0);
          while (ready == -1 && errno == EINTR);

          if (ready == 0)
            {
              /* Timed out.  #### Setting errno by hand is
                 potentially evil!  */
              errno = ETIMEDOUT;
              return -1;
            }
          if (ready < 0)
            return -1;
        }
#endif
      nread = READ (fd, buf, len);

      /* Anything but an interrupted read is final.  */
      if (nread != -1 || errno != EINTR)
        return nread;
    }
}
/* Write LEN bytes from BUF to FD.  Unlike iread(), this keeps going
   until all of BUF has been written, so callers needn't compare the
   return value against LEN; they should simply check for -1.

   Each write attempt is retried when interrupted by a signal (EINTR).
   When select() is available and OPT.TIMEOUT is non-zero, each
   attempt is preceded by a wait of up to OPT.TIMEOUT seconds for FD
   to become writable.  A timed-out wait returns -1 with errno set to
   ETIMEDOUT.

   The return value is the result of the last write performed (0 if
   LEN was not positive), or -1 on error.  */
int
iwrite (int fd, char *buf, int len)
{
  int last = 0;

  /* `write' may accept fewer than LEN bytes, so keep feeding it the
     remainder until nothing is left or it fails.  */
  while (len > 0)
    {
      /* One write attempt, restarted for as long as it is merely
         interrupted.  */
      for (;;)
        {
#ifdef HAVE_SELECT
          if (opt.timeout)
            {
              int ready;

              do
                ready = select_fd (fd, opt.timeout, 1);
              while (ready == -1 && errno == EINTR);

              if (ready == 0)
                {
                  /* Timed out.  #### Setting errno by hand is
                     potentially evil!  */
                  errno = ETIMEDOUT;
                  return -1;
                }
              if (ready < 0)
                return -1;
            }
#endif
          last = WRITE (fd, buf, len);
          if (last != -1 || errno != EINTR)
            break;
        }

      if (last <= 0)
        return last;

      buf += last;
      len -= last;
    }

  return last;
}