mirror of
https://github.com/mirror/wget.git
synced 2025-01-22 18:21:03 +08:00
711bf72609
for handling VERY_LONG_TYPE overflows. Make opt.quota a LARGE_INT.
1841 lines
50 KiB
C
1841 lines
50 KiB
C
/* File Transfer Protocol support.
|
|
Copyright (C) 1995, 1996, 1997, 1998, 2000, 2001
|
|
Free Software Foundation, Inc.
|
|
|
|
This file is part of GNU Wget.
|
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with Wget; if not, write to the Free Software
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
In addition, as a special exception, the Free Software Foundation
|
|
gives permission to link the code of its release of Wget with the
|
|
OpenSSL project's "OpenSSL" library (or with modified versions of it
|
|
that use the same license as the "OpenSSL" library), and distribute
|
|
the linked executables. You must obey the GNU General Public License
|
|
in all respects for all of the code used other than "OpenSSL". If you
|
|
modify this file, you may extend this exception to your version of the
|
|
file, but you are not obligated to do so. If you do not wish to do
|
|
so, delete this exception statement from your version. */
|
|
|
|
#include <config.h>
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#ifdef HAVE_STRING_H
|
|
# include <string.h>
|
|
#else
|
|
# include <strings.h>
|
|
#endif
|
|
#ifdef HAVE_UNISTD_H
|
|
# include <unistd.h>
|
|
#endif
|
|
#include <sys/types.h>
|
|
#include <assert.h>
|
|
#include <errno.h>
|
|
|
|
#include "wget.h"
|
|
#include "utils.h"
|
|
#include "url.h"
|
|
#include "rbuf.h"
|
|
#include "retr.h"
|
|
#include "ftp.h"
|
|
#include "connect.h"
|
|
#include "host.h"
|
|
#include "netrc.h"
|
|
#include "convert.h" /* for downloaded_file */
|
|
|
|
#ifndef errno
|
|
extern int errno;
|
|
#endif
|
|
|
|
extern LARGE_INT total_downloaded_bytes;
|
|
|
|
/* File where the "ls -al" listing will be saved. */
|
|
#define LIST_FILENAME ".listing"
|
|
|
|
extern char ftp_last_respline[];
|
|
|
|
typedef struct
|
|
{
|
|
int st; /* connection status */
|
|
int cmd; /* command code */
|
|
struct rbuf rbuf; /* control connection buffer */
|
|
double dltime; /* time of the download in msecs */
|
|
enum stype rs; /* remote system reported by ftp server */
|
|
char *id; /* initial directory */
|
|
char *target; /* target file name */
|
|
struct url *proxy; /* FTWK-style proxy */
|
|
} ccon;
|
|
|
|
|
|
/* Look for regexp "( *[0-9]+ *byte" (literal parenthesis) anywhere in
|
|
the string S, and return the number converted to long, if found, 0
|
|
otherwise. */
|
|
static long
|
|
ftp_expected_bytes (const char *s)
|
|
{
|
|
long res;
|
|
|
|
while (1)
|
|
{
|
|
while (*s && *s != '(')
|
|
++s;
|
|
if (!*s)
|
|
return 0;
|
|
for (++s; *s && ISSPACE (*s); s++);
|
|
if (!*s)
|
|
return 0;
|
|
if (!ISDIGIT (*s))
|
|
continue;
|
|
res = 0;
|
|
do
|
|
{
|
|
res = (*s - '0') + 10 * res;
|
|
++s;
|
|
}
|
|
while (*s && ISDIGIT (*s));
|
|
if (!*s)
|
|
return 0;
|
|
while (*s && ISSPACE (*s))
|
|
++s;
|
|
if (!*s)
|
|
return 0;
|
|
if (TOLOWER (*s) != 'b')
|
|
continue;
|
|
if (strncasecmp (s, "byte", 4))
|
|
continue;
|
|
else
|
|
break;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
/* Retrieves a file with denoted parameters through opening an FTP
|
|
connection to the server. It always closes the data connection,
|
|
and closes the control connection in case of error. */
|
|
static uerr_t
|
|
getftp (struct url *u, long *len, long restval, ccon *con)
|
|
{
|
|
int csock, dtsock, res;
|
|
uerr_t err;
|
|
FILE *fp;
|
|
char *user, *passwd, *respline;
|
|
char *tms, *tmrate;
|
|
int cmd = con->cmd;
|
|
int pasv_mode_open = 0;
|
|
long expected_bytes = 0L;
|
|
|
|
assert (con != NULL);
|
|
assert (con->target != NULL);
|
|
|
|
/* Debug-check of the sanity of the request by making sure that LIST
|
|
and RETR are never both requested (since we can handle only one
|
|
at a time. */
|
|
assert (!((cmd & DO_LIST) && (cmd & DO_RETR)));
|
|
/* Make sure that at least *something* is requested. */
|
|
assert ((cmd & (DO_LIST | DO_CWD | DO_RETR | DO_LOGIN)) != 0);
|
|
|
|
user = u->user;
|
|
passwd = u->passwd;
|
|
search_netrc (u->host, (const char **)&user, (const char **)&passwd, 1);
|
|
user = user ? user : opt.ftp_acc;
|
|
passwd = passwd ? passwd : opt.ftp_pass;
|
|
assert (user && passwd);
|
|
|
|
dtsock = -1;
|
|
con->dltime = 0;
|
|
|
|
if (!(cmd & DO_LOGIN))
|
|
csock = RBUF_FD (&con->rbuf);
|
|
else /* cmd & DO_LOGIN */
|
|
{
|
|
char type_char;
|
|
struct address_list *al;
|
|
|
|
char *host = con->proxy ? con->proxy->host : u->host;
|
|
int port = con->proxy ? con->proxy->port : u->port;
|
|
char *logname = user;
|
|
|
|
if (con->proxy)
|
|
{
|
|
/* If proxy is in use, log in as username@target-site. */
|
|
logname = xmalloc (strlen (user) + 1 + strlen (u->host) + 1);
|
|
sprintf (logname, "%s@%s", user, u->host);
|
|
}
|
|
|
|
/* Login to the server: */
|
|
|
|
/* First: Establish the control connection. */
|
|
|
|
al = lookup_host (host, 0);
|
|
if (!al)
|
|
return HOSTERR;
|
|
set_connection_host_name (host);
|
|
csock = connect_to_many (al, port, 0);
|
|
set_connection_host_name (NULL);
|
|
address_list_release (al);
|
|
|
|
if (csock < 0)
|
|
return CONNECT_ERROR (errno);
|
|
|
|
if (cmd & LEAVE_PENDING)
|
|
rbuf_initialize (&con->rbuf, csock);
|
|
else
|
|
rbuf_uninitialize (&con->rbuf);
|
|
|
|
/* Since this is a new connection, we may safely discard
|
|
anything left in the buffer. */
|
|
rbuf_discard (&con->rbuf);
|
|
|
|
/* Second: Login with proper USER/PASS sequence. */
|
|
logprintf (LOG_VERBOSE, _("Logging in as %s ... "), user);
|
|
if (opt.server_response)
|
|
logputs (LOG_ALWAYS, "\n");
|
|
err = ftp_login (&con->rbuf, logname, passwd);
|
|
|
|
if (con->proxy)
|
|
xfree (logname);
|
|
|
|
/* FTPRERR, FTPSRVERR, WRITEFAILED, FTPLOGREFUSED, FTPLOGINC */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPSRVERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("Error in server greeting.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPLOGREFUSED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("The server refuses login.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return FTPLOGREFUSED;
|
|
break;
|
|
case FTPLOGINC:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("Login incorrect.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return FTPLOGINC;
|
|
break;
|
|
case FTPOK:
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("Logged in!\n"));
|
|
break;
|
|
default:
|
|
abort ();
|
|
exit (1);
|
|
break;
|
|
}
|
|
/* Third: Get the system type */
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> SYST ... ");
|
|
err = ftp_syst (&con->rbuf, &con->rs);
|
|
/* FTPRERR */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPSRVERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Server error, can't determine system type.\n"));
|
|
break;
|
|
case FTPOK:
|
|
/* Everything is OK. */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (!opt.server_response && err != FTPSRVERR)
|
|
logputs (LOG_VERBOSE, _("done. "));
|
|
|
|
/* Fourth: Find the initial ftp directory */
|
|
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> PWD ... ");
|
|
err = ftp_pwd(&con->rbuf, &con->id);
|
|
/* FTPRERR */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPSRVERR :
|
|
/* PWD unsupported -- assume "/". */
|
|
FREE_MAYBE (con->id);
|
|
con->id = xstrdup ("/");
|
|
break;
|
|
case FTPOK:
|
|
/* Everything is OK. */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
/* VMS will report something like "PUB$DEVICE:[INITIAL.FOLDER]".
|
|
Convert it to "/INITIAL/FOLDER" */
|
|
if (con->rs == ST_VMS)
|
|
{
|
|
char *path = strchr (con->id, '[');
|
|
char *pathend = path ? strchr (path + 1, ']') : NULL;
|
|
if (!path || !pathend)
|
|
DEBUGP (("Initial VMS directory not in the form [...]!\n"));
|
|
else
|
|
{
|
|
char *idir = con->id;
|
|
DEBUGP (("Preprocessing the initial VMS directory\n"));
|
|
DEBUGP ((" old = '%s'\n", con->id));
|
|
/* We do the conversion in-place by copying the stuff
|
|
between [ and ] to the beginning, and changing dots
|
|
to slashes at the same time. */
|
|
*idir++ = '/';
|
|
for (++path; path < pathend; path++, idir++)
|
|
*idir = *path == '.' ? '/' : *path;
|
|
*idir = '\0';
|
|
DEBUGP ((" new = '%s'\n\n", con->id));
|
|
}
|
|
}
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done.\n"));
|
|
|
|
/* Fifth: Set the FTP type. */
|
|
type_char = ftp_process_type (u->params);
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> TYPE %c ... ", type_char);
|
|
err = ftp_type (&con->rbuf, type_char);
|
|
/* FTPRERR, WRITEFAILED, FTPUNKNOWNTYPE */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPUNKNOWNTYPE:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET,
|
|
_("Unknown type `%c', closing control connection.\n"),
|
|
type_char);
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
case FTPOK:
|
|
/* Everything is OK. */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done. "));
|
|
} /* do login */
|
|
|
|
if (cmd & DO_CWD)
|
|
{
|
|
if (!*u->dir)
|
|
logputs (LOG_VERBOSE, _("==> CWD not needed.\n"));
|
|
else
|
|
{
|
|
char *target = u->dir;
|
|
|
|
DEBUGP (("changing working directory\n"));
|
|
|
|
/* Change working directory. To change to a non-absolute
|
|
Unix directory, we need to prepend initial directory
|
|
(con->id) to it. Absolute directories "just work".
|
|
|
|
A relative directory is one that does not begin with '/'
|
|
and, on non-Unix OS'es, one that doesn't begin with
|
|
"[a-z]:".
|
|
|
|
This is not done for OS400, which doesn't use
|
|
"/"-delimited directories, nor does it support directory
|
|
hierarchies. "CWD foo" followed by "CWD bar" leaves us
|
|
in "bar", not in "foo/bar", as would be customary
|
|
elsewhere. */
|
|
|
|
if (target[0] != '/'
|
|
&& !(con->rs != ST_UNIX
|
|
&& ISALPHA (target[0])
|
|
&& target[1] == ':')
|
|
&& con->rs != ST_OS400)
|
|
{
|
|
int idlen = strlen (con->id);
|
|
char *ntarget, *p;
|
|
|
|
/* Strip trailing slash(es) from con->id. */
|
|
while (idlen > 0 && con->id[idlen - 1] == '/')
|
|
--idlen;
|
|
p = ntarget = (char *)alloca (idlen + 1 + strlen (u->dir) + 1);
|
|
memcpy (p, con->id, idlen);
|
|
p += idlen;
|
|
*p++ = '/';
|
|
strcpy (p, target);
|
|
|
|
DEBUGP (("Prepended initial PWD to relative path:\n"));
|
|
DEBUGP ((" pwd: '%s'\n old: '%s'\n new: '%s'\n",
|
|
con->id, target, ntarget));
|
|
target = ntarget;
|
|
}
|
|
|
|
/* If the FTP host runs VMS, we will have to convert the absolute
|
|
directory path in UNIX notation to absolute directory path in
|
|
VMS notation as VMS FTP servers do not like UNIX notation of
|
|
absolute paths. "VMS notation" is [dir.subdir.subsubdir]. */
|
|
|
|
if (con->rs == ST_VMS)
|
|
{
|
|
char *tmpp;
|
|
char *ntarget = (char *)alloca (strlen (target) + 2);
|
|
/* We use a converted initial dir, so directories in
|
|
TARGET will be separated with slashes, something like
|
|
"/INITIAL/FOLDER/DIR/SUBDIR". Convert that to
|
|
"[INITIAL.FOLDER.DIR.SUBDIR]". */
|
|
strcpy (ntarget, target);
|
|
assert (*ntarget == '/');
|
|
*ntarget = '[';
|
|
for (tmpp = ntarget + 1; *tmpp; tmpp++)
|
|
if (*tmpp == '/')
|
|
*tmpp = '.';
|
|
*tmpp++ = ']';
|
|
*tmpp = '\0';
|
|
DEBUGP (("Changed file name to VMS syntax:\n"));
|
|
DEBUGP ((" Unix: '%s'\n VMS: '%s'\n", target, ntarget));
|
|
target = ntarget;
|
|
}
|
|
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> CWD %s ... ", target);
|
|
err = ftp_cwd (&con->rbuf, target);
|
|
/* FTPRERR, WRITEFAILED, FTPNSFOD */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPNSFOD:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET, _("No such directory `%s'.\n\n"),
|
|
u->dir);
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done.\n"));
|
|
}
|
|
}
|
|
else /* do not CWD */
|
|
logputs (LOG_VERBOSE, _("==> CWD not required.\n"));
|
|
|
|
if ((cmd & DO_RETR) && restval && *len == 0)
|
|
{
|
|
if (opt.verbose)
|
|
{
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> SIZE %s ... ", u->file);
|
|
}
|
|
|
|
err = ftp_size(&con->rbuf, u->file, len);
|
|
/* FTPRERR */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
case FTPSRVERR :
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPOK:
|
|
/* Everything is OK. */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done.\n"));
|
|
}
|
|
|
|
/* If anything is to be retrieved, PORT (or PASV) must be sent. */
|
|
if (cmd & (DO_LIST | DO_RETR))
|
|
{
|
|
if (opt.ftp_pasv > 0)
|
|
{
|
|
ip_address passive_addr;
|
|
unsigned short passive_port;
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, "==> PASV ... ");
|
|
err = ftp_pasv (&con->rbuf, &passive_addr, &passive_port);
|
|
/* FTPRERR, WRITEFAILED, FTPNOPASV, FTPINVPASV */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPNOPASV:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("Cannot initiate PASV transfer.\n"));
|
|
break;
|
|
case FTPINVPASV:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("Cannot parse PASV response.\n"));
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
} /* switch(err) */
|
|
if (err==FTPOK)
|
|
{
|
|
dtsock = connect_to_one (&passive_addr, passive_port, 1);
|
|
if (dtsock < 0)
|
|
{
|
|
int save_errno = errno;
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
logprintf (LOG_VERBOSE, _("couldn't connect to %s:%hu: %s\n"),
|
|
pretty_print_address (&passive_addr), passive_port,
|
|
strerror (save_errno));
|
|
return CONNECT_ERROR (save_errno);
|
|
}
|
|
|
|
pasv_mode_open = 1; /* Flag to avoid accept port */
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done. "));
|
|
} /* err==FTP_OK */
|
|
}
|
|
|
|
if (!pasv_mode_open) /* Try to use a port command if PASV failed */
|
|
{
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, "==> PORT ... ");
|
|
err = ftp_port (&con->rbuf);
|
|
/* FTPRERR, WRITEFAILED, bindport (CONSOCKERR, CONPORTERR, BINDERR,
|
|
LISTENERR), HOSTERR, FTPPORTERR */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case CONSOCKERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET, "socket: %s\n", strerror (errno));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case CONPORTERR: case BINDERR: case LISTENERR:
|
|
/* What now? These problems are local... */
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET, _("Bind error (%s).\n"),
|
|
strerror (errno));
|
|
closeport (dtsock);
|
|
return err;
|
|
break;
|
|
case FTPPORTERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("Invalid PORT.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
} /* port switch */
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done. "));
|
|
} /* dtsock == -1 */
|
|
} /* cmd & (DO_LIST | DO_RETR) */
|
|
|
|
/* Restart if needed. */
|
|
if (restval && (cmd & DO_RETR))
|
|
{
|
|
if (!opt.server_response)
|
|
logprintf (LOG_VERBOSE, "==> REST %ld ... ", restval);
|
|
err = ftp_rest (&con->rbuf, restval);
|
|
|
|
/* FTPRERR, WRITEFAILED, FTPRESTFAIL */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPRESTFAIL:
|
|
/* If `-c' is specified and the file already existed when
|
|
Wget was started, it would be a bad idea for us to start
|
|
downloading it from scratch, effectively truncating it. */
|
|
if (opt.always_rest && (cmd & NO_TRUNCATE))
|
|
{
|
|
logprintf (LOG_NOTQUIET,
|
|
_("\nREST failed; will not truncate `%s'.\n"),
|
|
con->target);
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return CONTNOTSUPPORTED;
|
|
}
|
|
logputs (LOG_VERBOSE, _("\nREST failed, starting from scratch.\n"));
|
|
restval = 0L;
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (err != FTPRESTFAIL && !opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done. "));
|
|
} /* restval && cmd & DO_RETR */
|
|
|
|
if (cmd & DO_RETR)
|
|
{
|
|
/* If we're in spider mode, don't really retrieve anything. The
|
|
fact that we got to this point should be proof enough that
|
|
the file exists, vaguely akin to HTTP's concept of a "HEAD"
|
|
request. */
|
|
if (opt.spider)
|
|
{
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return RETRFINISHED;
|
|
}
|
|
|
|
if (opt.verbose)
|
|
{
|
|
if (!opt.server_response)
|
|
{
|
|
if (restval)
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_VERBOSE, "==> RETR %s ... ", u->file);
|
|
}
|
|
}
|
|
err = ftp_retr (&con->rbuf, u->file);
|
|
/* FTPRERR, WRITEFAILED, FTPNSFOD */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPNSFOD:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET, _("No such file `%s'.\n\n"), u->file);
|
|
closeport (dtsock);
|
|
return err;
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done.\n"));
|
|
expected_bytes = ftp_expected_bytes (ftp_last_respline);
|
|
} /* do retrieve */
|
|
|
|
if (cmd & DO_LIST)
|
|
{
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, "==> LIST ... ");
|
|
/* As Maciej W. Rozycki (macro@ds2.pg.gda.pl) says, `LIST'
|
|
without arguments is better than `LIST .'; confirmed by
|
|
RFC959. */
|
|
err = ftp_list (&con->rbuf, NULL);
|
|
/* FTPRERR, WRITEFAILED */
|
|
switch (err)
|
|
{
|
|
case FTPRERR:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET, _("\
|
|
Error in server response, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case WRITEFAILED:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logputs (LOG_NOTQUIET,
|
|
_("Write failed, closing control connection.\n"));
|
|
CLOSE (csock);
|
|
closeport (dtsock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return err;
|
|
break;
|
|
case FTPNSFOD:
|
|
logputs (LOG_VERBOSE, "\n");
|
|
logprintf (LOG_NOTQUIET, _("No such file or directory `%s'.\n\n"),
|
|
".");
|
|
closeport (dtsock);
|
|
return err;
|
|
break;
|
|
case FTPOK:
|
|
/* fine and dandy */
|
|
break;
|
|
default:
|
|
abort ();
|
|
break;
|
|
}
|
|
if (!opt.server_response)
|
|
logputs (LOG_VERBOSE, _("done.\n"));
|
|
expected_bytes = ftp_expected_bytes (ftp_last_respline);
|
|
} /* cmd & DO_LIST */
|
|
|
|
if (!(cmd & (DO_LIST | DO_RETR)) || (opt.spider && !(cmd & DO_LIST)))
|
|
return RETRFINISHED;
|
|
|
|
/* Some FTP servers return the total length of file after REST
|
|
command, others just return the remaining size. */
|
|
if (*len && restval && expected_bytes
|
|
&& (expected_bytes == *len - restval))
|
|
{
|
|
DEBUGP (("Lying FTP server found, adjusting.\n"));
|
|
expected_bytes = *len;
|
|
}
|
|
|
|
/* If no transmission was required, then everything is OK. */
|
|
if (!pasv_mode_open) /* we are not using pasive mode so we need
|
|
to accept */
|
|
{
|
|
/* Open the data transmission socket by calling acceptport(). */
|
|
err = acceptport (&dtsock);
|
|
/* Possible errors: ACCEPTERR. */
|
|
if (err == ACCEPTERR)
|
|
{
|
|
logprintf (LOG_NOTQUIET, "accept: %s\n", strerror (errno));
|
|
return err;
|
|
}
|
|
}
|
|
|
|
/* Open the file -- if opt.dfp is set, use it instead. */
|
|
if (!opt.dfp || con->cmd & DO_LIST)
|
|
{
|
|
mkalldirs (con->target);
|
|
if (opt.backups)
|
|
rotate_backups (con->target);
|
|
/* #### Is this correct? */
|
|
chmod (con->target, 0600);
|
|
|
|
fp = fopen (con->target, restval ? "ab" : "wb");
|
|
if (!fp)
|
|
{
|
|
logprintf (LOG_NOTQUIET, "%s: %s\n", con->target, strerror (errno));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
closeport (dtsock);
|
|
return FOPENERR;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
extern int global_download_count;
|
|
fp = opt.dfp;
|
|
|
|
/* Rewind the output document if the download starts over and if
|
|
this is the first download. See gethttp() for a longer
|
|
explanation. */
|
|
if (!restval && global_download_count == 0 && opt.dfp != stdout)
|
|
{
|
|
/* This will silently fail for streams that don't correspond
|
|
to regular files, but that's OK. */
|
|
rewind (fp);
|
|
/* ftruncate is needed because opt.dfp is opened in append
|
|
mode if opt.always_rest is set. */
|
|
ftruncate (fileno (fp), 0);
|
|
clearerr (fp);
|
|
}
|
|
}
|
|
|
|
if (*len)
|
|
{
|
|
logprintf (LOG_VERBOSE, _("Length: %s"), legible (*len));
|
|
if (restval)
|
|
logprintf (LOG_VERBOSE, _(" [%s to go]"), legible (*len - restval));
|
|
logputs (LOG_VERBOSE, "\n");
|
|
expected_bytes = *len; /* for get_contents/show_progress */
|
|
}
|
|
else if (expected_bytes)
|
|
{
|
|
logprintf (LOG_VERBOSE, _("Length: %s"), legible (expected_bytes));
|
|
if (restval)
|
|
logprintf (LOG_VERBOSE, _(" [%s to go]"),
|
|
legible (expected_bytes - restval));
|
|
logputs (LOG_VERBOSE, _(" (unauthoritative)\n"));
|
|
}
|
|
|
|
/* Get the contents of the document. */
|
|
res = get_contents (dtsock, fp, len, restval, expected_bytes, &con->rbuf,
|
|
0, &con->dltime);
|
|
tms = time_str (NULL);
|
|
tmrate = retr_rate (*len - restval, con->dltime, 0);
|
|
/* Close data connection socket. */
|
|
closeport (dtsock);
|
|
/* Close the local file. */
|
|
{
|
|
/* Close or flush the file. We have to be careful to check for
|
|
error here. Checking the result of fwrite() is not enough --
|
|
errors could go unnoticed! */
|
|
int flush_res;
|
|
if (!opt.dfp || con->cmd & DO_LIST)
|
|
flush_res = fclose (fp);
|
|
else
|
|
flush_res = fflush (fp);
|
|
if (flush_res == EOF)
|
|
res = -2;
|
|
}
|
|
/* If get_contents couldn't write to fp, bail out. */
|
|
if (res == -2)
|
|
{
|
|
logprintf (LOG_NOTQUIET, _("%s: %s, closing control connection.\n"),
|
|
con->target, strerror (errno));
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return FWRITEERR;
|
|
}
|
|
else if (res == -1)
|
|
{
|
|
logprintf (LOG_NOTQUIET, _("%s (%s) - Data connection: %s; "),
|
|
tms, tmrate, strerror (errno));
|
|
if (opt.server_response)
|
|
logputs (LOG_ALWAYS, "\n");
|
|
}
|
|
|
|
/* Get the server to tell us if everything is retrieved. */
|
|
err = ftp_response (&con->rbuf, &respline);
|
|
/* ...and empty the buffer. */
|
|
rbuf_discard (&con->rbuf);
|
|
if (err != FTPOK)
|
|
{
|
|
xfree (respline);
|
|
/* The control connection is decidedly closed. Print the time
|
|
only if it hasn't already been printed. */
|
|
if (res != -1)
|
|
logprintf (LOG_NOTQUIET, "%s (%s) - ", tms, tmrate);
|
|
logputs (LOG_NOTQUIET, _("Control connection closed.\n"));
|
|
/* If there is an error on the control connection, close it, but
|
|
return FTPRETRINT, since there is a possibility that the
|
|
whole file was retrieved nevertheless (but that is for
|
|
ftp_loop_internal to decide). */
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
return FTPRETRINT;
|
|
} /* err != FTPOK */
|
|
/* If retrieval failed for any reason, return FTPRETRINT, but do not
|
|
close socket, since the control connection is still alive. If
|
|
there is something wrong with the control connection, it will
|
|
become apparent later. */
|
|
if (*respline != '2')
|
|
{
|
|
xfree (respline);
|
|
if (res != -1)
|
|
logprintf (LOG_NOTQUIET, "%s (%s) - ", tms, tmrate);
|
|
logputs (LOG_NOTQUIET, _("Data transfer aborted.\n"));
|
|
return FTPRETRINT;
|
|
}
|
|
xfree (respline);
|
|
|
|
if (res == -1)
|
|
{
|
|
/* What now? The data connection was erroneous, whereas the
|
|
response says everything is OK. We shall play it safe. */
|
|
return FTPRETRINT;
|
|
}
|
|
|
|
if (!(cmd & LEAVE_PENDING))
|
|
{
|
|
/* I should probably send 'QUIT' and check for a reply, but this
|
|
is faster. #### Is it OK, though? */
|
|
CLOSE (csock);
|
|
rbuf_uninitialize (&con->rbuf);
|
|
}
|
|
/* If it was a listing, and opt.server_response is true,
|
|
print it out. */
|
|
if (opt.server_response && (con->cmd & DO_LIST))
|
|
{
|
|
mkalldirs (con->target);
|
|
fp = fopen (con->target, "r");
|
|
if (!fp)
|
|
logprintf (LOG_ALWAYS, "%s: %s\n", con->target, strerror (errno));
|
|
else
|
|
{
|
|
char *line;
|
|
/* The lines are being read with read_whole_line because of
|
|
no-buffering on opt.lfile. */
|
|
while ((line = read_whole_line (fp)))
|
|
{
|
|
logprintf (LOG_ALWAYS, "%s\n", line);
|
|
xfree (line);
|
|
}
|
|
fclose (fp);
|
|
}
|
|
} /* con->cmd & DO_LIST && server_response */
|
|
|
|
return RETRFINISHED;
|
|
}
|
|
|
|
/* A one-file FTP loop. This is the part where FTP retrieval is
|
|
retried, and retried, and retried, and...
|
|
|
|
This loop either gets commands from con, or (if ON_YOUR_OWN is
|
|
set), makes them up to retrieve the file given by the URL. */
|
|
static uerr_t
|
|
ftp_loop_internal (struct url *u, struct fileinfo *f, ccon *con)
|
|
{
|
|
int count, orig_lp;
|
|
long restval, len;
|
|
char *tms, *locf;
|
|
char *tmrate = NULL;
|
|
uerr_t err;
|
|
struct stat st;
|
|
|
|
if (!con->target)
|
|
con->target = url_file_name (u);
|
|
|
|
if (opt.noclobber && file_exists_p (con->target))
|
|
{
|
|
logprintf (LOG_VERBOSE,
|
|
_("File `%s' already there, not retrieving.\n"), con->target);
|
|
/* If the file is there, we suppose it's retrieved OK. */
|
|
return RETROK;
|
|
}
|
|
|
|
/* Remove it if it's a link. */
|
|
remove_link (con->target);
|
|
if (!opt.output_document)
|
|
locf = con->target;
|
|
else
|
|
locf = opt.output_document;
|
|
|
|
count = 0;
|
|
|
|
if (con->st & ON_YOUR_OWN)
|
|
con->st = ON_YOUR_OWN;
|
|
|
|
orig_lp = con->cmd & LEAVE_PENDING ? 1 : 0;
|
|
|
|
/* THE loop. */
|
|
do
|
|
{
|
|
/* Increment the pass counter. */
|
|
++count;
|
|
sleep_between_retrievals (count);
|
|
if (con->st & ON_YOUR_OWN)
|
|
{
|
|
con->cmd = 0;
|
|
con->cmd |= (DO_RETR | LEAVE_PENDING);
|
|
if (rbuf_initialized_p (&con->rbuf))
|
|
con->cmd &= ~ (DO_LOGIN | DO_CWD);
|
|
else
|
|
con->cmd |= (DO_LOGIN | DO_CWD);
|
|
}
|
|
else /* not on your own */
|
|
{
|
|
if (rbuf_initialized_p (&con->rbuf))
|
|
con->cmd &= ~DO_LOGIN;
|
|
else
|
|
con->cmd |= DO_LOGIN;
|
|
if (con->st & DONE_CWD)
|
|
con->cmd &= ~DO_CWD;
|
|
else
|
|
con->cmd |= DO_CWD;
|
|
}
|
|
|
|
/* Assume no restarting. */
|
|
restval = 0L;
|
|
if ((count > 1 || opt.always_rest)
|
|
&& !(con->cmd & DO_LIST)
|
|
&& file_exists_p (locf))
|
|
if (stat (locf, &st) == 0 && S_ISREG (st.st_mode))
|
|
restval = st.st_size;
|
|
|
|
/* In `-c' is used, check whether the file we're writing to
|
|
exists and is of non-zero length. If so, we'll refuse to
|
|
truncate it if the server doesn't support continued
|
|
downloads. */
|
|
if (opt.always_rest && restval > 0)
|
|
con->cmd |= NO_TRUNCATE;
|
|
|
|
/* Get the current time string. */
|
|
tms = time_str (NULL);
|
|
/* Print fetch message, if opt.verbose. */
|
|
if (opt.verbose)
|
|
{
|
|
char *hurl = url_string (u, 1);
|
|
char tmp[15];
|
|
strcpy (tmp, " ");
|
|
if (count > 1)
|
|
sprintf (tmp, _("(try:%2d)"), count);
|
|
logprintf (LOG_VERBOSE, "--%s-- %s\n %s => `%s'\n",
|
|
tms, hurl, tmp, locf);
|
|
#ifdef WINDOWS
|
|
ws_changetitle (hurl, 1);
|
|
#endif
|
|
xfree (hurl);
|
|
}
|
|
/* Send getftp the proper length, if fileinfo was provided. */
|
|
if (f)
|
|
len = f->size;
|
|
else
|
|
len = 0;
|
|
err = getftp (u, &len, restval, con);
|
|
|
|
if (!rbuf_initialized_p (&con->rbuf))
|
|
con->st &= ~DONE_CWD;
|
|
else
|
|
con->st |= DONE_CWD;
|
|
|
|
switch (err)
|
|
{
|
|
case HOSTERR: case CONREFUSED: case FWRITEERR: case FOPENERR:
|
|
case FTPNSFOD: case FTPLOGINC: case FTPNOPASV: case CONTNOTSUPPORTED:
|
|
/* Fatal errors, give up. */
|
|
return err;
|
|
break;
|
|
case CONSOCKERR: case CONERROR: case FTPSRVERR: case FTPRERR:
|
|
case WRITEFAILED: case FTPUNKNOWNTYPE: case CONPORTERR:
|
|
case BINDERR: case LISTENERR: case ACCEPTERR:
|
|
case FTPPORTERR: case FTPLOGREFUSED: case FTPINVPASV:
|
|
printwhat (count, opt.ntry);
|
|
/* non-fatal errors */
|
|
continue;
|
|
break;
|
|
case FTPRETRINT:
|
|
/* If the control connection was closed, the retrieval
|
|
will be considered OK if f->size == len. */
|
|
if (!f || len != f->size)
|
|
{
|
|
printwhat (count, opt.ntry);
|
|
continue;
|
|
}
|
|
break;
|
|
case RETRFINISHED:
|
|
/* Great! */
|
|
break;
|
|
default:
|
|
/* Not as great. */
|
|
abort ();
|
|
}
|
|
/* Time? */
|
|
tms = time_str (NULL);
|
|
if (!opt.spider)
|
|
tmrate = retr_rate (len - restval, con->dltime, 0);
|
|
|
|
/* If we get out of the switch above without continue'ing, we've
|
|
successfully downloaded a file. Remember this fact. */
|
|
downloaded_file (FILE_DOWNLOADED_NORMALLY, locf);
|
|
|
|
if (con->st & ON_YOUR_OWN)
|
|
{
|
|
CLOSE (RBUF_FD (&con->rbuf));
|
|
rbuf_uninitialize (&con->rbuf);
|
|
}
|
|
if (!opt.spider)
|
|
logprintf (LOG_VERBOSE, _("%s (%s) - `%s' saved [%ld]\n\n"),
|
|
tms, tmrate, locf, len);
|
|
if (!opt.verbose && !opt.quiet)
|
|
{
|
|
/* Need to hide the password from the URL. The `if' is here
|
|
so that we don't do the needless allocation every
|
|
time. */
|
|
char *hurl = url_string (u, 1);
|
|
logprintf (LOG_NONVERBOSE, "%s URL: %s [%ld] -> \"%s\" [%d]\n",
|
|
tms, hurl, len, locf, count);
|
|
xfree (hurl);
|
|
}
|
|
|
|
if ((con->cmd & DO_LIST))
|
|
/* This is a directory listing file. */
|
|
{
|
|
if (!opt.remove_listing)
|
|
/* --dont-remove-listing was specified, so do count this towards the
|
|
number of bytes and files downloaded. */
|
|
{
|
|
total_downloaded_bytes += len;
|
|
opt.numurls++;
|
|
}
|
|
|
|
/* Deletion of listing files is not controlled by --delete-after, but
|
|
by the more specific option --dont-remove-listing, and the code
|
|
to do this deletion is in another function. */
|
|
}
|
|
else if (!opt.spider)
|
|
/* This is not a directory listing file. */
|
|
{
|
|
/* Unlike directory listing files, don't pretend normal files weren't
|
|
downloaded if they're going to be deleted. People seeding proxies,
|
|
for instance, may want to know how many bytes and files they've
|
|
downloaded through it. */
|
|
total_downloaded_bytes += len;
|
|
opt.numurls++;
|
|
|
|
if (opt.delete_after)
|
|
{
|
|
DEBUGP (("Removing file due to --delete-after in"
|
|
" ftp_loop_internal():\n"));
|
|
logprintf (LOG_VERBOSE, _("Removing %s.\n"), locf);
|
|
if (unlink (locf))
|
|
logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
|
|
}
|
|
}
|
|
|
|
/* Restore the original leave-pendingness. */
|
|
if (orig_lp)
|
|
con->cmd |= LEAVE_PENDING;
|
|
else
|
|
con->cmd &= ~LEAVE_PENDING;
|
|
return RETROK;
|
|
} while (!opt.ntry || (count < opt.ntry));
|
|
|
|
if (rbuf_initialized_p (&con->rbuf) && (con->st & ON_YOUR_OWN))
|
|
{
|
|
CLOSE (RBUF_FD (&con->rbuf));
|
|
rbuf_uninitialize (&con->rbuf);
|
|
}
|
|
return TRYLIMEXC;
|
|
}
|
|
|
|
/* Return the directory listing in a reusable format. The directory
|
|
is specifed in u->dir. */
|
|
uerr_t
|
|
ftp_get_listing (struct url *u, ccon *con, struct fileinfo **f)
|
|
{
|
|
uerr_t err;
|
|
char *uf; /* url file name */
|
|
char *lf; /* list file name */
|
|
char *old_target = con->target;
|
|
|
|
con->st &= ~ON_YOUR_OWN;
|
|
con->cmd |= (DO_LIST | LEAVE_PENDING);
|
|
con->cmd &= ~DO_RETR;
|
|
|
|
/* Find the listing file name. We do it by taking the file name of
|
|
the URL and replacing the last component with the listing file
|
|
name. */
|
|
uf = url_file_name (u);
|
|
lf = file_merge (uf, LIST_FILENAME);
|
|
xfree (uf);
|
|
DEBUGP ((_("Using `%s' as listing tmp file.\n"), lf));
|
|
|
|
con->target = lf;
|
|
err = ftp_loop_internal (u, NULL, con);
|
|
con->target = old_target;
|
|
|
|
if (err == RETROK)
|
|
*f = ftp_parse_ls (lf, con->rs);
|
|
else
|
|
*f = NULL;
|
|
if (opt.remove_listing)
|
|
{
|
|
if (unlink (lf))
|
|
logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
|
|
else
|
|
logprintf (LOG_VERBOSE, _("Removed `%s'.\n"), lf);
|
|
}
|
|
xfree (lf);
|
|
con->cmd &= ~DO_LIST;
|
|
return err;
|
|
}
|
|
|
|
static uerr_t ftp_retrieve_dirs PARAMS ((struct url *, struct fileinfo *,
|
|
ccon *));
|
|
static uerr_t ftp_retrieve_glob PARAMS ((struct url *, ccon *, int));
|
|
static struct fileinfo *delelement PARAMS ((struct fileinfo *,
|
|
struct fileinfo **));
|
|
static void freefileinfo PARAMS ((struct fileinfo *f));
|
|
|
|
/* Retrieve a list of files given in struct fileinfo linked list. If
|
|
a file is a symbolic link, do not retrieve it, but rather try to
|
|
set up a similar link on the local disk, if the symlinks are
|
|
supported.
|
|
|
|
If opt.recursive is set, after all files have been retrieved,
|
|
ftp_retrieve_dirs will be called to retrieve the directories. */
|
|
static uerr_t
|
|
ftp_retrieve_list (struct url *u, struct fileinfo *f, ccon *con)
|
|
{
|
|
static int depth = 0;
|
|
uerr_t err;
|
|
struct fileinfo *orig;
|
|
long local_size;
|
|
time_t tml;
|
|
int dlthis;
|
|
|
|
/* Increase the depth. */
|
|
++depth;
|
|
if (opt.reclevel != INFINITE_RECURSION && depth > opt.reclevel)
|
|
{
|
|
DEBUGP ((_("Recursion depth %d exceeded max. depth %d.\n"),
|
|
depth, opt.reclevel));
|
|
--depth;
|
|
return RECLEVELEXC;
|
|
}
|
|
|
|
assert (f != NULL);
|
|
orig = f;
|
|
|
|
con->st &= ~ON_YOUR_OWN;
|
|
if (!(con->st & DONE_CWD))
|
|
con->cmd |= DO_CWD;
|
|
else
|
|
con->cmd &= ~DO_CWD;
|
|
con->cmd |= (DO_RETR | LEAVE_PENDING);
|
|
|
|
if (!rbuf_initialized_p (&con->rbuf))
|
|
con->cmd |= DO_LOGIN;
|
|
else
|
|
con->cmd &= ~DO_LOGIN;
|
|
|
|
err = RETROK; /* in case it's not used */
|
|
|
|
while (f)
|
|
{
|
|
char *old_target, *ofile;
|
|
|
|
if (opt.quota && total_downloaded_bytes > opt.quota)
|
|
{
|
|
--depth;
|
|
return QUOTEXC;
|
|
}
|
|
old_target = con->target;
|
|
|
|
ofile = xstrdup (u->file);
|
|
url_set_file (u, f->name);
|
|
|
|
con->target = url_file_name (u);
|
|
err = RETROK;
|
|
|
|
dlthis = 1;
|
|
if (opt.timestamping && f->type == FT_PLAINFILE)
|
|
{
|
|
struct stat st;
|
|
/* If conversion of HTML files retrieved via FTP is ever implemented,
|
|
we'll need to stat() <file>.orig here when -K has been specified.
|
|
I'm not implementing it now since files on an FTP server are much
|
|
more likely than files on an HTTP server to legitimately have a
|
|
.orig suffix. */
|
|
if (!stat (con->target, &st))
|
|
{
|
|
int eq_size;
|
|
int cor_val;
|
|
/* Else, get it from the file. */
|
|
local_size = st.st_size;
|
|
tml = st.st_mtime;
|
|
#ifdef WINDOWS
|
|
/* Modification time granularity is 2 seconds for Windows, so
|
|
increase local time by 1 second for later comparison. */
|
|
tml++;
|
|
#endif
|
|
/* Compare file sizes only for servers that tell us correct
|
|
values. Assumme sizes being equal for servers that lie
|
|
about file size. */
|
|
cor_val = (con->rs == ST_UNIX || con->rs == ST_WINNT);
|
|
eq_size = cor_val ? (local_size == f->size) : 1 ;
|
|
if (f->tstamp <= tml && eq_size)
|
|
{
|
|
/* Remote file is older, file sizes can be compared and
|
|
are both equal. */
|
|
logprintf (LOG_VERBOSE, _("\
|
|
Remote file no newer than local file `%s' -- not retrieving.\n"), con->target);
|
|
dlthis = 0;
|
|
}
|
|
else if (eq_size)
|
|
{
|
|
/* Remote file is newer or sizes cannot be matched */
|
|
logprintf (LOG_VERBOSE, _("\
|
|
Remote file is newer than local file `%s' -- retrieving.\n\n"),
|
|
con->target);
|
|
}
|
|
else
|
|
{
|
|
/* Sizes do not match */
|
|
logprintf (LOG_VERBOSE, _("\
|
|
The sizes do not match (local %ld) -- retrieving.\n\n"), local_size);
|
|
}
|
|
}
|
|
} /* opt.timestamping && f->type == FT_PLAINFILE */
|
|
switch (f->type)
|
|
{
|
|
case FT_SYMLINK:
|
|
/* If opt.retr_symlinks is defined, we treat symlinks as
|
|
if they were normal files. There is currently no way
|
|
to distinguish whether they might be directories, and
|
|
follow them. */
|
|
if (!opt.retr_symlinks)
|
|
{
|
|
#ifdef HAVE_SYMLINK
|
|
if (!f->linkto)
|
|
logputs (LOG_NOTQUIET,
|
|
_("Invalid name of the symlink, skipping.\n"));
|
|
else
|
|
{
|
|
struct stat st;
|
|
/* Check whether we already have the correct
|
|
symbolic link. */
|
|
int rc = lstat (con->target, &st);
|
|
if (rc == 0)
|
|
{
|
|
size_t len = strlen (f->linkto) + 1;
|
|
if (S_ISLNK (st.st_mode))
|
|
{
|
|
char *link_target = (char *)alloca (len);
|
|
size_t n = readlink (con->target, link_target, len);
|
|
if ((n == len - 1)
|
|
&& (memcmp (link_target, f->linkto, n) == 0))
|
|
{
|
|
logprintf (LOG_VERBOSE, _("\
|
|
Already have correct symlink %s -> %s\n\n"),
|
|
con->target, f->linkto);
|
|
dlthis = 0;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
logprintf (LOG_VERBOSE, _("Creating symlink %s -> %s\n"),
|
|
con->target, f->linkto);
|
|
/* Unlink before creating symlink! */
|
|
unlink (con->target);
|
|
if (symlink (f->linkto, con->target) == -1)
|
|
logprintf (LOG_NOTQUIET, "symlink: %s\n",
|
|
strerror (errno));
|
|
logputs (LOG_VERBOSE, "\n");
|
|
} /* have f->linkto */
|
|
#else /* not HAVE_SYMLINK */
|
|
logprintf (LOG_NOTQUIET,
|
|
_("Symlinks not supported, skipping symlink `%s'.\n"),
|
|
con->target);
|
|
#endif /* not HAVE_SYMLINK */
|
|
}
|
|
else /* opt.retr_symlinks */
|
|
{
|
|
if (dlthis)
|
|
err = ftp_loop_internal (u, f, con);
|
|
} /* opt.retr_symlinks */
|
|
break;
|
|
case FT_DIRECTORY:
|
|
if (!opt.recursive)
|
|
logprintf (LOG_NOTQUIET, _("Skipping directory `%s'.\n"),
|
|
f->name);
|
|
break;
|
|
case FT_PLAINFILE:
|
|
/* Call the retrieve loop. */
|
|
if (dlthis)
|
|
err = ftp_loop_internal (u, f, con);
|
|
break;
|
|
case FT_UNKNOWN:
|
|
logprintf (LOG_NOTQUIET, _("%s: unknown/unsupported file type.\n"),
|
|
f->name);
|
|
break;
|
|
} /* switch */
|
|
|
|
/* Set the time-stamp information to the local file. Symlinks
|
|
are not to be stamped because it sets the stamp on the
|
|
original. :( */
|
|
if (!(f->type == FT_SYMLINK && !opt.retr_symlinks)
|
|
&& f->tstamp != -1
|
|
&& dlthis
|
|
&& file_exists_p (con->target))
|
|
{
|
|
/* #### This code repeats in http.c and ftp.c. Move it to a
|
|
function! */
|
|
const char *fl = NULL;
|
|
if (opt.output_document)
|
|
{
|
|
if (opt.od_known_regular)
|
|
fl = opt.output_document;
|
|
}
|
|
else
|
|
fl = con->target;
|
|
if (fl)
|
|
touch (fl, f->tstamp);
|
|
}
|
|
else if (f->tstamp == -1)
|
|
logprintf (LOG_NOTQUIET, _("%s: corrupt time-stamp.\n"), con->target);
|
|
|
|
if (f->perms && f->type == FT_PLAINFILE && dlthis)
|
|
chmod (con->target, f->perms);
|
|
else
|
|
DEBUGP (("Unrecognized permissions for %s.\n", con->target));
|
|
|
|
xfree (con->target);
|
|
con->target = old_target;
|
|
|
|
url_set_file (u, ofile);
|
|
xfree (ofile);
|
|
|
|
/* Break on fatals. */
|
|
if (err == QUOTEXC || err == HOSTERR || err == FWRITEERR)
|
|
break;
|
|
con->cmd &= ~ (DO_CWD | DO_LOGIN);
|
|
f = f->next;
|
|
}
|
|
|
|
/* We do not want to call ftp_retrieve_dirs here */
|
|
if (opt.recursive &&
|
|
!(opt.reclevel != INFINITE_RECURSION && depth >= opt.reclevel))
|
|
err = ftp_retrieve_dirs (u, orig, con);
|
|
else if (opt.recursive)
|
|
DEBUGP ((_("Will not retrieve dirs since depth is %d (max %d).\n"),
|
|
depth, opt.reclevel));
|
|
--depth;
|
|
return err;
|
|
}
|
|
|
|
/* Retrieve the directories given in a file list. This function works
|
|
by simply going through the linked list and calling
|
|
ftp_retrieve_glob on each directory entry. The function knows
|
|
about excluded directories. */
|
|
static uerr_t
|
|
ftp_retrieve_dirs (struct url *u, struct fileinfo *f, ccon *con)
|
|
{
|
|
char *container = NULL;
|
|
int container_size = 0;
|
|
|
|
for (; f; f = f->next)
|
|
{
|
|
int size;
|
|
char *odir, *newdir;
|
|
|
|
if (opt.quota && total_downloaded_bytes > opt.quota)
|
|
break;
|
|
if (f->type != FT_DIRECTORY)
|
|
continue;
|
|
|
|
/* Allocate u->dir off stack, but reallocate only if a larger
|
|
string is needed. It's a pity there's no "realloca" for an
|
|
item on the bottom of the stack. */
|
|
size = strlen (u->dir) + 1 + strlen (f->name) + 1;
|
|
if (size > container_size)
|
|
container = (char *)alloca (size);
|
|
newdir = container;
|
|
|
|
odir = u->dir;
|
|
if (*odir == '\0'
|
|
|| (*odir == '/' && *(odir + 1) == '\0'))
|
|
/* If ODIR is empty or just "/", simply append f->name to
|
|
ODIR. (In the former case, to preserve u->dir being
|
|
relative; in the latter case, to avoid double slash.) */
|
|
sprintf (newdir, "%s%s", odir, f->name);
|
|
else
|
|
/* Else, use a separator. */
|
|
sprintf (newdir, "%s/%s", odir, f->name);
|
|
|
|
DEBUGP (("Composing new CWD relative to the initial directory.\n"));
|
|
DEBUGP ((" odir = '%s'\n f->name = '%s'\n newdir = '%s'\n\n",
|
|
odir, f->name, newdir));
|
|
if (!accdir (newdir, ALLABS))
|
|
{
|
|
logprintf (LOG_VERBOSE, _("\
|
|
Not descending to `%s' as it is excluded/not-included.\n"), newdir);
|
|
continue;
|
|
}
|
|
|
|
con->st &= ~DONE_CWD;
|
|
|
|
odir = xstrdup (u->dir); /* because url_set_dir will free
|
|
u->dir. */
|
|
url_set_dir (u, newdir);
|
|
ftp_retrieve_glob (u, con, GETALL);
|
|
url_set_dir (u, odir);
|
|
xfree (odir);
|
|
|
|
/* Set the time-stamp? */
|
|
}
|
|
|
|
if (opt.quota && total_downloaded_bytes > opt.quota)
|
|
return QUOTEXC;
|
|
else
|
|
return RETROK;
|
|
}
|
|
|
|
/* Return non-zero if S has a leading '/' or contains '../' */
|
|
static int
|
|
has_insecure_name_p (const char *s)
|
|
{
|
|
if (*s == '/')
|
|
return 1;
|
|
|
|
if (strstr(s, "../") != 0)
|
|
return 1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* A near-top-level function to retrieve the files in a directory.
|
|
The function calls ftp_get_listing, to get a linked list of files.
|
|
Then it weeds out the file names that do not match the pattern.
|
|
ftp_retrieve_list is called with this updated list as an argument.
|
|
|
|
If the argument ACTION is GETONE, just download the file (but first
|
|
get the listing, so that the time-stamp is heeded); if it's GLOBALL,
|
|
use globbing; if it's GETALL, download the whole directory. */
|
|
static uerr_t
|
|
ftp_retrieve_glob (struct url *u, ccon *con, int action)
|
|
{
|
|
struct fileinfo *f, *orig, *start;
|
|
uerr_t res;
|
|
|
|
con->cmd |= LEAVE_PENDING;
|
|
|
|
res = ftp_get_listing (u, con, &orig);
|
|
if (res != RETROK)
|
|
return res;
|
|
start = orig;
|
|
/* First: weed out that do not conform the global rules given in
|
|
opt.accepts and opt.rejects. */
|
|
if (opt.accepts || opt.rejects)
|
|
{
|
|
f = orig;
|
|
while (f)
|
|
{
|
|
if (f->type != FT_DIRECTORY && !acceptable (f->name))
|
|
{
|
|
logprintf (LOG_VERBOSE, _("Rejecting `%s'.\n"), f->name);
|
|
f = delelement (f, &start);
|
|
}
|
|
else
|
|
f = f->next;
|
|
}
|
|
}
|
|
/* Remove all files with possible harmful names */
|
|
f = orig;
|
|
while (f)
|
|
{
|
|
if (has_insecure_name_p (f->name))
|
|
{
|
|
logprintf (LOG_VERBOSE, _("Rejecting `%s'.\n"), f->name);
|
|
f = delelement (f, &start);
|
|
}
|
|
else
|
|
f = f->next;
|
|
}
|
|
/* Now weed out the files that do not match our globbing pattern.
|
|
If we are dealing with a globbing pattern, that is. */
|
|
if (*u->file && (action == GLOBALL || action == GETONE))
|
|
{
|
|
int matchres = 0;
|
|
|
|
f = start;
|
|
while (f)
|
|
{
|
|
matchres = fnmatch (u->file, f->name, 0);
|
|
if (matchres == -1)
|
|
{
|
|
logprintf (LOG_NOTQUIET, "%s: %s\n", con->target,
|
|
strerror (errno));
|
|
break;
|
|
}
|
|
if (matchres == FNM_NOMATCH)
|
|
f = delelement (f, &start); /* delete the element from the list */
|
|
else
|
|
f = f->next; /* leave the element in the list */
|
|
}
|
|
if (matchres == -1)
|
|
{
|
|
freefileinfo (start);
|
|
return RETRBADPATTERN;
|
|
}
|
|
}
|
|
res = RETROK;
|
|
if (start)
|
|
{
|
|
/* Just get everything. */
|
|
ftp_retrieve_list (u, start, con);
|
|
}
|
|
else if (!start)
|
|
{
|
|
if (action == GLOBALL)
|
|
{
|
|
/* No luck. */
|
|
/* #### This message SUCKS. We should see what was the
|
|
reason that nothing was retrieved. */
|
|
logprintf (LOG_VERBOSE, _("No matches on pattern `%s'.\n"), u->file);
|
|
}
|
|
else /* GETONE or GETALL */
|
|
{
|
|
/* Let's try retrieving it anyway. */
|
|
con->st |= ON_YOUR_OWN;
|
|
res = ftp_loop_internal (u, NULL, con);
|
|
return res;
|
|
}
|
|
}
|
|
freefileinfo (start);
|
|
if (opt.quota && total_downloaded_bytes > opt.quota)
|
|
return QUOTEXC;
|
|
else
|
|
/* #### Should we return `res' here? */
|
|
return RETROK;
|
|
}
|
|
|
|
/* The wrapper that calls an appropriate routine according to contents
|
|
of URL. Inherently, its capabilities are limited on what can be
|
|
encoded into a URL. */
|
|
uerr_t
|
|
ftp_loop (struct url *u, int *dt, struct url *proxy)
|
|
{
|
|
ccon con; /* FTP connection */
|
|
uerr_t res;
|
|
|
|
*dt = 0;
|
|
|
|
memset (&con, 0, sizeof (con));
|
|
|
|
rbuf_uninitialize (&con.rbuf);
|
|
con.st = ON_YOUR_OWN;
|
|
con.rs = ST_UNIX;
|
|
con.id = NULL;
|
|
con.proxy = proxy;
|
|
res = RETROK; /* in case it's not used */
|
|
|
|
/* If the file name is empty, the user probably wants a directory
|
|
index. We'll provide one, properly HTML-ized. Unless
|
|
opt.htmlify is 0, of course. :-) */
|
|
if (!*u->file && !opt.recursive)
|
|
{
|
|
struct fileinfo *f;
|
|
res = ftp_get_listing (u, &con, &f);
|
|
|
|
if (res == RETROK)
|
|
{
|
|
if (opt.htmlify && !opt.spider)
|
|
{
|
|
char *filename = (opt.output_document
|
|
? xstrdup (opt.output_document)
|
|
: (con.target ? xstrdup (con.target)
|
|
: url_file_name (u)));
|
|
res = ftp_index (filename, u, f);
|
|
if (res == FTPOK && opt.verbose)
|
|
{
|
|
if (!opt.output_document)
|
|
{
|
|
struct stat st;
|
|
long sz;
|
|
if (stat (filename, &st) == 0)
|
|
sz = st.st_size;
|
|
else
|
|
sz = -1;
|
|
logprintf (LOG_NOTQUIET,
|
|
_("Wrote HTML-ized index to `%s' [%ld].\n"),
|
|
filename, sz);
|
|
}
|
|
else
|
|
logprintf (LOG_NOTQUIET,
|
|
_("Wrote HTML-ized index to `%s'.\n"),
|
|
filename);
|
|
}
|
|
xfree (filename);
|
|
}
|
|
freefileinfo (f);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
int wild = has_wildcards_p (u->file);
|
|
if ((opt.ftp_glob && wild) || opt.recursive || opt.timestamping)
|
|
{
|
|
/* ftp_retrieve_glob is a catch-all function that gets called
|
|
if we need globbing, time-stamping or recursion. Its
|
|
third argument is just what we really need. */
|
|
res = ftp_retrieve_glob (u, &con,
|
|
(opt.ftp_glob && wild) ? GLOBALL : GETONE);
|
|
}
|
|
else
|
|
res = ftp_loop_internal (u, NULL, &con);
|
|
}
|
|
if (res == FTPOK)
|
|
res = RETROK;
|
|
if (res == RETROK)
|
|
*dt |= RETROKF;
|
|
/* If a connection was left, quench it. */
|
|
if (rbuf_initialized_p (&con.rbuf))
|
|
CLOSE (RBUF_FD (&con.rbuf));
|
|
FREE_MAYBE (con.id);
|
|
con.id = NULL;
|
|
FREE_MAYBE (con.target);
|
|
con.target = NULL;
|
|
return res;
|
|
}
|
|
|
|
/* Delete an element from the fileinfo linked list. Returns the
|
|
address of the next element, or NULL if the list is exhausted. It
|
|
can modify the start of the list. */
|
|
static struct fileinfo *
|
|
delelement (struct fileinfo *f, struct fileinfo **start)
|
|
{
|
|
struct fileinfo *prev = f->prev;
|
|
struct fileinfo *next = f->next;
|
|
|
|
xfree (f->name);
|
|
FREE_MAYBE (f->linkto);
|
|
xfree (f);
|
|
|
|
if (next)
|
|
next->prev = prev;
|
|
if (prev)
|
|
prev->next = next;
|
|
else
|
|
*start = next;
|
|
return next;
|
|
}
|
|
|
|
/* Free the fileinfo linked list of files. */
|
|
static void
|
|
freefileinfo (struct fileinfo *f)
|
|
{
|
|
while (f)
|
|
{
|
|
struct fileinfo *next = f->next;
|
|
xfree (f->name);
|
|
if (f->linkto)
|
|
xfree (f->linkto);
|
|
xfree (f);
|
|
f = next;
|
|
}
|
|
}
|