1999-12-02 15:42:23 +08:00
|
|
|
|
/* Reading/parsing the initialization file.
|
2001-05-28 03:35:15 +08:00
|
|
|
|
Copyright (C) 1995, 1996, 1997, 1998, 2000, 2001
|
|
|
|
|
Free Software Foundation, Inc.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
This file is part of GNU Wget.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
1999-12-02 15:42:23 +08:00
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
1999-12-02 15:42:23 +08:00
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2001-05-28 03:35:15 +08:00
|
|
|
|
along with Wget; if not, write to the Free Software
|
2002-05-18 10:16:36 +08:00
|
|
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
|
|
|
|
|
|
In addition, as a special exception, the Free Software Foundation
|
|
|
|
|
gives permission to link the code of its release of Wget with the
|
|
|
|
|
OpenSSL project's "OpenSSL" library (or with modified versions of it
|
|
|
|
|
that use the same license as the "OpenSSL" library), and distribute
|
|
|
|
|
the linked executables. You must obey the GNU General Public License
|
|
|
|
|
in all respects for all of the code used other than "OpenSSL". If you
|
|
|
|
|
modify this file, you may extend this exception to your version of the
|
|
|
|
|
file, but you are not obligated to do so. If you do not wish to do
|
|
|
|
|
so, delete this exception statement from your version. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
#include <config.h>
|
|
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
|
#include <sys/types.h>
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
#ifdef HAVE_UNISTD_H
|
|
|
|
|
# include <unistd.h>
|
|
|
|
|
#endif
|
|
|
|
|
#ifdef HAVE_STRING_H
|
|
|
|
|
# include <string.h>
|
|
|
|
|
#else
|
|
|
|
|
# include <strings.h>
|
|
|
|
|
#endif
|
|
|
|
|
#include <errno.h>
|
|
|
|
|
|
2000-10-24 14:19:17 +08:00
|
|
|
|
#ifdef WINDOWS
|
|
|
|
|
# include <winsock.h>
|
|
|
|
|
#else
|
|
|
|
|
# include <sys/socket.h>
|
|
|
|
|
# include <netinet/in.h>
|
2001-11-17 00:58:08 +08:00
|
|
|
|
#ifndef __BEOS__
|
2000-10-24 14:19:17 +08:00
|
|
|
|
# include <arpa/inet.h>
|
|
|
|
|
#endif
|
2001-11-17 00:58:08 +08:00
|
|
|
|
#endif
|
2000-10-24 14:19:17 +08:00
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
#ifdef HAVE_PWD_H
|
|
|
|
|
#include <pwd.h>
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#include "wget.h"
|
|
|
|
|
#include "utils.h"
|
|
|
|
|
#include "init.h"
|
|
|
|
|
#include "host.h"
|
|
|
|
|
#include "recur.h"
|
|
|
|
|
#include "netrc.h"
|
2002-04-21 04:46:38 +08:00
|
|
|
|
#include "cookies.h" /* for cookie_jar_delete */
|
2001-12-10 06:25:34 +08:00
|
|
|
|
#include "progress.h"
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
#ifndef errno
|
|
|
|
|
extern int errno;
|
|
|
|
|
#endif
|
|
|
|
|
|
2002-04-21 04:46:38 +08:00
|
|
|
|
extern struct cookie_jar *wget_cookie_jar;
|
|
|
|
|
|
2001-04-09 07:59:14 +08:00
|
|
|
|
/* We want tilde expansion enabled only when reading `.wgetrc' lines;
|
|
|
|
|
otherwise, it will be performed by the shell. This variable will
|
|
|
|
|
be set by the wgetrc-reading function. */
|
|
|
|
|
|
|
|
|
|
static int enable_tilde_expansion;
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
#define CMD_DECLARE(func) static int func \
|
|
|
|
|
PARAMS ((const char *, const char *, void *))
|
|
|
|
|
|
|
|
|
|
CMD_DECLARE (cmd_boolean);
|
2000-10-20 14:59:30 +08:00
|
|
|
|
CMD_DECLARE (cmd_bytes);
|
|
|
|
|
CMD_DECLARE (cmd_directory_vector);
|
|
|
|
|
CMD_DECLARE (cmd_lockable_boolean);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
CMD_DECLARE (cmd_number);
|
|
|
|
|
CMD_DECLARE (cmd_number_inf);
|
|
|
|
|
CMD_DECLARE (cmd_string);
|
2001-04-09 07:59:14 +08:00
|
|
|
|
CMD_DECLARE (cmd_file);
|
2002-01-17 09:03:33 +08:00
|
|
|
|
CMD_DECLARE (cmd_directory);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
CMD_DECLARE (cmd_time);
|
2000-10-20 14:59:30 +08:00
|
|
|
|
CMD_DECLARE (cmd_vector);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
CMD_DECLARE (cmd_spec_dirstruct);
|
|
|
|
|
CMD_DECLARE (cmd_spec_header);
|
|
|
|
|
CMD_DECLARE (cmd_spec_htmlify);
|
|
|
|
|
CMD_DECLARE (cmd_spec_mirror);
|
2001-12-10 06:25:34 +08:00
|
|
|
|
CMD_DECLARE (cmd_spec_progress);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
CMD_DECLARE (cmd_spec_recursive);
|
|
|
|
|
CMD_DECLARE (cmd_spec_useragent);
|
|
|
|
|
|
2000-03-11 14:48:06 +08:00
|
|
|
|
/* List of recognized commands, each consisting of name, closure and function.
|
|
|
|
|
When adding a new command, simply add it to the list, but be sure to keep the
|
|
|
|
|
list sorted alphabetically, as comind() depends on it. Also, be sure to add
|
|
|
|
|
any entries that allocate memory (e.g. cmd_string and cmd_vector guys) to the
|
|
|
|
|
cleanup() function below. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
static struct {
|
|
|
|
|
char *name;
|
|
|
|
|
void *closure;
|
|
|
|
|
int (*action) PARAMS ((const char *, const char *, void *));
|
|
|
|
|
} commands[] = {
|
|
|
|
|
{ "accept", &opt.accepts, cmd_vector },
|
|
|
|
|
{ "addhostdir", &opt.add_hostdir, cmd_boolean },
|
|
|
|
|
{ "alwaysrest", &opt.always_rest, cmd_boolean }, /* deprecated */
|
|
|
|
|
{ "background", &opt.background, cmd_boolean },
|
2000-03-01 08:17:23 +08:00
|
|
|
|
{ "backupconverted", &opt.backup_converted, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "backups", &opt.backups, cmd_number },
|
|
|
|
|
{ "base", &opt.base_href, cmd_string },
|
2002-01-25 11:34:23 +08:00
|
|
|
|
{ "bindaddress", &opt.bind_address, cmd_string },
|
2001-04-27 13:26:44 +08:00
|
|
|
|
{ "cache", &opt.allow_cache, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "continue", &opt.always_rest, cmd_boolean },
|
|
|
|
|
{ "convertlinks", &opt.convert_links, cmd_boolean },
|
2001-04-09 06:25:24 +08:00
|
|
|
|
{ "cookies", &opt.cookies, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "cutdirs", &opt.cut_dirs, cmd_number },
|
|
|
|
|
#ifdef DEBUG
|
|
|
|
|
{ "debug", &opt.debug, cmd_boolean },
|
|
|
|
|
#endif
|
|
|
|
|
{ "deleteafter", &opt.delete_after, cmd_boolean },
|
2002-01-17 09:03:33 +08:00
|
|
|
|
{ "dirprefix", &opt.dir_prefix, cmd_directory },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "dirstruct", NULL, cmd_spec_dirstruct },
|
2003-09-11 03:41:54 +08:00
|
|
|
|
{ "dnscache", &opt.dns_cache, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "domains", &opt.domains, cmd_vector },
|
|
|
|
|
{ "dotbytes", &opt.dot_bytes, cmd_bytes },
|
|
|
|
|
{ "dotsinline", &opt.dots_in_line, cmd_number },
|
|
|
|
|
{ "dotspacing", &opt.dot_spacing, cmd_number },
|
2001-11-28 10:44:18 +08:00
|
|
|
|
{ "dotstyle", &opt.dot_style, cmd_string },
|
2002-04-19 17:24:32 +08:00
|
|
|
|
#ifdef HAVE_SSL
|
|
|
|
|
{ "egdfile", &opt.sslegdsock, cmd_file },
|
|
|
|
|
#endif
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "excludedirectories", &opt.excludes, cmd_directory_vector },
|
|
|
|
|
{ "excludedomains", &opt.exclude_domains, cmd_vector },
|
|
|
|
|
{ "followftp", &opt.follow_ftp, cmd_boolean },
|
2000-03-11 14:48:06 +08:00
|
|
|
|
{ "followtags", &opt.follow_tags, cmd_vector },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "forcehtml", &opt.force_html, cmd_boolean },
|
|
|
|
|
{ "ftpproxy", &opt.ftp_proxy, cmd_string },
|
|
|
|
|
{ "glob", &opt.ftp_glob, cmd_boolean },
|
|
|
|
|
{ "header", NULL, cmd_spec_header },
|
2000-10-20 13:55:46 +08:00
|
|
|
|
{ "htmlextension", &opt.html_extension, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "htmlify", NULL, cmd_spec_htmlify },
|
2000-11-20 08:04:06 +08:00
|
|
|
|
{ "httpkeepalive", &opt.http_keep_alive, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "httppasswd", &opt.http_passwd, cmd_string },
|
|
|
|
|
{ "httpproxy", &opt.http_proxy, cmd_string },
|
2000-12-06 07:09:41 +08:00
|
|
|
|
{ "httpsproxy", &opt.https_proxy, cmd_string },
|
2001-02-17 13:26:34 +08:00
|
|
|
|
{ "httpuser", &opt.http_user, cmd_string },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "ignorelength", &opt.ignore_length, cmd_boolean },
|
2000-03-11 14:48:06 +08:00
|
|
|
|
{ "ignoretags", &opt.ignore_tags, cmd_vector },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "includedirectories", &opt.includes, cmd_directory_vector },
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{ "input", &opt.input_filename, cmd_file },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "killlonger", &opt.kill_longer, cmd_boolean },
|
2001-11-27 04:07:13 +08:00
|
|
|
|
{ "limitrate", &opt.limit_rate, cmd_bytes },
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{ "loadcookies", &opt.cookies_input, cmd_file },
|
|
|
|
|
{ "logfile", &opt.lfilename, cmd_file },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "login", &opt.ftp_acc, cmd_string },
|
|
|
|
|
{ "mirror", NULL, cmd_spec_mirror },
|
|
|
|
|
{ "netrc", &opt.netrc, cmd_boolean },
|
|
|
|
|
{ "noclobber", &opt.noclobber, cmd_boolean },
|
|
|
|
|
{ "noparent", &opt.no_parent, cmd_boolean },
|
|
|
|
|
{ "noproxy", &opt.no_proxy, cmd_vector },
|
2000-03-11 14:48:06 +08:00
|
|
|
|
{ "numtries", &opt.ntry, cmd_number_inf },/* deprecated*/
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{ "outputdocument", &opt.output_document, cmd_file },
|
2000-08-30 19:26:21 +08:00
|
|
|
|
{ "pagerequisites", &opt.page_requisites, cmd_boolean },
|
2000-10-20 14:59:30 +08:00
|
|
|
|
{ "passiveftp", &opt.ftp_pasv, cmd_lockable_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "passwd", &opt.ftp_pass, cmd_string },
|
2002-04-14 12:22:47 +08:00
|
|
|
|
{ "postdata", &opt.post_data, cmd_string },
|
|
|
|
|
{ "postfile", &opt.post_file_name, cmd_file },
|
2001-12-10 06:25:34 +08:00
|
|
|
|
{ "progress", &opt.progress_type, cmd_spec_progress },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "proxypasswd", &opt.proxy_passwd, cmd_string },
|
|
|
|
|
{ "proxyuser", &opt.proxy_user, cmd_string },
|
|
|
|
|
{ "quiet", &opt.quiet, cmd_boolean },
|
|
|
|
|
{ "quota", &opt.quota, cmd_bytes },
|
2001-11-26 05:23:15 +08:00
|
|
|
|
{ "randomwait", &opt.random_wait, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "reclevel", &opt.reclevel, cmd_number_inf },
|
|
|
|
|
{ "recursive", NULL, cmd_spec_recursive },
|
2000-03-02 22:23:22 +08:00
|
|
|
|
{ "referer", &opt.referer, cmd_string },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "reject", &opt.rejects, cmd_vector },
|
|
|
|
|
{ "relativeonly", &opt.relative_only, cmd_boolean },
|
|
|
|
|
{ "removelisting", &opt.remove_listing, cmd_boolean },
|
|
|
|
|
{ "retrsymlinks", &opt.retr_symlinks, cmd_boolean },
|
2003-09-05 05:34:58 +08:00
|
|
|
|
{ "retryconnrefused", &opt.retry_connrefused, cmd_boolean },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "robots", &opt.use_robots, cmd_boolean },
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{ "savecookies", &opt.cookies_output, cmd_file },
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "saveheaders", &opt.save_headers, cmd_boolean },
|
|
|
|
|
{ "serverresponse", &opt.server_response, cmd_boolean },
|
|
|
|
|
{ "spanhosts", &opt.spanhost, cmd_boolean },
|
|
|
|
|
{ "spider", &opt.spider, cmd_boolean },
|
2001-02-11 06:33:31 +08:00
|
|
|
|
#ifdef HAVE_SSL
|
2002-04-21 10:26:48 +08:00
|
|
|
|
{ "sslcadir", &opt.sslcadir, cmd_directory },
|
|
|
|
|
{ "sslcafile", &opt.sslcafile, cmd_file },
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{ "sslcertfile", &opt.sslcertfile, cmd_file },
|
|
|
|
|
{ "sslcertkey", &opt.sslcertkey, cmd_file },
|
2002-04-21 10:26:48 +08:00
|
|
|
|
{ "sslcerttype", &opt.sslcerttype, cmd_number },
|
|
|
|
|
{ "sslcheckcert", &opt.sslcheckcert, cmd_number },
|
|
|
|
|
{ "sslprotocol", &opt.sslprotocol, cmd_number },
|
2001-02-11 06:33:31 +08:00
|
|
|
|
#endif /* HAVE_SSL */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{ "timeout", &opt.timeout, cmd_time },
|
|
|
|
|
{ "timestamping", &opt.timestamping, cmd_boolean },
|
|
|
|
|
{ "tries", &opt.ntry, cmd_number_inf },
|
|
|
|
|
{ "useproxy", &opt.use_proxy, cmd_boolean },
|
|
|
|
|
{ "useragent", NULL, cmd_spec_useragent },
|
|
|
|
|
{ "verbose", &opt.verbose, cmd_boolean },
|
2000-03-02 22:45:37 +08:00
|
|
|
|
{ "wait", &opt.wait, cmd_time },
|
|
|
|
|
{ "waitretry", &opt.waitretry, cmd_time }
|
1999-12-02 15:42:23 +08:00
|
|
|
|
};
|
|
|
|
|
|
2002-04-15 02:39:43 +08:00
|
|
|
|
/* Look up COM in the commands[] array and return its index. If COM
|
|
|
|
|
is not found, -1 is returned. This function uses binary search. */
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
static int
|
|
|
|
|
comind (const char *com)
|
|
|
|
|
{
|
2002-04-15 02:39:43 +08:00
|
|
|
|
int lo = 0, hi = ARRAY_SIZE (commands) - 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2002-04-15 02:39:43 +08:00
|
|
|
|
while (lo <= hi)
|
1999-12-02 15:42:23 +08:00
|
|
|
|
{
|
2002-04-15 02:39:43 +08:00
|
|
|
|
int mid = (lo + hi) >> 1;
|
|
|
|
|
int cmp = strcasecmp (com, commands[mid].name);
|
|
|
|
|
if (cmp < 0)
|
|
|
|
|
hi = mid - 1;
|
|
|
|
|
else if (cmp > 0)
|
|
|
|
|
lo = mid + 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
else
|
2002-04-15 02:39:43 +08:00
|
|
|
|
return mid;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
}
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Reset the variables to default values. */
|
|
|
|
|
static void
|
|
|
|
|
defaults (void)
|
|
|
|
|
{
|
|
|
|
|
char *tmp;
|
|
|
|
|
|
|
|
|
|
/* Most of the default values are 0. Just reset everything, and
|
|
|
|
|
fill in the non-zero values. Note that initializing pointers to
|
|
|
|
|
NULL this way is technically illegal, but porting Wget to a
|
|
|
|
|
machine where NULL is not all-zero bit pattern will be the least
|
|
|
|
|
of the implementors' worries. */
|
|
|
|
|
memset (&opt, 0, sizeof (opt));
|
|
|
|
|
|
2001-04-09 06:25:24 +08:00
|
|
|
|
opt.cookies = 1;
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
opt.verbose = -1;
|
|
|
|
|
opt.dir_prefix = xstrdup (".");
|
|
|
|
|
opt.ntry = 20;
|
|
|
|
|
opt.reclevel = 5;
|
|
|
|
|
opt.add_hostdir = 1;
|
2001-04-29 18:53:55 +08:00
|
|
|
|
opt.ftp_acc = xstrdup ("anonymous");
|
|
|
|
|
opt.ftp_pass = xstrdup ("-wget@");
|
1999-12-02 15:42:23 +08:00
|
|
|
|
opt.netrc = 1;
|
|
|
|
|
opt.ftp_glob = 1;
|
|
|
|
|
opt.htmlify = 1;
|
2000-11-20 08:04:06 +08:00
|
|
|
|
opt.http_keep_alive = 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
opt.use_proxy = 1;
|
|
|
|
|
tmp = getenv ("no_proxy");
|
|
|
|
|
if (tmp)
|
|
|
|
|
opt.no_proxy = sepstring (tmp);
|
2001-04-27 13:26:44 +08:00
|
|
|
|
opt.allow_cache = 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
#ifdef HAVE_SELECT
|
|
|
|
|
opt.timeout = 900;
|
|
|
|
|
#endif
|
|
|
|
|
opt.use_robots = 1;
|
|
|
|
|
|
|
|
|
|
opt.remove_listing = 1;
|
|
|
|
|
|
|
|
|
|
opt.dot_bytes = 1024;
|
|
|
|
|
opt.dot_spacing = 10;
|
|
|
|
|
opt.dots_in_line = 50;
|
2003-09-11 03:41:54 +08:00
|
|
|
|
|
|
|
|
|
opt.dns_cache = 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Return a freshly allocated copy of the user's home directory, or
   NULL if it cannot be determined.

   The HOME environment variable is preferred.  Without it, non-Windows
   builds consult the password database entry of the current user,
   while Windows builds fall back to "C:\".  */
char *
home_dir (void)
{
  char *from_env = getenv ("HOME");

  if (from_env)
    return xstrdup (from_env);

#ifndef WINDOWS
  {
    /* HOME is not defined; try the password file instead.  */
    struct passwd *entry = getpwuid (getuid ());

    if (entry && entry->pw_dir)
      return xstrdup (entry->pw_dir);
    return NULL;
  }
#else /* WINDOWS */
  /* #### The registry could be consulted here, but the closest thing
     it offers is the user's Start menu, which is of little use.  */
  return xstrdup ("C:\\");
#endif /* WINDOWS */
}
|
|
|
|
|
|
|
|
|
|
/* Return the path to the user's .wgetrc. This is either the value of
|
|
|
|
|
`WGETRC' environment variable, or `$HOME/.wgetrc'.
|
|
|
|
|
|
|
|
|
|
If the `WGETRC' variable exists but the file does not exist, the
|
|
|
|
|
function will exit(). */
|
|
|
|
|
static char *
|
|
|
|
|
wgetrc_file_name (void)
|
|
|
|
|
{
|
|
|
|
|
char *env, *home;
|
|
|
|
|
char *file = NULL;
|
|
|
|
|
|
|
|
|
|
/* Try the environment. */
|
|
|
|
|
env = getenv ("WGETRC");
|
|
|
|
|
if (env && *env)
|
|
|
|
|
{
|
|
|
|
|
if (!file_exists_p (env))
|
|
|
|
|
{
|
2001-12-14 03:19:03 +08:00
|
|
|
|
fprintf (stderr, "%s: %s: %s.\n", exec_name, env, strerror (errno));
|
1999-12-02 15:42:23 +08:00
|
|
|
|
exit (1);
|
|
|
|
|
}
|
|
|
|
|
return xstrdup (env);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#ifndef WINDOWS
|
|
|
|
|
/* If that failed, try $HOME/.wgetrc. */
|
|
|
|
|
home = home_dir ();
|
|
|
|
|
if (home)
|
|
|
|
|
{
|
|
|
|
|
file = (char *)xmalloc (strlen (home) + 1 + strlen (".wgetrc") + 1);
|
|
|
|
|
sprintf (file, "%s/.wgetrc", home);
|
|
|
|
|
}
|
2000-03-31 22:08:57 +08:00
|
|
|
|
FREE_MAYBE (home);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
#else /* WINDOWS */
|
|
|
|
|
/* Under Windows, "home" is (for the purposes of this function) the
|
|
|
|
|
directory where `wget.exe' resides, and `wget.ini' will be used
|
|
|
|
|
as file name. SYSTEM_WGETRC should not be defined under WINDOWS.
|
|
|
|
|
|
|
|
|
|
It is not as trivial as I assumed, because on 95 argv[0] is full
|
|
|
|
|
path, but on NT you get what you typed in command line. --dbudor */
|
|
|
|
|
home = ws_mypath ();
|
|
|
|
|
if (home)
|
|
|
|
|
{
|
|
|
|
|
file = (char *)xmalloc (strlen (home) + strlen ("wget.ini") + 1);
|
|
|
|
|
sprintf (file, "%swget.ini", home);
|
|
|
|
|
}
|
|
|
|
|
#endif /* WINDOWS */
|
|
|
|
|
|
|
|
|
|
if (!file)
|
|
|
|
|
return NULL;
|
|
|
|
|
if (!file_exists_p (file))
|
|
|
|
|
{
|
2000-11-23 00:58:28 +08:00
|
|
|
|
xfree (file);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
return file;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Initialize variables from a wgetrc file */
|
|
|
|
|
static void
|
|
|
|
|
run_wgetrc (const char *file)
|
|
|
|
|
{
|
|
|
|
|
FILE *fp;
|
|
|
|
|
char *line;
|
|
|
|
|
int ln;
|
|
|
|
|
|
|
|
|
|
fp = fopen (file, "rb");
|
|
|
|
|
if (!fp)
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: Cannot read %s (%s).\n"), exec_name,
|
|
|
|
|
file, strerror (errno));
|
|
|
|
|
return;
|
|
|
|
|
}
|
2001-04-09 07:59:14 +08:00
|
|
|
|
enable_tilde_expansion = 1;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
ln = 1;
|
|
|
|
|
while ((line = read_whole_line (fp)))
|
|
|
|
|
{
|
|
|
|
|
char *com, *val;
|
|
|
|
|
int status;
|
|
|
|
|
|
|
|
|
|
/* Parse the line. */
|
|
|
|
|
status = parse_line (line, &com, &val);
|
2000-11-23 00:58:28 +08:00
|
|
|
|
xfree (line);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* If everything is OK, set the value. */
|
|
|
|
|
if (status == 1)
|
|
|
|
|
{
|
|
|
|
|
if (!setval (com, val))
|
|
|
|
|
fprintf (stderr, _("%s: Error in %s at line %d.\n"), exec_name,
|
|
|
|
|
file, ln);
|
2000-11-23 00:58:28 +08:00
|
|
|
|
xfree (com);
|
|
|
|
|
xfree (val);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
}
|
|
|
|
|
else if (status == 0)
|
|
|
|
|
fprintf (stderr, _("%s: Error in %s at line %d.\n"), exec_name,
|
|
|
|
|
file, ln);
|
|
|
|
|
++ln;
|
|
|
|
|
}
|
2001-04-09 07:59:14 +08:00
|
|
|
|
enable_tilde_expansion = 0;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
fclose (fp);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Set up `opt': load the built-in defaults, then the system-wide
   wgetrc (when SYSTEM_WGETRC is defined and the file exists), then the
   user's own wgetrc.  */
void
initialize (void)
{
  char *user_rc;

  /* Load the hard-coded defaults.  */
  defaults ();

#ifdef SYSTEM_WGETRC
  /* The system-wide file is read first so the user's can override it.  */
  if (file_exists_p (SYSTEM_WGETRC))
    run_wgetrc (SYSTEM_WGETRC);
#endif

  /* Override it with the user's own, if one exists.  */
  user_rc = wgetrc_file_name ();
  if (!user_rc)
    return;

#ifdef SYSTEM_WGETRC
  /* #### We should somehow canonicalize `user_rc' and SYSTEM_WGETRC,
     really.  A plain string comparison only catches the case where
     both are spelled identically.  */
  if (!strcmp (user_rc, SYSTEM_WGETRC))
    {
      fprintf (stderr, _("\
%s: Warning: Both system and user wgetrc point to `%s'.\n"),
               exec_name, user_rc);
      xfree (user_rc);
      return;
    }
#endif

  run_wgetrc (user_rc);
  xfree (user_rc);
}
|
|
|
|
|
|
|
|
|
|
/* Split LINE, which has the syntax

     <sp>* command <sp>* = <sp>* value <newline>

   into its command and value.  On success *COM and *VAL receive
   freshly allocated strings that the caller must free.  `-' and `_'
   characters in the command are dropped, and whitespace at the end of
   the value is trimmed.  On failure nothing is left allocated.

   Return values:
    1 - success
    0 - failure (malformed line or unknown command)
   -1 - empty line or comment  */
int
parse_line (const char *line, char **com, char **val)
{
  const char *cur = line;
  const char *name_beg, *name_end, *src, *val_end;
  char *dst;

  /* Skip leading whitespace.  */
  while (*cur && ISSPACE (*cur))
    ++cur;

  /* Nothing to do for empty lines and comments.  */
  if (*cur == '\0' || *cur == '#')
    return -1;

  /* Delimit the command name.  */
  name_beg = cur;
  while (ISALPHA (*cur) || *cur == '_' || *cur == '-')
    ++cur;
  name_end = cur;

  /* The name must be followed by whitespace or '='.  */
  if (*cur != '=' && !ISSPACE (*cur))
    return 0;

  /* Copy the name by hand rather than with strdupdelim(), because the
     `-' and `_' characters have to be left out of the copy.  */
  *com = (char *)xmalloc (name_end - name_beg + 1);
  dst = *com;
  for (src = name_beg; src < name_end; src++)
    if (*src != '_' && *src != '-')
      *dst++ = *src;
  *dst = '\0';

  /* Reject unknown commands right away.  */
  if (comind (*com) == -1)
    {
      xfree (*com);
      return 0;
    }

  /* An '=' must follow, possibly after some whitespace.  */
  while (ISSPACE (*cur))
    ++cur;
  if (*cur != '=')
    {
      xfree (*com);
      return 0;
    }

  /* Step over '=' and the whitespace after it.  */
  ++cur;
  while (ISSPACE (*cur))
    ++cur;

  /* The value extends to the end of the line, less trailing
     whitespace.  */
  val_end = line + strlen (line) - 1;
  while (val_end > cur && ISSPACE (*val_end))
    --val_end;
  *val = strdupdelim (cur, val_end + 1);

  return 1;
}
|
|
|
|
|
|
|
|
|
|
/* Set COM to VAL. This is the meat behind processing `.wgetrc'. No
|
|
|
|
|
fatals -- error signal prints a warning and resets to default
|
|
|
|
|
value. All error messages are printed to stderr, *not* to
|
|
|
|
|
opt.lfile, since opt.lfile wasn't even generated yet. */
|
|
|
|
|
int
|
|
|
|
|
setval (const char *com, const char *val)
|
|
|
|
|
{
|
|
|
|
|
int ind;
|
|
|
|
|
|
|
|
|
|
if (!com || !val)
|
|
|
|
|
return 0;
|
|
|
|
|
ind = comind (com);
|
|
|
|
|
if (ind == -1)
|
|
|
|
|
{
|
|
|
|
|
/* #### Should I just abort()? */
|
|
|
|
|
#ifdef DEBUG
|
|
|
|
|
fprintf (stderr, _("%s: BUG: unknown command `%s', value `%s'.\n"),
|
|
|
|
|
exec_name, com, val);
|
|
|
|
|
#endif
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
return ((*commands[ind].action) (com, val, commands[ind].closure));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Generic helper functions, for use with `commands'. */
|
|
|
|
|
|
|
|
|
|
static int myatoi PARAMS ((const char *s));
|
|
|
|
|
|
|
|
|
|
/* Store the boolean value from VAL to CLOSURE. COM is ignored,
|
|
|
|
|
except for error messages. */
|
|
|
|
|
static int
|
|
|
|
|
cmd_boolean (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
int bool_value;
|
|
|
|
|
|
|
|
|
|
if (!strcasecmp (val, "on")
|
|
|
|
|
|| (*val == '1' && !*(val + 1)))
|
|
|
|
|
bool_value = 1;
|
|
|
|
|
else if (!strcasecmp (val, "off")
|
|
|
|
|
|| (*val == '0' && !*(val + 1)))
|
|
|
|
|
bool_value = 0;
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Please specify on or off.\n"),
|
|
|
|
|
exec_name, com);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
*(int *)closure = bool_value;
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
2000-10-20 14:59:30 +08:00
|
|
|
|
/* Store the lockable_boolean {2, 1, 0, -1} value from VAL to CLOSURE. COM is
|
|
|
|
|
ignored, except for error messages. Values 2 and -1 indicate that once
|
|
|
|
|
defined, the value may not be changed by successive wgetrc files or
|
|
|
|
|
command-line arguments.
|
|
|
|
|
|
|
|
|
|
Values: 2 - Enable a particular option for good ("always")
|
|
|
|
|
1 - Enable an option ("on")
|
|
|
|
|
0 - Disable an option ("off")
|
|
|
|
|
-1 - Disable an option for good ("never") */
|
|
|
|
|
static int
|
|
|
|
|
cmd_lockable_boolean (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
int lockable_boolean_value;
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* If a config file said "always" or "never", don't allow command line
|
|
|
|
|
* arguments to override the config file.
|
|
|
|
|
*/
|
|
|
|
|
if (*(int *)closure == -1 || *(int *)closure == 2)
|
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
|
|
if (!strcasecmp (val, "always")
|
|
|
|
|
|| (*val == '2' && !*(val + 1)))
|
|
|
|
|
lockable_boolean_value = 2;
|
|
|
|
|
else if (!strcasecmp (val, "on")
|
|
|
|
|
|| (*val == '1' && !*(val + 1)))
|
|
|
|
|
lockable_boolean_value = 1;
|
|
|
|
|
else if (!strcasecmp (val, "off")
|
|
|
|
|
|| (*val == '0' && !*(val + 1)))
|
|
|
|
|
lockable_boolean_value = 0;
|
|
|
|
|
else if (!strcasecmp (val, "never")
|
|
|
|
|
|| (*val == '-' && *(val + 1) == '1' && !*(val + 2)))
|
|
|
|
|
lockable_boolean_value = -1;
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Please specify always, on, off, "
|
|
|
|
|
"or never.\n"),
|
|
|
|
|
exec_name, com);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
*(int *)closure = lockable_boolean_value;
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Set the non-negative integer value from VAL to CLOSURE. With
|
|
|
|
|
incorrect specification, the number remains unchanged. */
|
|
|
|
|
static int
|
|
|
|
|
cmd_number (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
int num = myatoi (val);
|
|
|
|
|
|
|
|
|
|
if (num == -1)
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Invalid specification `%s'.\n"),
|
|
|
|
|
exec_name, com, val);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
*(int *)closure = num;
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Like cmd_number(), except that `inf' (in any letter case) is also
   accepted and stored as 0.  */
static int
cmd_number_inf (const char *com, const char *val, void *closure)
{
  if (strcasecmp (val, "inf") != 0)
    return cmd_number (com, val, closure);

  *(int *)closure = 0;
  return 1;
}
|
|
|
|
|
|
|
|
|
|
/* Replace the string that CLOSURE (a `char **') points to with a fresh
   copy of VAL.  Any previous string is freed first.  COM is not used.
   Always returns 1.  */
static int
cmd_string (const char *com, const char *val, void *closure)
{
  char **slot = (char **)closure;

  /* Release the old value before storing the new copy.  */
  FREE_MAYBE (*slot);
  *slot = xstrdup (val);

  return 1;
}
|
|
|
|
|
|
2001-04-09 07:59:14 +08:00
|
|
|
|
/* Like the above, but handles tilde-expansion when reading a user's
|
|
|
|
|
`.wgetrc'. In that case, and if VAL begins with `~', the tilde
|
|
|
|
|
gets expanded to the user's home directory. */
|
|
|
|
|
static int
|
|
|
|
|
cmd_file (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
char **pstring = (char **)closure;
|
|
|
|
|
|
|
|
|
|
FREE_MAYBE (*pstring);
|
2001-12-06 13:35:17 +08:00
|
|
|
|
|
|
|
|
|
/* #### If VAL is empty, perhaps should set *CLOSURE to NULL. */
|
|
|
|
|
|
2002-01-17 09:03:33 +08:00
|
|
|
|
if (!enable_tilde_expansion || !(*val == '~' && (*(val + 1) == '/'
|
|
|
|
|
#ifdef WINDOWS
|
|
|
|
|
|| *(val + 1) == '\\'
|
|
|
|
|
#endif
|
|
|
|
|
)))
|
2001-04-09 07:59:14 +08:00
|
|
|
|
{
|
|
|
|
|
noexpand:
|
|
|
|
|
*pstring = xstrdup (val);
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
char *result;
|
|
|
|
|
int homelen;
|
|
|
|
|
char *home = home_dir ();
|
|
|
|
|
if (!home)
|
|
|
|
|
goto noexpand;
|
|
|
|
|
|
|
|
|
|
homelen = strlen (home);
|
2002-01-17 09:03:33 +08:00
|
|
|
|
while (homelen && (home[homelen - 1] == '/'
|
|
|
|
|
#ifdef WINDOWS
|
|
|
|
|
|| home[homelen - 1] == '\\'
|
|
|
|
|
#endif
|
|
|
|
|
))
|
2001-04-09 07:59:14 +08:00
|
|
|
|
home[--homelen] = '\0';
|
|
|
|
|
|
|
|
|
|
/* Skip the leading "~/". */
|
2002-01-17 09:03:33 +08:00
|
|
|
|
#ifdef WINDOWS
|
|
|
|
|
for (++val; *val == '/' || *val == '\\'; val++)
|
|
|
|
|
;
|
|
|
|
|
#else
|
2001-04-09 07:59:14 +08:00
|
|
|
|
for (++val; *val == '/'; val++)
|
|
|
|
|
;
|
2002-01-17 09:03:33 +08:00
|
|
|
|
#endif
|
2001-04-09 07:59:14 +08:00
|
|
|
|
|
2002-08-04 04:34:58 +08:00
|
|
|
|
result = xmalloc (homelen + 1 + strlen (val) + 1);
|
2001-04-09 07:59:14 +08:00
|
|
|
|
memcpy (result, home, homelen);
|
|
|
|
|
result[homelen] = '/';
|
|
|
|
|
strcpy (result + homelen + 1, val);
|
|
|
|
|
|
|
|
|
|
*pstring = result;
|
|
|
|
|
}
|
2002-01-17 09:03:33 +08:00
|
|
|
|
#ifdef WINDOWS
|
|
|
|
|
/* Convert "\" to "/". */
|
|
|
|
|
{
|
|
|
|
|
char *s;
|
|
|
|
|
for (s = *pstring; *s; s++)
|
|
|
|
|
if (*s == '\\')
|
|
|
|
|
*s = '/';
|
|
|
|
|
}
|
|
|
|
|
#endif
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Like cmd_file(), but additionally removes every trailing '/' from
   the stored string.  */
static int
cmd_directory (const char *com, const char *val, void *closure)
{
  char *dir;
  size_t len;

  /* Let cmd_file() do the tilde expansion and the separator
     canonicalization (backslash -> slash under Windows).  These
     things should perhaps be in a separate function.  */
  if (!cmd_file (com, val, closure))
    return 0;

  dir = *(char **)closure;
  len = strlen (dir);
  while (len > 0 && dir[len - 1] == '/')
    dir[--len] = '\0';

  return 1;
}
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Merge the vector given in VAL (strings separated with `,') into the
   vector (NULL-terminated array of strings) that CLOSURE points to.
   An empty VAL instead frees the existing vector and resets it to
   NULL.  COM is not used.  Always returns 1.  */
static int
cmd_vector (const char *com, const char *val, void *closure)
{
  char ***pvec = (char ***)closure;

  if (*val == '\0')
    {
      /* An empty value clears the list.  */
      free_vec (*pvec);
      *pvec = NULL;
      return 1;
    }

  *pvec = merge_vecs (*pvec, sepstring (val));
  return 1;
}
|
|
|
|
|
|
|
|
|
|
/* Like cmd_vector(), but treats the elements of VAL as directories:
   one trailing '/' is removed from every element longer than a single
   character before the vectors are merged.  An empty VAL frees the
   existing vector and resets it to NULL.  Always returns 1.  */
static int
cmd_directory_vector (const char *com, const char *val, void *closure)
{
  char ***pvec = (char ***)closure;
  char **dirs, **d;

  if (*val == '\0')
    {
      free_vec (*pvec);
      *pvec = NULL;
      return 1;
    }

  dirs = sepstring (val);
  if (dirs)
    for (d = dirs; *d; d++)
      {
        int len = strlen (*d);

        /* Strip the trailing slash, but leave a one-character
           element (the degenerate case of the root directory)
           alone.  */
        if (len > 1 && (*d)[len - 1] == '/')
          (*d)[len - 1] = '\0';
      }

  *pvec = merge_vecs (*pvec, dirs);
  return 1;
}
|
|
|
|
|
|
|
|
|
|
/* Set the value stored in VAL to CLOSURE (which should point to a
   long int), allowing several postfixes, with the following syntax
   (regexp):

   [0-9]+       -> bytes
   [0-9]+[kK]   -> bytes * 1024
   [0-9]+[mM]   -> bytes * 1024 * 1024
   [0-9]+[gG]   -> bytes * 1024 * 1024 * 1024
   inf          -> 0

   Anything else, including a value that does not fit in a long, is
   flagged as incorrect (a message naming COM and VAL is printed),
   and CLOSURE is unchanged.  Returns 1 on success, 0 on failure.  */
static int
cmd_bytes (const char *com, const char *val, void *closure)
{
  /* Largest value of a long.  Computed here so that the function
     does not depend on <limits.h> being included.  */
  const long long_max = (long) (~0UL >> 1);
  long result = 0;
  long multiplier;
  long *out = (long *)closure;
  const char *p = val;

  /* Check for "inf".  */
  if (p[0] == 'i' && p[1] == 'n' && p[2] == 'f' && p[3] == '\0')
    {
      *out = 0;
      return 1;
    }
  /* Search for digits and construct result, refusing to overflow.  */
  for (; *p && ISDIGIT (*p); p++)
    {
      int digit = *p - '0';
      if (result > (long_max - digit) / 10)
	goto invalid;
      result = (10 * result) + digit;
    }
  /* If no digits were found, or more than one character is following
     them, bail out.  */
  if (p == val || (*p != '\0' && *(p + 1) != '\0'))
    goto invalid;
  /* Search for a designator.  */
  switch (TOLOWER (*p))
    {
    case '\0':
      /* None */
      multiplier = 1;
      break;
    case 'k':
      /* Kilobytes */
      multiplier = 1024;
      break;
    case 'm':
      /* Megabytes */
      multiplier = (long)1024 * 1024;
      break;
    case 'g':
      /* Gigabytes */
      multiplier = (long)1024 * 1024 * 1024;
      break;
    default:
      goto invalid;
    }
  /* Signed overflow is undefined, so check before multiplying.  */
  if (result > long_max / multiplier)
    goto invalid;
  *out = result * multiplier;
  return 1;

 invalid:
  printf (_("%s: Invalid specification `%s'\n"), com, val);
  return 0;
}
|
|
|
|
|
|
|
|
|
|
/* Store the number of seconds described by VAL to the long int that
   CLOSURE points to.  VAL must be one or more decimal digits,
   optionally followed by exactly one suffix (either case):

   [0-9]+       -> seconds
   [0-9]+[mM]   -> minutes
   [0-9]+[hH]   -> hours
   [0-9]+[dD]   -> days
   [0-9]+[wW]   -> weeks

   Anything else, including a value that does not fit in a long, is
   flagged as incorrect (a message naming COM and VAL is printed),
   and CLOSURE is unchanged.  Returns 1 on success, 0 on failure.  */
static int
cmd_time (const char *com, const char *val, void *closure)
{
  /* Largest value of a long.  Computed here so that the function
     does not depend on <limits.h> being included.  */
  const long long_max = (long) (~0UL >> 1);
  long result = 0;
  long unit;
  const char *p = val;

  /* Search for digits and construct result, refusing to overflow.  */
  for (; *p && ISDIGIT (*p); p++)
    {
      int digit = *p - '0';
      if (result > (long_max - digit) / 10)
	goto invalid;
      result = (10 * result) + digit;
    }
  /* If no digits were found, or more than one character is following
     them, bail out.  */
  if (p == val || (*p != '\0' && *(p + 1) != '\0'))
    goto invalid;
  /* Search for a suffix.  */
  switch (TOLOWER (*p))
    {
    case '\0':
      /* None */
      unit = 1;
      break;
    case 'm':
      /* Minutes */
      unit = 60;
      break;
    case 'h':
      /* Hours */
      unit = 3600;
      break;
    case 'd':
      /* Days */
      unit = 86400L;
      break;
    case 'w':
      /* Weeks :-) */
      unit = 604800L;
      break;
    default:
      goto invalid;
    }
  /* Signed overflow is undefined, so check before multiplying.  */
  if (result > long_max / unit)
    goto invalid;
  *(long *)closure = result * unit;
  return 1;

 invalid:
  printf (_("%s: Invalid specification `%s'\n"), com, val);
  return 0;
}
|
|
|
|
|
|
|
|
|
|
/* Specialized helper functions, used by `commands' to handle some
|
|
|
|
|
options specially. */
|
|
|
|
|
|
|
|
|
|
static int check_user_specified_header PARAMS ((const char *));
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
cmd_spec_dirstruct (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
if (!cmd_boolean (com, val, &opt.dirstruct))
|
|
|
|
|
return 0;
|
|
|
|
|
/* Since dirstruct behaviour is explicitly changed, no_dirstruct
|
|
|
|
|
must be affected inversely. */
|
|
|
|
|
if (opt.dirstruct)
|
|
|
|
|
opt.no_dirstruct = 0;
|
|
|
|
|
else
|
|
|
|
|
opt.no_dirstruct = 1;
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
cmd_spec_header (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
if (!*val)
|
|
|
|
|
{
|
|
|
|
|
/* Empty header means reset headers. */
|
|
|
|
|
FREE_MAYBE (opt.user_header);
|
|
|
|
|
opt.user_header = NULL;
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
if (!check_user_specified_header (val))
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Invalid specification `%s'.\n"),
|
|
|
|
|
exec_name, com, val);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
i = opt.user_header ? strlen (opt.user_header) : 0;
|
|
|
|
|
opt.user_header = (char *)xrealloc (opt.user_header, i + strlen (val)
|
|
|
|
|
+ 2 + 1);
|
|
|
|
|
strcpy (opt.user_header + i, val);
|
|
|
|
|
i += strlen (val);
|
|
|
|
|
opt.user_header[i++] = '\r';
|
|
|
|
|
opt.user_header[i++] = '\n';
|
|
|
|
|
opt.user_header[i] = '\0';
|
|
|
|
|
}
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
cmd_spec_htmlify (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
int flag = cmd_boolean (com, val, &opt.htmlify);
|
|
|
|
|
if (flag && !opt.htmlify)
|
|
|
|
|
opt.remove_listing = 0;
|
|
|
|
|
return flag;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
cmd_spec_mirror (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
int mirror;
|
|
|
|
|
|
|
|
|
|
if (!cmd_boolean (com, val, &mirror))
|
|
|
|
|
return 0;
|
|
|
|
|
if (mirror)
|
|
|
|
|
{
|
|
|
|
|
opt.recursive = 1;
|
|
|
|
|
if (!opt.no_dirstruct)
|
|
|
|
|
opt.dirstruct = 1;
|
|
|
|
|
opt.timestamping = 1;
|
2000-08-30 19:26:21 +08:00
|
|
|
|
opt.reclevel = INFINITE_RECURSION;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
opt.remove_listing = 0;
|
|
|
|
|
}
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
2001-11-23 12:59:52 +08:00
|
|
|
|
static int
|
|
|
|
|
cmd_spec_progress (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
if (!valid_progress_implementation_p (val))
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Invalid progress type `%s'.\n"),
|
|
|
|
|
exec_name, com, val);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
2001-12-10 06:25:34 +08:00
|
|
|
|
FREE_MAYBE (opt.progress_type);
|
|
|
|
|
|
|
|
|
|
/* Don't call set_progress_implementation here. It will be called
|
|
|
|
|
in main() when it becomes clear what the log output is. */
|
|
|
|
|
opt.progress_type = xstrdup (val);
|
2001-11-23 12:59:52 +08:00
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
static int
|
|
|
|
|
cmd_spec_recursive (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
if (!cmd_boolean (com, val, &opt.recursive))
|
|
|
|
|
return 0;
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
if (opt.recursive && !opt.no_dirstruct)
|
|
|
|
|
opt.dirstruct = 1;
|
|
|
|
|
}
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
cmd_spec_useragent (const char *com, const char *val, void *closure)
|
|
|
|
|
{
|
|
|
|
|
/* Just check for empty string and newline, so we don't throw total
|
|
|
|
|
junk to the server. */
|
|
|
|
|
if (!*val || strchr (val, '\n'))
|
|
|
|
|
{
|
|
|
|
|
fprintf (stderr, _("%s: %s: Invalid specification `%s'.\n"),
|
|
|
|
|
exec_name, com, val);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
opt.useragent = xstrdup (val);
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* Miscellaneous useful routines. */
|
|
|
|
|
|
|
|
|
|
/* Return the integer value of a positive integer written in S, or -1
   if an error was encountered.  S must consist of decimal digits
   only: an empty string, a sign, whitespace or any other character
   is an error, and so is a number too large to fit in an int.  */
static int
myatoi (const char *s)
{
  /* Largest value of an int.  Computed here so that the function
     does not depend on <limits.h> being included.  */
  const int int_max = (int) (~0U >> 1);
  const char *orig = s;
  int res = 0;

  for (; *s >= '0' && *s <= '9'; s++)
    {
      int digit = *s - '0';
      /* Signed overflow is undefined, so check before accumulating.  */
      if (res > (int_max - digit) / 10)
	return -1;
      res = 10 * res + digit;
    }
  /* Trailing garbage, or no digits at all.  */
  if (*s || orig == s)
    return -1;
  return res;
}
|
|
|
|
|
|
|
|
|
|
/* Nonzero if X is an octal digit character, i.e. `0' through `7'.
   Note that X may be evaluated twice.  */
#define ISODIGIT(x) ((x) >= '0' && (x) <= '7')
|
|
|
|
|
|
|
|
|
|
/* Check whether S looks like a usable header line.  Returns 1 if the
   first `:' in S is preceded by at least one character with no
   whitespace before it, and S contains no newline; returns 0
   otherwise.  */
static int
check_user_specified_header (const char *s)
{
  const char *stop = s;

  /* Advance to the first colon, whitespace character, or end of S.  */
  while (*stop != '\0' && *stop != ':' && !ISSPACE (*stop))
    ++stop;

  /* The header MUST contain `:' preceded by at least one
     non-whitespace character.  */
  if (stop == s || *stop != ':')
    return 0;

  /* The header MUST NOT contain newlines.  */
  return strchr (s, '\n') ? 0 : 1;
}
|
|
|
|
|
|
2000-11-23 06:15:45 +08:00
|
|
|
|
void cleanup_html_url PARAMS ((void));
|
2001-11-25 11:10:34 +08:00
|
|
|
|
void res_cleanup PARAMS ((void));
|
2000-11-23 06:15:45 +08:00
|
|
|
|
void downloaded_files_free PARAMS ((void));
|
2001-11-26 13:36:33 +08:00
|
|
|
|
void http_cleanup PARAMS ((void));
|
2000-11-23 06:15:45 +08:00
|
|
|
|
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Free the memory allocated by global variables. */
|
|
|
|
|
void
|
|
|
|
|
cleanup (void)
|
|
|
|
|
{
|
2001-11-25 11:10:34 +08:00
|
|
|
|
/* Free external resources, close files, etc. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
if (opt.dfp)
|
|
|
|
|
fclose (opt.dfp);
|
2001-11-25 11:10:34 +08:00
|
|
|
|
|
|
|
|
|
/* We're exiting anyway so there's no real need to call free()
|
|
|
|
|
hundreds of times. Skipping the frees will make Wget exit
|
|
|
|
|
faster.
|
|
|
|
|
|
|
|
|
|
However, when detecting leaks, it's crucial to free() everything
|
|
|
|
|
because then you can find the real leaks, i.e. the allocated
|
|
|
|
|
memory which grows with the size of the program. */
|
|
|
|
|
|
|
|
|
|
#ifdef DEBUG_MALLOC
|
|
|
|
|
recursive_cleanup ();
|
|
|
|
|
res_cleanup ();
|
2001-11-26 13:36:33 +08:00
|
|
|
|
http_cleanup ();
|
|
|
|
|
cleanup_html_url ();
|
|
|
|
|
downloaded_files_free ();
|
2001-11-25 11:10:34 +08:00
|
|
|
|
host_cleanup ();
|
2002-04-21 04:46:38 +08:00
|
|
|
|
cookie_jar_delete (wget_cookie_jar);
|
2001-11-26 13:36:33 +08:00
|
|
|
|
|
2001-11-25 11:10:34 +08:00
|
|
|
|
{
|
|
|
|
|
extern acc_t *netrc_list;
|
|
|
|
|
free_netrc (netrc_list);
|
|
|
|
|
}
|
1999-12-02 15:42:23 +08:00
|
|
|
|
FREE_MAYBE (opt.lfilename);
|
2000-11-23 00:58:28 +08:00
|
|
|
|
xfree (opt.dir_prefix);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
FREE_MAYBE (opt.input_filename);
|
|
|
|
|
FREE_MAYBE (opt.output_document);
|
|
|
|
|
free_vec (opt.accepts);
|
|
|
|
|
free_vec (opt.rejects);
|
|
|
|
|
free_vec (opt.excludes);
|
|
|
|
|
free_vec (opt.includes);
|
|
|
|
|
free_vec (opt.domains);
|
2000-03-11 14:48:06 +08:00
|
|
|
|
free_vec (opt.follow_tags);
|
|
|
|
|
free_vec (opt.ignore_tags);
|
2001-11-25 11:10:34 +08:00
|
|
|
|
FREE_MAYBE (opt.progress_type);
|
2000-11-23 00:58:28 +08:00
|
|
|
|
xfree (opt.ftp_acc);
|
2000-11-23 06:15:45 +08:00
|
|
|
|
FREE_MAYBE (opt.ftp_pass);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
FREE_MAYBE (opt.ftp_proxy);
|
2000-12-06 07:09:41 +08:00
|
|
|
|
FREE_MAYBE (opt.https_proxy);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
FREE_MAYBE (opt.http_proxy);
|
|
|
|
|
free_vec (opt.no_proxy);
|
|
|
|
|
FREE_MAYBE (opt.useragent);
|
2000-03-02 22:23:22 +08:00
|
|
|
|
FREE_MAYBE (opt.referer);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
FREE_MAYBE (opt.http_user);
|
|
|
|
|
FREE_MAYBE (opt.http_passwd);
|
|
|
|
|
FREE_MAYBE (opt.user_header);
|
2001-02-11 06:33:31 +08:00
|
|
|
|
#ifdef HAVE_SSL
|
|
|
|
|
FREE_MAYBE (opt.sslcertkey);
|
|
|
|
|
FREE_MAYBE (opt.sslcertfile);
|
|
|
|
|
#endif /* HAVE_SSL */
|
2001-04-02 06:23:52 +08:00
|
|
|
|
FREE_MAYBE (opt.bind_address);
|
2001-04-09 06:25:24 +08:00
|
|
|
|
FREE_MAYBE (opt.cookies_input);
|
|
|
|
|
FREE_MAYBE (opt.cookies_output);
|
2001-11-25 11:10:34 +08:00
|
|
|
|
#endif
|
1999-12-02 15:42:23 +08:00
|
|
|
|
}
|