1999-12-02 15:42:23 +08:00
|
|
|
|
/* Miscellaneous declarations.
|
|
|
|
|
Copyright (C) 1995, 1996, 1997, 1998 Free Software Foundation, Inc.
|
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
This file is part of GNU Wget.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
1999-12-02 15:42:23 +08:00
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
1999-12-02 15:42:23 +08:00
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2001-05-28 03:35:15 +08:00
|
|
|
|
along with Wget; if not, write to the Free Software
|
2002-05-18 10:16:36 +08:00
|
|
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
|
|
|
|
|
|
In addition, as a special exception, the Free Software Foundation
|
|
|
|
|
gives permission to link the code of its release of Wget with the
|
|
|
|
|
OpenSSL project's "OpenSSL" library (or with modified versions of it
|
|
|
|
|
that use the same license as the "OpenSSL" library), and distribute
|
|
|
|
|
the linked executables. You must obey the GNU General Public License
|
|
|
|
|
in all respects for all of the code used other than "OpenSSL". If you
|
|
|
|
|
modify this file, you may extend this exception to your version of the
|
|
|
|
|
file, but you are not obligated to do so. If you do not wish to do
|
|
|
|
|
so, delete this exception statement from your version. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* This file contains some declarations that don't fit anywhere else.
   It also contains some useful includes, like the obnoxious TIME_H
   inclusion.  */
|
|
|
|
|
|
|
|
|
|
#ifndef WGET_H
|
|
|
|
|
#define WGET_H
|
|
|
|
|
|
2003-10-08 08:05:51 +08:00
|
|
|
|
/* Disable assertions when debug support is not compiled in.  NDEBUG
   must be defined before <assert.h> is included for this to take
   effect.  The extra !defined test avoids redefining NDEBUG when the
   build already supplies it (e.g. -DNDEBUG on the command line).  */
#if !defined ENABLE_DEBUG && !defined NDEBUG
# define NDEBUG
#endif
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2001-11-25 11:10:34 +08:00
|
|
|
|
/* Define this if you want primitive but extensive malloc debugging.
   It will make Wget extremely slow, so only do it in development
   builds.  It is left undefined here; change the #undef to a #define
   to turn it on.  */
#undef DEBUG_MALLOC
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* PARAMS wraps the parameter list of a function declaration so that
   one header serves compilers with and without prototype support.
   Use it with doubled parentheses:

     int foo PARAMS ((int, const char *));

   When PROTOTYPES evaluates to non-zero the list is kept as written;
   otherwise (including when PROTOTYPES is undefined) it collapses to
   an empty `()'.  A PARAMS definition supplied earlier is honored.  */
#ifndef PARAMS
# if PROTOTYPES
#  define PARAMS(args) args
# else
#  define PARAMS(args) ()
# endif
#endif
|
|
|
|
|
|
|
|
|
|
/* `gettext (FOO)' is long to write, so we use `_(FOO)'.  If NLS is
   unavailable, _(STRING) simply returns STRING.

   With HAVE_NLS defined, <libintl.h> is pulled in only when
   HAVE_LIBINTL_H is also defined.  */
#ifdef HAVE_NLS
# define _(string) gettext (string)
# ifdef HAVE_LIBINTL_H
#  include <libintl.h>
# endif /* HAVE_LIBINTL_H */
#else  /* not HAVE_NLS */
# define _(string) string
#endif /* not HAVE_NLS */
|
|
|
|
|
|
2003-10-02 03:59:48 +08:00
|
|
|
|
/* No-op version of gettext, used for constant strings.  It only marks
   STRING; the expansion is the bare literal, with no parentheses, so
   that N_ can be used to initialize character arrays and can take
   part in adjacent string-literal concatenation.  */
#define N_(string) string
|
|
|
|
|
|
2003-10-08 08:05:51 +08:00
|
|
|
|
/* I18N NOTE: You will notice that none of the DEBUGP messages are
   marked as translatable.  This is intentional, for a few reasons:

   1) The debug messages are not meant for the users to look at, but
   for the developers; as such, they should be considered more like
   source comments than real program output.

   2) The messages are numerous, and yet they are random and frivolous
   ("double yuck!" and such).  There would be a lot of work with no
   gain.

   3) Finally, the debug messages are meant to be a clue for me to
   debug problems with Wget.  If I get them in a language I don't
   understand, debugging will become a new challenge of its own!  */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* Include these, so random files need not include them. */
|
|
|
|
|
#include "sysdep.h"
|
|
|
|
|
#include "options.h"
|
2001-03-31 06:36:59 +08:00
|
|
|
|
/* locale independent replacement for ctype.h */
|
|
|
|
|
#include "safe-ctype.h"
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* A statement that does nothing.  The do/while form still demands a
   trailing semicolon and is safe as the body of an unbraced if/else.  */
#define DO_NOTHING do { } while (0)
|
|
|
|
|
|
|
|
|
|
/* Print X if debugging is enabled; a no-op otherwise.

   X is a complete, parenthesized argument list, so calls use doubled
   parentheses:

     DEBUGP (("read %d bytes\n", n));

   With ENABLE_DEBUG defined, X is handed to debug_logprintf when
   opt.debug is non-zero.  Without it, the macro expands to DO_NOTHING
   and X is discarded unevaluated.  */
#ifdef ENABLE_DEBUG
# define DEBUGP(x) do { if (opt.debug) { debug_logprintf x; } } while (0)
#else  /* not ENABLE_DEBUG */
# define DEBUGP(x) DO_NOTHING
#endif /* not ENABLE_DEBUG */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2003-10-31 22:31:56 +08:00
|
|
|
|
/* Everything uses this, so include them here directly. */
|
|
|
|
|
#include "xmalloc.h"
|
|
|
|
|
|
|
|
|
|
/* Likewise for logging functions. */
|
|
|
|
|
#include "log.h"
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* #### Find a better place for this.  */
/* The log file to which Wget writes after HUP.  */
#define DEFAULT_LOGFILE "wget-log"
|
|
|
|
|
|
|
|
|
|
/* Useful macros used across the code: */
|
|
|
|
|
|
2003-10-31 22:31:56 +08:00
|
|
|
|
/* The number of elements in an array.  For example:

   static char a[] = "foo";     -- countof(a) == 4 (for terminating \0)
   int a[5] = {1, 2};           -- countof(a) == 5
   char *a[] = {                -- countof(a) == 3
     "foo", "bar", "baz"
   };

   ARRAY must be a real array, not a pointer: for a pointer the
   division yields sizeof (pointer) / sizeof (element) instead.  */
#define countof(array) (sizeof (array) / sizeof ((array)[0]))
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2003-10-31 22:31:56 +08:00
|
|
|
|
/* Zero out a value.  X must be an lvalue (the macro takes its
   address); all sizeof (X) bytes of it are set to 0 with memset.  */
#define xzero(x) memset (&(x), '\0', sizeof ((x)))
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Convert an ASCII hex digit to the corresponding number between 0
   and 15.  X should be a hexadecimal digit that satisfies isxdigit;
   otherwise, the result is undefined.

   The argument is evaluated more than once, so it must not have side
   effects.  Letters are folded with TOUPPER before the conversion.  */
#define XDIGIT_TO_NUM(h) ((h) < 'A' ? (h) - '0' : TOUPPER (h) - 'A' + 10)

/* Combine two hex digits into one number: H1 is the high nibble and
   H2 the low nibble.  Both arguments follow the XDIGIT_TO_NUM rules.  */
#define X2DIGITS_TO_NUM(h1, h2) ((XDIGIT_TO_NUM (h1) << 4) + XDIGIT_TO_NUM (h2))
|
|
|
|
|
|
|
|
|
|
/* The reverse of XDIGIT_TO_NUM: convert a number in the [0, 16) range
   to the ASCII representation of the corresponding hex digit.  The
   `+ 0' is so you don't accidentally use it as an lvalue.

   XNUM_TO_DIGIT yields upper-case letters, XNUM_TO_digit lower-case
   ones.  X indexes a 16-character table directly, so values outside
   [0, 16) are not valid input.  */
#define XNUM_TO_DIGIT(x) ("0123456789ABCDEF"[x] + 0)
#define XNUM_TO_digit(x) ("0123456789abcdef"[x] + 0)
|
2003-10-07 08:47:08 +08:00
|
|
|
|
|
2001-04-09 06:25:24 +08:00
|
|
|
|
/* Copy the data delimited with BEG and END to alloca-allocated
   storage, and zero-terminate it.  Arguments are evaluated only once,
   in the order BEG, END, PLACE.

   PLACE must be an lvalue of type `char *'; it receives the address of
   the copy.  END - BEG bytes are copied, followed by a '\0'.  */
#define BOUNDED_TO_ALLOCA(beg, end, place) do {   \
  const char *BTA_beg = (beg);                    \
  int BTA_len = (end) - BTA_beg;                  \
  char **BTA_dest = &(place);                     \
  *BTA_dest = alloca (BTA_len + 1);               \
  memcpy (*BTA_dest, BTA_beg, BTA_len);           \
  (*BTA_dest)[BTA_len] = '\0';                    \
} while (0)
|
|
|
|
|
|
|
|
|
|
/* Return non-zero if string bounded between BEG and END is equal to
   STRING_LITERAL.  The comparison is case-sensitive.

   STRING_LITERAL must be an actual string literal (or char array),
   because its length is taken with sizeof.  BEG is evaluated more
   than once.  */
#define BOUNDED_EQUAL(beg, end, string_literal)         \
  ((end) - (beg) == sizeof (string_literal) - 1         \
   && !memcmp ((beg), (string_literal),                 \
               sizeof (string_literal) - 1))
|
|
|
|
|
|
|
|
|
|
/* Return non-zero if string bounded between BEG and END is equal to
   STRING_LITERAL, ignoring case (the comparison uses strncasecmp).

   STRING_LITERAL must be an actual string literal (or char array),
   because its length is taken with sizeof.  BEG is evaluated more
   than once.  */
#define BOUNDED_EQUAL_NO_CASE(beg, end, string_literal) \
  ((end) - (beg) == sizeof (string_literal) - 1         \
   && !strncasecmp ((beg), (string_literal),            \
                    sizeof (string_literal) - 1))
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Duplicate the zero-terminated string STR into alloca-allocated
   storage and store the address of the copy in PTR, which must be an
   lvalue of type `char *'.  Each argument is evaluated once.

   Note that this much more elegant definition cannot be used:

   #define STRDUP_ALLOCA(str) (strcpy ((char *)alloca (strlen (str) + 1), str))

   This is because some compilers don't handle alloca() as argument to
   function correctly.  Gcc on Intel platforms has been reported to
   offend in this case.  */
#define STRDUP_ALLOCA(ptr, str) do {                    \
  char **SA_dest = &(ptr);                              \
  const char *SA_src = (str);                           \
  *SA_dest = (char *)alloca (strlen (SA_src) + 1);      \
  strcpy (*SA_dest, SA_src);                            \
} while (0)
|
|
|
|
|
|
|
|
|
|
/* Generally useful if you want to avoid arbitrary size limits but
   don't need a full dynamic array.  Assumes that BASEVAR points to a
   malloced array of TYPE objects (or possibly a NULL pointer, if
   SIZEVAR is 0), with the total size stored in SIZEVAR.  This macro
   will realloc BASEVAR as necessary so that it can hold at least
   NEEDED_SIZE objects.  The reallocing is done by doubling, which
   ensures constant amortized time per element.

   BASEVAR and SIZEVAR must be lvalues; both are updated in place.
   The capacity never drops below 32 elements once grown, and nothing
   is reallocated when SIZEVAR already covers NEEDED_SIZE.
   NEEDED_SIZE is evaluated once.  */
#define DO_REALLOC(basevar, sizevar, needed_size, type) do {            \
  /* Prefixed names keep these locals from clashing with the caller's   \
     variables.  */                                                     \
  long do_realloc_needed_size = (needed_size);                          \
  long do_realloc_newsize = 0;                                          \
  while ((sizevar) < (do_realloc_needed_size)) {                        \
    do_realloc_newsize = 2*(sizevar);                                   \
    if (do_realloc_newsize < 32)                                        \
      do_realloc_newsize = 32;                                          \
    (sizevar) = do_realloc_newsize;                                     \
  }                                                                     \
  /* Non-zero only if the loop above had to grow the size.  */          \
  if (do_realloc_newsize)                                               \
    (basevar) = (type *)xrealloc ((basevar),                            \
                                  do_realloc_newsize * sizeof (type));  \
} while (0)
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Free FOO if it is non-NULL.  FOO is evaluated twice (once for the
   test, once for the xfree call), so it must not have side effects.
   The pointer itself is left unchanged.  */
#define FREE_MAYBE(foo) do { if (foo) xfree ((foo)); } while (0)
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* Declared here, defined elsewhere.  Presumably the name under which
   the program was invoked -- TODO confirm against the definition.  */
extern const char *exec_name;
|
|
|
|
|
|
2000-10-20 13:55:46 +08:00
|
|
|
|
/* Document type ("dt") flags.  Each constant is a distinct bit, so
   several of them can be OR-ed together in one integer.  */
enum
{
  TEXTHTML             = 0x0001,  /* document is of type text/html
                                     or application/xhtml+xml */
  RETROKF              = 0x0002,  /* retrieval was OK */
  HEAD_ONLY            = 0x0004,  /* only send the HEAD request */
  SEND_NOCACHE         = 0x0008,  /* send Pragma: no-cache directive */
  ACCEPTRANGES         = 0x0010,  /* Accept-ranges header was found */
  ADDED_HTML_EXTENSION = 0x0020   /* added ".html" extension due to -E */
};
|
|
|
|
|
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Universal error type -- used almost everywhere.  Error reporting of
   this detail is not generally used or needed and should be
   simplified.

   The constants are numbered implicitly, starting from 0 in the order
   listed, so inserting or reordering entries changes their values.  */
typedef enum
{
  NOCONERROR, HOSTERR, CONSOCKERR, CONERROR, CONSSLERR,
  CONIMPOSSIBLE, NEWLOCATION, NOTENOUGHMEM, CONPORTERR,
  BINDERR, BINDOK, LISTENERR, ACCEPTERR, ACCEPTOK,
  CONCLOSED, FTPOK, FTPLOGINC, FTPLOGREFUSED, FTPPORTERR,
  FTPNSFOD, FTPRETROK, FTPUNKNOWNTYPE, FTPRERR,
  FTPREXC, FTPSRVERR, FTPRETRINT, FTPRESTFAIL, URLERROR,
  FOPENERR, FWRITEERR, HOK, HLEXC, HEOF,
  HERR, RETROK, RECLEVELEXC, FTPACCDENIED, WRONGCODE,
  FTPINVPASV, FTPNOPASV,
  CONTNOTSUPPORTED, RETRUNNEEDED, RETRFINISHED, READERR, TRYLIMEXC,
  URLBADPATTERN, FILEBADFILE, RANGEERR, RETRBADPATTERN,
  RETNOTSUP, ROBOTSOK, NOROBOTS, PROXERR, AUTHFAILED,
  QUOTEXC, WRITEFAILED,
  SSLERRCERTFILE, SSLERRCERTKEY, SSLERRCTXCREATE
} uerr_t;
|
|
|
|
|
|
2003-10-31 22:31:56 +08:00
|
|
|
|
/* These are not used widely.  They should either be removed or used
   consistently.

   FALSE and TRUE are only defined when no earlier header has already
   provided them.  */
typedef unsigned char boolean;
#ifndef FALSE
# define FALSE 0
#endif
#ifndef TRUE
# define TRUE  1
#endif
|
|
|
|
|
|
2003-10-31 22:31:56 +08:00
|
|
|
|
/* For most options, 0 means no limits, but with -p in the picture,
   that causes a problem on the maximum recursion depth variable.  To
   retain backwards compatibility we allow users to consider "0" to be
   synonymous with "inf" for -l, but internally infinite recursion is
   specified by -1 and 0 means to only retrieve the requisites of a
   single document.

   The value is parenthesized so the macro behaves as a single operand
   inside any larger expression.  */
#define INFINITE_RECURSION (-1)
|
|
|
|
|
|
2003-10-30 07:13:25 +08:00
|
|
|
|
/* In case old systems don't have EAFNOSUPPORT, which we use below.
   On such systems it becomes an alias for EINVAL.  This relies on the
   system's errno definitions having been included before this
   point.  */
#ifndef EAFNOSUPPORT
# define EAFNOSUPPORT EINVAL
#endif
|
|
|
|
|
|
|
|
|
|
/* Map the errno value ERR to a uerr_t code.  The result is
   CONIMPOSSIBLE when ERR is EAFNOSUPPORT or EINVAL, or when ERR is
   ECONNREFUSED and opt.retry_connrefused is not set; in every other
   case it is CONERROR.  ERR may be evaluated up to three times, so it
   must not have side effects.  */
#define CONNECT_ERROR(err) (((err) == EAFNOSUPPORT              \
                             || (err) == EINVAL                 \
                             || ((err) == ECONNREFUSED          \
                                 && !opt.retry_connrefused))    \
                            ? CONIMPOSSIBLE : CONERROR)
|
2003-09-05 05:34:58 +08:00
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
#endif /* WGET_H */
|