1999-12-02 15:42:23 +08:00
|
|
|
|
/* Miscellaneous declarations.
|
|
|
|
|
Copyright (C) 1995, 1996, 1997, 1998 Free Software Foundation, Inc.
|
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
This file is part of GNU Wget.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
1999-12-02 15:42:23 +08:00
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
1999-12-02 15:42:23 +08:00
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2001-05-28 03:35:15 +08:00
|
|
|
|
along with Wget; if not, write to the Free Software
|
2002-05-18 10:16:36 +08:00
|
|
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
|
|
|
|
|
|
In addition, as a special exception, the Free Software Foundation
|
|
|
|
|
gives permission to link the code of its release of Wget with the
|
|
|
|
|
OpenSSL project's "OpenSSL" library (or with modified versions of it
|
|
|
|
|
that use the same license as the "OpenSSL" library), and distribute
|
|
|
|
|
the linked executables. You must obey the GNU General Public License
|
|
|
|
|
in all respects for all of the code used other than "OpenSSL". If you
|
|
|
|
|
modify this file, you may extend this exception to your version of the
|
|
|
|
|
file, but you are not obligated to do so. If you do not wish to do
|
|
|
|
|
so, delete this exception statement from your version. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* This file contains some declarations that don't fit anywhere else.
|
|
|
|
|
It also contains some useful includes, like the obnoxious TIME_H
|
|
|
|
|
inclusion. */
|
|
|
|
|
|
|
|
|
|
#ifndef WGET_H
|
|
|
|
|
#define WGET_H
|
|
|
|
|
|
|
|
|
|
/* Builds that do not define DEBUG get NDEBUG, which disables assert()
   in any <assert.h> included after this point.  */
#if !defined (DEBUG)
# define NDEBUG /* To kill off assertions */
#endif /* not DEBUG */
|
|
|
|
|
|
2001-11-25 11:10:34 +08:00
|
|
|
|
/* Define this if you want primitive but extensive malloc debugging.
|
|
|
|
|
It will make Wget extremely slow, so only do it in development
|
|
|
|
|
builds. */
|
|
|
|
|
/* Left undefined here, so the `#ifndef DEBUG_MALLOC' branch further
   down (xmalloc -> xmalloc_real and friends) is the one compiled.  */
#undef DEBUG_MALLOC
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* PARAMS wraps a prototype's parameter list: with PROTOTYPES set the
   list is kept, otherwise it collapses to an old-style `()'.  An
   already-defined PARAMS is left untouched.  */
#if !defined (PARAMS)
# if !PROTOTYPES
#  define PARAMS(args) ()
# else
#  define PARAMS(args) args
# endif
#endif
|
|
|
|
|
|
|
|
|
|
/* `gettext (FOO)' is long to write, so we use `_(FOO)'. If NLS is
|
|
|
|
|
unavailable, _(STRING) simply returns STRING. */
|
|
|
|
|
#ifndef HAVE_NLS
/* No NLS: _(STRING) is just STRING.  */
# define _(string) string
#else /* HAVE_NLS */
/* NLS available: route the string through gettext.  */
# define _(string) gettext (string)
# ifdef HAVE_LIBINTL_H
#  include <libintl.h>
# endif /* HAVE_LIBINTL_H */
#endif /* HAVE_NLS */
|
|
|
|
|
|
2003-10-02 03:59:48 +08:00
|
|
|
|
/* No-op version of gettext, used for constant strings. */
|
|
|
|
|
/* N_(STRING) expands to the bare STRING, without enclosing
   parentheses, so that it remains a valid ISO C initializer for
   character arrays, e.g. `static const char msg[] = N_("text");'.  */
#define N_(string) string
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* I18N NOTE: You will notice that none of the DEBUG messages are
|
|
|
|
|
marked as translatable. This is intentional, for a few reasons:
|
|
|
|
|
|
|
|
|
|
1) The debug messages are not meant for the users to look at, but
|
|
|
|
|
for the developers; as such, they should be considered more like
|
|
|
|
|
source comments than real program output.
|
|
|
|
|
|
|
|
|
|
2) The messages are numerous, and yet they are random and frivolous
|
|
|
|
|
("double yuck!" and such). There would be a lot of work with no
|
|
|
|
|
gain.
|
|
|
|
|
|
|
|
|
|
3) Finally, the debug messages are meant to be a clue for me to
|
|
|
|
|
debug problems with Wget. If I get them in a language I don't
|
2001-11-25 11:10:34 +08:00
|
|
|
|
understand, debugging will become a new challenge of its own! */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* Include these, so random files need not include them. */
|
|
|
|
|
#include "sysdep.h"
|
|
|
|
|
#include "options.h"
|
2001-03-31 06:36:59 +08:00
|
|
|
|
/* locale independent replacement for ctype.h */
|
|
|
|
|
#include "safe-ctype.h"
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* An empty statement that still requires a trailing semicolon, so it
   can stand in for the body of a statement-like macro.  */
#define DO_NOTHING do { /* nothing */ } while (0)
|
|
|
|
|
|
|
|
|
|
/* Print X if debugging is enabled; a no-op otherwise. */
|
|
|
|
|
#ifndef DEBUG
/* Debugging support compiled out: DEBUGP (x) expands to a no-op.  */
# define DEBUGP(x) DO_NOTHING
#else /* DEBUG */
/* X is a parenthesized argument list handed to debug_logprintf, and
   only when opt.debug is set at run time.  */
# define DEBUGP(x) do { if (opt.debug) { debug_logprintf x; } } while (0)
#endif /* DEBUG */
|
|
|
|
|
|
|
|
|
|
/* Make gcc check for the format of logmsg() and debug_logmsg(). */
|
|
|
|
|
#ifndef __GNUC__
/* Other compilers: the annotation expands to nothing.  */
# define GCC_FORMAT_ATTR(a, b)
#else /* __GNUC__ */
/* A is the index of the format-string parameter, B the index of the
   first variadic argument checked against it.  */
# define GCC_FORMAT_ATTR(a, b) __attribute__ ((__format__ (__printf__, a, b)))
#endif /* __GNUC__ */
|
|
|
|
|
|
|
|
|
|
/* These are from log.c, but they are used everywhere, so we declare
|
|
|
|
|
them here. */
|
|
|
|
|
enum log_options
{
  LOG_VERBOSE,
  LOG_NOTQUIET,
  LOG_NONVERBOSE,
  LOG_ALWAYS
};
|
|
|
|
|
|
2000-11-05 06:49:46 +08:00
|
|
|
|
#ifndef HAVE_STDARG_H
/* Without <stdarg.h> only old-style declarations can be given.  */
void logprintf ();
void debug_logprintf ();
#else /* HAVE_STDARG_H */
/* printf-like loggers; GCC_FORMAT_ATTR lets gcc check the format
   string against the variadic arguments.  */
void logprintf PARAMS ((enum log_options, const char *, ...))
     GCC_FORMAT_ATTR (2, 3);
void debug_logprintf PARAMS ((const char *, ...))
     GCC_FORMAT_ATTR (1, 2);
#endif /* HAVE_STDARG_H */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Remaining declarations of the logging interface from log.c.  */
void logputs PARAMS ((enum log_options, const char *));
void logflush PARAMS ((void));
void log_set_flush PARAMS ((int));
int log_set_save_context PARAMS ((int));
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* Defined in `utils.c', but used literally everywhere. */
|
2000-11-23 06:15:45 +08:00
|
|
|
|
#ifndef DEBUG_MALLOC
|
|
|
|
|
|
|
|
|
|
#define xmalloc xmalloc_real
|
|
|
|
|
#define xrealloc xrealloc_real
|
|
|
|
|
#define xstrdup xstrdup_real
|
2000-12-11 10:17:44 +08:00
|
|
|
|
#define xfree free
|
2000-11-23 06:15:45 +08:00
|
|
|
|
|
|
|
|
|
void *xmalloc_real PARAMS ((size_t));
|
|
|
|
|
void *xrealloc_real PARAMS ((void *, size_t));
|
|
|
|
|
char *xstrdup_real PARAMS ((const char *));
|
|
|
|
|
|
|
|
|
|
#else /* DEBUG_MALLOC */
|
|
|
|
|
|
|
|
|
|
#define xmalloc(s) xmalloc_debug (s, __FILE__, __LINE__)
|
|
|
|
|
#define xfree(p) xfree_debug (p, __FILE__, __LINE__)
|
|
|
|
|
#define xrealloc(p, s) xrealloc_debug (p, s, __FILE__, __LINE__)
|
|
|
|
|
#define xstrdup(p) xstrdup_debug (p, __FILE__, __LINE__)
|
|
|
|
|
|
|
|
|
|
void *xmalloc_debug PARAMS ((size_t, const char *, int));
|
|
|
|
|
void xfree_debug PARAMS ((void *, const char *, int));
|
|
|
|
|
void *xrealloc_debug PARAMS ((void *, size_t, const char *, int));
|
|
|
|
|
char *xstrdup_debug PARAMS ((const char *, const char *, int));
|
|
|
|
|
|
|
|
|
|
#endif /* DEBUG_MALLOC */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* #### Find a better place for this. */
|
|
|
|
|
/* The log file that Wget writes to after HUP.  */
|
|
|
|
|
/* A bare file name with no directory component.  */
#define DEFAULT_LOGFILE "wget-log"
|
|
|
|
|
|
|
|
|
|
/* NOTE(review): presumably the size in bytes of a raw MD5 digest
   (128 bits) -- confirm against the users of this constant.  */
#define MD5_HASHLEN 16
|
|
|
|
|
|
|
|
|
|
/* Useful macros used across the code: */
|
|
|
|
|
|
|
|
|
|
/* Does the string consist of a single hyphen?  */
|
|
|
|
|
/* True iff X is exactly the one-character string "-".  X is evaluated
   more than once.  */
#define HYPHENP(x) ((x)[0] == '-' && (x)[1] == '\0')
|
|
|
|
|
|
|
|
|
|
/* The smaller value of the two. */
|
|
|
|
|
/* Yields X when X is strictly smaller than Y, otherwise Y.  Each
   argument may be evaluated twice, so avoid side effects.  */
#define MINVAL(x, y) ((y) > (x) ? (x) : (y))
|
|
|
|
|
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Convert an ASCII hex digit to the corresponding number between 0
|
|
|
|
|
and 15. X should be a hexadecimal digit that satisfies isxdigit;
|
|
|
|
|
otherwise, the result is undefined. */
|
|
|
|
|
/* Characters at or above 'A' are treated as letters (folded to upper
   case with TOUPPER); anything below is treated as a decimal digit.
   X is evaluated more than once.  */
#define XDIGIT_TO_NUM(x) ((x) >= 'A' ? TOUPPER (x) - 'A' + 10 : (x) - '0')
|
|
|
|
|
|
|
|
|
|
/* Convert a sequence of ASCII hex digits X and Y to a number between
|
|
|
|
|
0 and 255. Uses XDIGIT_TO_NUM for conversion of individual
|
|
|
|
|
digits. */
|
|
|
|
|
/* H1 is the high nibble and H2 the low nibble of the result.  */
#define X2DIGITS_TO_NUM(h1, h2) (XDIGIT_TO_NUM (h1) * 16 + XDIGIT_TO_NUM (h2))
|
|
|
|
|
|
|
|
|
|
/* The reverse of the above: convert a number in the [0, 16) range to
|
|
|
|
|
its ASCII representation in hex. The A-F characters are in upper
|
2003-09-16 01:50:43 +08:00
|
|
|
|
case. */
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Table lookup; X must lie in [0, 16).  */
#define XNUM_TO_DIGIT(x) (*("0123456789ABCDEF" + (x)))
|
2003-09-16 01:50:43 +08:00
|
|
|
|
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Like XNUM_TO_DIGIT, but generates lower-case characters. */
|
|
|
|
|
/* Table lookup; X must lie in [0, 16).  */
#define XNUM_TO_digit(x) (*("0123456789abcdef" + (x)))
|
2003-09-16 01:50:43 +08:00
|
|
|
|
|
|
|
|
|
/* Returns the number of elements in an array with fixed
|
|
|
|
|
initialization. For example:
|
|
|
|
|
|
|
|
|
|
static char a[] = "foo"; -- countof(a) == 4 (for terminating \0)
|
|
|
|
|
|
|
|
|
|
int a[5] = {1, 2}; -- countof(a) == 5
|
|
|
|
|
|
2003-10-07 08:47:08 +08:00
|
|
|
|
char *a[] = { -- countof(a) == 3
|
2003-09-16 01:50:43 +08:00
|
|
|
|
"foo", "bar", "baz"
|
2003-10-07 08:47:08 +08:00
|
|
|
|
}; */
|
2003-09-16 01:50:43 +08:00
|
|
|
|
/* Only meaningful for true arrays; a pointer argument gives a
   meaningless result.  */
#define countof(array) (sizeof (array) / sizeof ((array)[0]))
|
|
|
|
|
|
2003-10-07 08:47:08 +08:00
|
|
|
|
/* Allocate an array of SIZE objects of TYPE with alloca.  */
#define alloca_array(type, size) ((type *) alloca (sizeof (type) * (size)))
|
|
|
|
|
|
2001-04-09 06:25:24 +08:00
|
|
|
|
/* Copy the data delimited with BEG and END to alloca-allocated
|
2003-09-19 22:08:37 +08:00
|
|
|
|
storage, and zero-terminate it. Arguments are evaluated only once,
|
|
|
|
|
in the order BEG, END, PLACE. */
|
2001-04-09 06:25:24 +08:00
|
|
|
|
#define BOUNDED_TO_ALLOCA(beg, end, place) do {		\
  /* Capture BEG, END and PLACE once each, in that order.  */	\
  const char *BTA_src = (beg);				\
  int BTA_nbytes = (end) - BTA_src;			\
  char **BTA_out = &(place);				\
  /* One extra byte for the terminating NUL.  */	\
  *BTA_out = alloca (BTA_nbytes + 1);			\
  memcpy (*BTA_out, BTA_src, BTA_nbytes);		\
  *(*BTA_out + BTA_nbytes) = '\0';			\
} while (0)
|
|
|
|
|
|
|
|
|
|
/* Return non-zero if string bounded between BEG and END is equal to
|
|
|
|
|
STRING_LITERAL. The comparison is case-sensitive. */
|
|
|
|
|
/* The lengths are compared first, so memcmp only runs when they
   match.  STRING_LITERAL must be an actual literal (or array), since
   its length is taken with sizeof.  */
#define BOUNDED_EQUAL(beg, end, string_literal)				\
  (sizeof (string_literal) - 1 == (end) - (beg)				\
   && memcmp ((beg), (string_literal), sizeof (string_literal) - 1) == 0)
|
|
|
|
|
|
|
|
|
|
/* The same as above, except the comparison is case-insensitive. */
|
|
|
|
|
/* The lengths are compared first, so strncasecmp only runs when they
   match.  STRING_LITERAL must be an actual literal (or array), since
   its length is taken with sizeof.  */
#define BOUNDED_EQUAL_NO_CASE(beg, end, string_literal)			\
  (sizeof (string_literal) - 1 == (end) - (beg)				\
   && strncasecmp ((beg), (string_literal),				\
		   sizeof (string_literal) - 1) == 0)
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Note that this much more elegant definition cannot be used:
|
|
|
|
|
|
|
|
|
|
#define STRDUP_ALLOCA(str) (strcpy ((char *)alloca (strlen (str) + 1), str))
|
|
|
|
|
|
|
|
|
|
This is because some compilers don't handle alloca() as argument to
|
|
|
|
|
function correctly. Gcc under Intel has been reported to offend in
|
|
|
|
|
this case. */
|
|
|
|
|
|
|
|
|
|
/* Copy the NUL-terminated string STR into alloca-allocated storage
   and store the address of the copy in PTR.

   STR is captured in a local and therefore evaluated exactly once.
   The same string is then both measured with strlen and copied with
   strcpy, even when the argument has side effects.  PTR must be an
   assignable `char *' expression; it is evaluated twice.

   The alloca result is assigned to PTR rather than passed directly
   as a function argument, which some compilers mishandle.  */
#define STRDUP_ALLOCA(ptr, str) do {			\
  const char *SA_src = (str);				\
  (ptr) = (char *)alloca (strlen (SA_src) + 1);		\
  strcpy ((ptr), SA_src);				\
} while (0)
|
|
|
|
|
|
|
|
|
|
/* Generally useful if you want to avoid arbitrary size limits but
|
|
|
|
|
don't need a full dynamic array. Assumes that BASEVAR points to a
|
|
|
|
|
malloced array of TYPE objects (or possibly a NULL pointer, if
|
|
|
|
|
SIZEVAR is 0), with the total size stored in SIZEVAR. This macro
|
|
|
|
|
will realloc BASEVAR as necessary so that it can hold at least
|
|
|
|
|
NEEDED_SIZE objects. The reallocing is done by doubling, which
|
|
|
|
|
ensures constant amortized time per element. */
|
2003-10-03 06:20:44 +08:00
|
|
|
|
#define DO_REALLOC(basevar, sizevar, needed_size, type) do		\
{									\
  /* Evaluate NEEDED_SIZE once; SIZEVAR and BASEVAR are lvalues	\
     and are read and written repeatedly.  */				\
  long DR_wanted = (needed_size);					\
  long DR_grown = 0;	/* stays 0 when no growth is needed */		\
  while ((sizevar) < (DR_wanted))					\
    {									\
      /* Double the size, but never go below 32 elements.  */		\
      DR_grown = 2*(sizevar);						\
      if (DR_grown < 32)						\
	DR_grown = 32;							\
      (sizevar) = DR_grown;						\
    }									\
  if (DR_grown != 0)							\
    basevar = (type *)xrealloc (basevar, DR_grown * sizeof (type));	\
} while (0)
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Free FOO if it is non-NULL. */
|
2000-11-23 00:58:28 +08:00
|
|
|
|
/* xfree is only called for a non-null FOO.  FOO is evaluated twice.  */
#define FREE_MAYBE(foo) do { if ((foo) != 0) xfree (foo); } while (0)
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
|
|
/* Declaration only; the definition lives in another file.
   NOTE(review): presumably the name Wget was invoked under -- confirm
   at the definition.  */
extern const char *exec_name;
|
|
|
|
|
|
2000-10-20 13:55:46 +08:00
|
|
|
|
/* Document type ("dt") flags */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* Each flag occupies its own bit, so flags can be OR-ed together.  */
enum
{
  TEXTHTML             = 1 << 0, /* document is of type text/html
				    or application/xhtml+xml */
  RETROKF              = 1 << 1, /* retrieval was OK */
  HEAD_ONLY            = 1 << 2, /* only send the HEAD request */
  SEND_NOCACHE         = 1 << 3, /* send Pragma: no-cache directive */
  ACCEPTRANGES         = 1 << 4, /* Accept-ranges header was found */
  ADDED_HTML_EXTENSION = 1 << 5  /* added ".html" extension due to -E */
};
|
|
|
|
|
|
2003-09-19 22:08:37 +08:00
|
|
|
|
/* Universal error type -- used almost everywhere. Error reporting of
|
|
|
|
|
this detail is not generally used or needed and should be
|
|
|
|
|
simplified. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
/* The numeric values follow declaration order, starting at 0; add new
   codes only at the end to keep existing values stable.  */
typedef enum
{
  NOCONERROR = 0, HOSTERR, CONSOCKERR, CONERROR,
  CONSSLERR, CONREFUSED, NEWLOCATION, NOTENOUGHMEM,
  CONPORTERR, BINDERR, BINDOK, LISTENERR,
  ACCEPTERR, ACCEPTOK, CONCLOSED, FTPOK,
  FTPLOGINC, FTPLOGREFUSED, FTPPORTERR, FTPNSFOD,
  FTPRETROK, FTPUNKNOWNTYPE, FTPRERR, FTPREXC,
  FTPSRVERR, FTPRETRINT, FTPRESTFAIL, URLERROR,
  FOPENERR, FWRITEERR, HOK, HLEXC,
  HEOF, HERR, RETROK, RECLEVELEXC,
  FTPACCDENIED, WRONGCODE, FTPINVPASV, FTPNOPASV,
  CONTNOTSUPPORTED, RETRUNNEEDED, RETRFINISHED, READERR,
  TRYLIMEXC, URLBADPATTERN, FILEBADFILE, RANGEERR,
  RETRBADPATTERN, RETNOTSUP, ROBOTSOK, NOROBOTS,
  PROXERR, AUTHFAILED, QUOTEXC, WRITEFAILED,
  SSLERRCERTFILE, SSLERRCERTKEY, SSLERRCTXCREATE
} uerr_t;
|
|
|
|
|
|
2000-03-02 14:33:48 +08:00
|
|
|
|
/* Small truth-value type with its two constants.  FALSE and TRUE are
   only defined here if nothing has defined them already.  */
typedef unsigned char boolean;

#if !defined (FALSE)
# define FALSE 0
#endif
#if !defined (TRUE)
# define TRUE 1
#endif
|
|
|
|
|
|
2000-03-11 14:48:06 +08:00
|
|
|
|
/* So we can say strcmp(a, b) == EQ rather than strcmp(a, b) == 0 or
|
|
|
|
|
the really awful !strcmp(a, b). */
|
|
|
|
|
/* The value strcmp-style comparison functions return when their
   operands compare equal.  */
#define EQ 0
|
|
|
|
|
|
2000-08-30 19:26:21 +08:00
|
|
|
|
/* For most options, 0 means no limits, but with -p in the picture, that causes
|
|
|
|
|
a problem on the maximum recursion depth variable. To retain backwards
|
|
|
|
|
compatibility we allow users to consider "0" to be synonymous with "inf" for
|
|
|
|
|
-l, but internally infinite recursion is specified by -1 and 0 means to only
|
|
|
|
|
retrieve the requisites of a single document. */
|
|
|
|
|
/* Internal "no depth limit" value.  The expansion is parenthesized so
   the macro always behaves as a single operand, whatever expression
   it is pasted into.  */
#define INFINITE_RECURSION (-1)
|
|
|
|
|
|
2003-09-05 05:34:58 +08:00
|
|
|
|
/* Map the errno-style value X of a failed connect to a uerr_t code:
   CONREFUSED only for ECONNREFUSED while opt.retry_connrefused is
   off, CONERROR in every other case.  */
#define CONNECT_ERROR(x) (((x) != ECONNREFUSED || opt.retry_connrefused)	\
			  ? CONERROR : CONREFUSED)
|
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
|
#endif /* WGET_H */
|