1999-12-02 15:42:23 +08:00
|
|
|
/* Declarations for url.c.
|
|
|
|
Copyright (C) 1995, 1996, 1997 Free Software Foundation, Inc.
|
|
|
|
|
|
|
|
This file is part of Wget.
|
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
|
|
|
|
|
|
|
|
#ifndef URL_H
|
|
|
|
#define URL_H
|
|
|
|
|
|
|
|
/* If the string contains unsafe characters, duplicate it with
|
|
|
|
encode_string, otherwise just copy it with strdup. */
|
|
|
|
#define CLEANDUP(x) (contains_unsafe (x) ? encode_string (x) : xstrdup (x))
|
|
|
|
|
|
|
|
/* Structure containing info on a URL. */
|
|
|
|
struct urlinfo
|
|
|
|
{
|
|
|
|
char *url; /* Unchanged URL */
|
|
|
|
uerr_t proto; /* URL protocol */
|
|
|
|
char *host; /* Extracted hostname */
|
|
|
|
unsigned short port;
|
|
|
|
char ftp_type;
|
2000-03-02 22:16:12 +08:00
|
|
|
char *path, *dir, *file, *qstring;
|
|
|
|
/* Path, dir, file, and query string
|
1999-12-02 15:42:23 +08:00
|
|
|
(properly decoded) */
|
|
|
|
char *user, *passwd; /* Username and password */
|
|
|
|
struct urlinfo *proxy; /* The exact string to pass to proxy
|
|
|
|
server */
|
|
|
|
char *referer; /* The source from which the request
|
|
|
|
URI was obtained */
|
|
|
|
char *local; /* The local filename of the URL
|
|
|
|
document */
|
|
|
|
};
|
|
|
|
|
2000-11-21 10:06:36 +08:00
|
|
|
enum convert_options {
|
|
|
|
CO_NOCONVERT = 0, /* don't convert this URL */
|
|
|
|
CO_CONVERT_TO_RELATIVE, /* convert to relative, e.g. to
|
|
|
|
"../../otherdir/foo.gif" */
|
|
|
|
CO_CONVERT_TO_COMPLETE /* convert to absolute, e.g. to
|
|
|
|
"http://orighost/somedir/bar.jpg". */
|
1999-12-02 15:42:23 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/* A structure that defines the whereabouts of a URL, i.e. its
|
|
|
|
position in an HTML document, etc. */
|
2000-11-21 10:06:36 +08:00
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
typedef struct _urlpos
|
|
|
|
{
|
2000-11-21 10:06:36 +08:00
|
|
|
char *url; /* linked URL, after it has been
|
|
|
|
merged with the base */
|
|
|
|
char *local_name; /* Local file to which it was saved */
|
|
|
|
|
|
|
|
/* Information about the original link: */
|
|
|
|
int link_relative_p; /* was the link relative? */
|
|
|
|
int link_complete_p; /* was the link complete (with the
|
|
|
|
host name, etc.) */
|
|
|
|
|
|
|
|
/* Conversion requirements: */
|
|
|
|
enum convert_options convert; /* is conversion required? */
|
|
|
|
|
|
|
|
/* URL's position in the buffer. */
|
|
|
|
int pos, size;
|
|
|
|
|
|
|
|
struct _urlpos *next; /* Next struct in list */
|
1999-12-02 15:42:23 +08:00
|
|
|
} urlpos;
|
|
|
|
|
2000-10-20 13:55:46 +08:00
|
|
|
/* downloaded_file() takes a parameter of this type and returns this type. */
|
2000-03-02 14:33:48 +08:00
|
|
|
typedef enum
|
|
|
|
{
|
2000-10-20 13:55:46 +08:00
|
|
|
/* Return enumerators: */
|
|
|
|
FILE_NOT_ALREADY_DOWNLOADED = 0,
|
|
|
|
|
|
|
|
/* Return / parameter enumerators: */
|
|
|
|
FILE_DOWNLOADED_NORMALLY,
|
|
|
|
FILE_DOWNLOADED_AND_HTML_EXTENSION_ADDED,
|
|
|
|
|
|
|
|
/* Parameter enumerators: */
|
2000-03-02 14:33:48 +08:00
|
|
|
CHECK_FOR_FILE
|
|
|
|
} downloaded_file_t;
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
/* Function declarations */
|
|
|
|
|
|
|
|
int skip_url PARAMS ((const char *));
|
|
|
|
|
|
|
|
int contains_unsafe PARAMS ((const char *));
|
|
|
|
char *encode_string PARAMS ((const char *));
|
|
|
|
|
|
|
|
struct urlinfo *newurl PARAMS ((void));
|
|
|
|
void freeurl PARAMS ((struct urlinfo *, int));
|
|
|
|
uerr_t urlproto PARAMS ((const char *));
|
|
|
|
int skip_proto PARAMS ((const char *));
|
2000-11-20 04:50:10 +08:00
|
|
|
int has_proto PARAMS ((const char *));
|
1999-12-02 15:42:23 +08:00
|
|
|
int skip_uname PARAMS ((const char *));
|
|
|
|
|
|
|
|
uerr_t parseurl PARAMS ((const char *, struct urlinfo *, int));
|
|
|
|
char *str_url PARAMS ((const struct urlinfo *, int));
|
|
|
|
int url_equal PARAMS ((const char *, const char *));
|
|
|
|
|
|
|
|
urlpos *get_urls_file PARAMS ((const char *));
|
2000-11-20 04:50:10 +08:00
|
|
|
urlpos *get_urls_html PARAMS ((const char *, const char *, int, int *));
|
1999-12-02 15:42:23 +08:00
|
|
|
void free_urlpos PARAMS ((urlpos *));
|
|
|
|
|
2000-11-01 03:25:32 +08:00
|
|
|
char *url_concat PARAMS ((const char *, const char *));
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
void rotate_backups PARAMS ((const char *));
|
|
|
|
int mkalldirs PARAMS ((const char *));
|
|
|
|
char *url_filename PARAMS ((const struct urlinfo *));
|
|
|
|
void opt_url PARAMS ((struct urlinfo *));
|
|
|
|
|
|
|
|
char *getproxy PARAMS ((uerr_t));
|
|
|
|
int no_proxy_match PARAMS ((const char *, const char **));
|
|
|
|
|
|
|
|
void convert_links PARAMS ((const char *, urlpos *));
|
|
|
|
urlpos *add_url PARAMS ((urlpos *, const char *, const char *));
|
|
|
|
|
2000-10-20 13:55:46 +08:00
|
|
|
downloaded_file_t downloaded_file PARAMS ((downloaded_file_t, const char *));
|
2000-03-02 14:33:48 +08:00
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
#endif /* URL_H */
|