1999-12-02 15:42:23 +08:00
|
|
|
/* Declarations for url.c.
|
2009-09-04 15:13:47 +08:00
|
|
|
Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
|
2011-01-01 20:19:37 +08:00
|
|
|
2005, 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation,
|
|
|
|
Inc.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
This file is part of GNU Wget.
|
1999-12-02 15:42:23 +08:00
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
1999-12-02 15:42:23 +08:00
|
|
|
it under the terms of the GNU General Public License as published by
|
2007-07-10 13:53:22 +08:00
|
|
|
the Free Software Foundation; either version 3 of the License, or
|
1999-12-02 15:42:23 +08:00
|
|
|
(at your option) any later version.
|
|
|
|
|
2001-05-28 03:35:15 +08:00
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
1999-12-02 15:42:23 +08:00
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2007-07-10 13:53:22 +08:00
|
|
|
along with Wget. If not, see <http://www.gnu.org/licenses/>.
|
2002-05-18 10:16:36 +08:00
|
|
|
|
2007-11-28 16:05:33 +08:00
|
|
|
Additional permission under GNU GPL version 3 section 7
|
|
|
|
|
|
|
|
If you modify this program, or any covered work, by linking or
|
|
|
|
combining it with the OpenSSL project's OpenSSL library (or a
|
|
|
|
modified version of that library), containing parts covered by the
|
|
|
|
terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
|
|
|
|
grants you additional permission to convey the resulting work.
|
|
|
|
Corresponding Source for a non-source form of such a combination
|
|
|
|
shall include the source code for the parts of OpenSSL used as well
|
|
|
|
as that of the covered work. */
|
1999-12-02 15:42:23 +08:00
|
|
|
|
|
|
|
#ifndef URL_H
|
|
|
|
#define URL_H
|
|
|
|
|
2001-03-09 07:11:03 +08:00
|
|
|
/* Default port definitions */
|
|
|
|
#define DEFAULT_HTTP_PORT 80
|
|
|
|
#define DEFAULT_FTP_PORT 21
|
|
|
|
#define DEFAULT_HTTPS_PORT 443
|
|
|
|
|
2012-09-29 19:47:53 +08:00
|
|
|
/* This represents how many characters less than the OS max name length a file
|
|
|
|
* should be. More precisely, a file name should be at most
|
|
|
|
* (NAME_MAX - CHOMP_BUFFER) characters in length. This number was arrived at
|
|
|
|
* by adding the lengths of all possible strings that could be appended to a
|
|
|
|
* file name later in the code (e.g. ".orig", ".html", etc.). This is
|
|
|
|
* hopefully plenty of extra characters, but I am not guaranteeing that a file
|
|
|
|
* name will be of the proper length by the time the code wants to open a
|
|
|
|
* file descriptor. */
|
|
|
|
#define CHOMP_BUFFER 19
|
|
|
|
|
2007-07-30 09:22:34 +08:00
|
|
|
/* Specifies how, or whether, user auth information should be included
|
|
|
|
* in URLs regenerated from URL parse structures. */
|
|
|
|
enum url_auth_mode {
|
|
|
|
URL_AUTH_SHOW,
|
|
|
|
URL_AUTH_HIDE_PASSWD,
|
|
|
|
URL_AUTH_HIDE
|
|
|
|
};
|
|
|
|
|
2001-11-22 08:24:28 +08:00
|
|
|
/* Note: the ordering here is related to the order of elements in
|
|
|
|
`supported_schemes' in url.c. */
|
|
|
|
|
2001-11-19 08:12:05 +08:00
|
|
|
enum url_scheme {
|
|
|
|
SCHEME_HTTP,
|
|
|
|
#ifdef HAVE_SSL
|
|
|
|
SCHEME_HTTPS,
|
|
|
|
#endif
|
|
|
|
SCHEME_FTP,
|
|
|
|
SCHEME_INVALID
|
|
|
|
};
|
2001-03-09 07:11:03 +08:00
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
/* Structure containing info on a URL. */
|
2001-11-22 08:24:28 +08:00
|
|
|
struct url
|
1999-12-02 15:42:23 +08:00
|
|
|
{
|
2001-11-22 08:24:28 +08:00
|
|
|
char *url; /* Original URL */
|
2001-11-19 08:12:05 +08:00
|
|
|
enum url_scheme scheme; /* URL scheme */
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
char *host; /* Extracted hostname */
|
2001-11-22 08:24:28 +08:00
|
|
|
int port; /* Port number */
|
|
|
|
|
|
|
|
/* URL components (URL-quoted). */
|
|
|
|
char *path;
|
|
|
|
char *params;
|
|
|
|
char *query;
|
|
|
|
char *fragment;
|
|
|
|
|
|
|
|
/* Extracted path info (unquoted). */
|
|
|
|
char *dir;
|
|
|
|
char *file;
|
|
|
|
|
|
|
|
/* Username and password (unquoted). */
|
|
|
|
char *user;
|
|
|
|
char *passwd;
|
1999-12-02 15:42:23 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Function declarations */
|
|
|
|
|
2005-06-20 06:34:58 +08:00
|
|
|
char *url_escape (const char *);
|
2008-11-13 12:47:52 +08:00
|
|
|
char *url_escape_unsafe_and_reserved (const char *);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
2008-09-27 17:13:21 +08:00
|
|
|
struct url *url_parse (const char *, int *, struct iri *iri, bool percent_encode);
|
2008-08-07 16:33:06 +08:00
|
|
|
char *url_error (const char *, int);
|
2005-06-20 06:34:58 +08:00
|
|
|
char *url_full_path (const struct url *);
|
|
|
|
void url_set_dir (struct url *, const char *);
|
|
|
|
void url_set_file (struct url *, const char *);
|
|
|
|
void url_free (struct url *);
|
2001-11-22 08:24:28 +08:00
|
|
|
|
2005-06-20 06:34:58 +08:00
|
|
|
enum url_scheme url_scheme (const char *);
|
2005-06-23 03:38:10 +08:00
|
|
|
bool url_has_scheme (const char *);
|
2010-03-03 04:41:32 +08:00
|
|
|
bool url_valid_scheme (const char *);
|
2005-06-20 06:34:58 +08:00
|
|
|
int scheme_default_port (enum url_scheme);
|
|
|
|
void scheme_disable (enum url_scheme);
|
2001-11-22 08:24:28 +08:00
|
|
|
|
2007-07-30 09:22:34 +08:00
|
|
|
char *url_string (const struct url *, enum url_auth_mode);
|
2010-09-24 20:07:58 +08:00
|
|
|
char *url_file_name (const struct url *, char *);
|
1999-12-02 15:42:23 +08:00
|
|
|
|
2005-06-20 06:34:58 +08:00
|
|
|
char *uri_merge (const char *, const char *);
|
2000-11-01 03:25:32 +08:00
|
|
|
|
2005-06-20 06:34:58 +08:00
|
|
|
int mkalldirs (const char *);
|
2000-03-02 14:33:48 +08:00
|
|
|
|
2005-06-20 06:34:58 +08:00
|
|
|
char *rewrite_shorthand_url (const char *);
|
2005-06-23 03:38:10 +08:00
|
|
|
bool schemes_are_similar_p (enum url_scheme a, enum url_scheme b);
|
2002-05-17 01:22:24 +08:00
|
|
|
|
2006-06-28 19:09:30 +08:00
|
|
|
bool are_urls_equal (const char *u1, const char *u2);
|
|
|
|
|
1999-12-02 15:42:23 +08:00
|
|
|
#endif /* URL_H */
|