1999-12-02 02:42:23 -05:00
|
|
|
/* Declarations for url.c.
|
2009-09-04 03:13:47 -04:00
|
|
|
Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
|
2015-03-09 11:32:01 -04:00
|
|
|
2005, 2006, 2007, 2008, 2009, 2010, 2011, 2015 Free Software
|
|
|
|
Foundation, Inc.
|
1999-12-02 02:42:23 -05:00
|
|
|
|
2001-05-27 15:35:15 -04:00
|
|
|
This file is part of GNU Wget.
|
1999-12-02 02:42:23 -05:00
|
|
|
|
2001-05-27 15:35:15 -04:00
|
|
|
GNU Wget is free software; you can redistribute it and/or modify
|
1999-12-02 02:42:23 -05:00
|
|
|
it under the terms of the GNU General Public License as published by
|
2007-07-10 01:53:22 -04:00
|
|
|
the Free Software Foundation; either version 3 of the License, or
|
1999-12-02 02:42:23 -05:00
|
|
|
(at your option) any later version.
|
|
|
|
|
2001-05-27 15:35:15 -04:00
|
|
|
GNU Wget is distributed in the hope that it will be useful,
|
1999-12-02 02:42:23 -05:00
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2007-07-10 01:53:22 -04:00
|
|
|
along with Wget. If not, see <http://www.gnu.org/licenses/>.
|
2002-05-17 22:16:36 -04:00
|
|
|
|
2007-11-28 03:05:33 -05:00
|
|
|
Additional permission under GNU GPL version 3 section 7
|
|
|
|
|
|
|
|
If you modify this program, or any covered work, by linking or
|
|
|
|
combining it with the OpenSSL project's OpenSSL library (or a
|
|
|
|
modified version of that library), containing parts covered by the
|
|
|
|
terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
|
|
|
|
grants you additional permission to convey the resulting work.
|
|
|
|
Corresponding Source for a non-source form of such a combination
|
|
|
|
shall include the source code for the parts of OpenSSL used as well
|
|
|
|
as that of the covered work. */
|
1999-12-02 02:42:23 -05:00
|
|
|
|
|
|
|
#ifndef URL_H
|
|
|
|
#define URL_H
|
|
|
|
|
2001-03-08 18:11:03 -05:00
|
|
|
/* Default port definitions */
|
|
|
|
#define DEFAULT_HTTP_PORT 80
|
|
|
|
#define DEFAULT_FTP_PORT 21
|
|
|
|
#define DEFAULT_HTTPS_PORT 443
|
|
|
|
|
2012-09-29 07:47:53 -04:00
|
|
|
/* This represents how many characters less than the OS max name length a file
|
|
|
|
* should be. More precisely, a file name should be at most
|
|
|
|
* (NAME_MAX - CHOMP_BUFFER) characters in length. This number was arrived at
|
|
|
|
* by adding the lengths of all possible strings that could be appended to a
|
|
|
|
* file name later in the code (e.g. ".orig", ".html", etc.). This is
|
|
|
|
* hopefully plenty of extra characters, but I am not guaranteeing that a file
|
|
|
|
* name will be of the proper length by the time the code wants to open a
|
|
|
|
* file descriptor. */
|
|
|
|
#define CHOMP_BUFFER 19
|
|
|
|
|
2013-07-10 14:59:34 -04:00
|
|
|
/* The flags that allow clobbering the file (opening with "wb").
|
|
|
|
Defined here to avoid repetition later. #### This will require
|
|
|
|
rework. */
|
|
|
|
#define ALLOW_CLOBBER (opt.noclobber || opt.always_rest || opt.timestamping \
|
|
|
|
|| opt.dirstruct || opt.output_document || opt.backups > 0)
|
|
|
|
|
2007-07-29 21:22:34 -04:00
|
|
|
/* Specifies how, or whether, user auth information should be included
|
|
|
|
* in URLs regenerated from URL parse structures. */
|
|
|
|
enum url_auth_mode {
|
|
|
|
URL_AUTH_SHOW,
|
|
|
|
URL_AUTH_HIDE_PASSWD,
|
|
|
|
URL_AUTH_HIDE
|
|
|
|
};
|
|
|
|
|
2001-11-21 19:24:28 -05:00
|
|
|
/* Note: the ordering here is related to the order of elements in
|
|
|
|
`supported_schemes' in url.c. */
|
|
|
|
|
2001-11-18 19:12:05 -05:00
|
|
|
enum url_scheme {
|
|
|
|
SCHEME_HTTP,
|
|
|
|
#ifdef HAVE_SSL
|
|
|
|
SCHEME_HTTPS,
|
|
|
|
#endif
|
|
|
|
SCHEME_FTP,
|
|
|
|
SCHEME_INVALID
|
|
|
|
};
|
2001-03-08 18:11:03 -05:00
|
|
|
|
1999-12-02 02:42:23 -05:00
|
|
|
/* Structure containing info on a URL. */
|
2001-11-21 19:24:28 -05:00
|
|
|
struct url
|
1999-12-02 02:42:23 -05:00
|
|
|
{
|
2014-05-26 05:51:58 -04:00
|
|
|
char *url; /* Original URL */
|
|
|
|
enum url_scheme scheme; /* URL scheme */
|
2001-11-18 19:12:05 -05:00
|
|
|
|
2014-05-26 05:51:58 -04:00
|
|
|
char *host; /* Extracted hostname */
|
|
|
|
int port; /* Port number */
|
2001-11-21 19:24:28 -05:00
|
|
|
|
|
|
|
/* URL components (URL-quoted). */
|
|
|
|
char *path;
|
|
|
|
char *params;
|
|
|
|
char *query;
|
|
|
|
char *fragment;
|
|
|
|
|
|
|
|
/* Extracted path info (unquoted). */
|
|
|
|
char *dir;
|
|
|
|
char *file;
|
|
|
|
|
|
|
|
/* Username and password (unquoted). */
|
|
|
|
char *user;
|
|
|
|
char *passwd;
|
2015-02-13 07:24:19 -05:00
|
|
|
|
|
|
|
/* 'host' is allocated by idna_to_ascii_8z() via idn_encode().
|
|
|
|
* Call 'idn_free()' to free this memory. */
|
|
|
|
bool idn_allocated;
|
1999-12-02 02:42:23 -05:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Function declarations */
|
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
char *url_escape (const char *);
|
2008-11-12 23:47:52 -05:00
|
|
|
char *url_escape_unsafe_and_reserved (const char *);
|
2014-02-14 09:44:51 -05:00
|
|
|
void url_unescape (char *);
|
2015-04-13 10:28:36 -04:00
|
|
|
void url_unescape_except_reserved (char *);
|
1999-12-02 02:42:23 -05:00
|
|
|
|
2008-09-27 05:13:21 -04:00
|
|
|
struct url *url_parse (const char *, int *, struct iri *iri, bool percent_encode);
|
2008-08-07 04:33:06 -04:00
|
|
|
char *url_error (const char *, int);
|
2005-06-19 18:34:58 -04:00
|
|
|
char *url_full_path (const struct url *);
|
|
|
|
void url_set_dir (struct url *, const char *);
|
|
|
|
void url_set_file (struct url *, const char *);
|
|
|
|
void url_free (struct url *);
|
2001-11-21 19:24:28 -05:00
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
enum url_scheme url_scheme (const char *);
|
2005-06-22 15:38:10 -04:00
|
|
|
bool url_has_scheme (const char *);
|
2010-03-02 15:41:32 -05:00
|
|
|
bool url_valid_scheme (const char *);
|
2005-06-19 18:34:58 -04:00
|
|
|
int scheme_default_port (enum url_scheme);
|
|
|
|
void scheme_disable (enum url_scheme);
|
2001-11-21 19:24:28 -05:00
|
|
|
|
2007-07-29 21:22:34 -04:00
|
|
|
char *url_string (const struct url *, enum url_auth_mode);
|
2010-09-24 08:07:58 -04:00
|
|
|
char *url_file_name (const struct url *, char *);
|
1999-12-02 02:42:23 -05:00
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
char *uri_merge (const char *, const char *);
|
2000-10-31 14:25:32 -05:00
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
int mkalldirs (const char *);
|
2000-03-02 01:33:48 -05:00
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
char *rewrite_shorthand_url (const char *);
|
2005-06-22 15:38:10 -04:00
|
|
|
bool schemes_are_similar_p (enum url_scheme a, enum url_scheme b);
|
2002-05-16 13:22:24 -04:00
|
|
|
|
2006-06-28 07:09:30 -04:00
|
|
|
bool are_urls_equal (const char *u1, const char *u2);
|
|
|
|
|
1999-12-02 02:42:23 -05:00
|
|
|
#endif /* URL_H */
|