/* Declarations for html-url.c.
   Copyright (C) 1995, 1996, 1997, 2009, 2010, 2011 Free Software
   Foundation, Inc.

This file is part of GNU Wget.

GNU Wget is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at
your option) any later version.

GNU Wget is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Wget. If not, see <http://www.gnu.org/licenses/>.

Additional permission under GNU GPL version 3 section 7

If you modify this program, or any covered work, by linking or
combining it with the OpenSSL project's OpenSSL library (or a
modified version of that library), containing parts covered by the
terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
grants you additional permission to convey the resulting work.
Corresponding Source for a non-source form of such a combination
shall include the source code for the parts of OpenSSL used as well
as that of the covered work. */
|
2008-04-22 03:15:48 -04:00
|
|
|
|
|
|
|
#ifndef HTML_URL_H
|
|
|
|
#define HTML_URL_H
|
|
|
|
|
|
|
|
/* Context describing one HTML document together with the list of URLs
   that is being built from it.  Only the field layout is declared
   here; who allocates and frees the pointed-to data is not visible in
   this header.  */
struct map_context {
  char *text;                   /* HTML text.  */
  char *base;                   /* Base URI of the document, possibly
                                   changed through <base href=...>.  */
  const char *parent_base;      /* Base of the current document.  */
  const char *document_file;    /* File name of this document.  */
  bool nofollow;                /* Whether NOFOLLOW was specified in a
                                   <meta name=robots> tag.  */

  struct urlpos *head;          /* List of URLs that is being built.  */
};
|
|
|
|
|
|
|
|
/* Forward declarations.  Only pointers to these structures are used in
   the prototypes below, so incomplete types are sufficient.  Declaring
   them at file scope keeps the tags from acquiring prototype scope
   when this header is read before the headers that define them.  */
struct urlpos;
struct iri;
struct map_context;

/* Entry points that produce a `struct urlpos' list.  The definitions
   are not part of this header.
   NOTE(review): per the file banner they presumably live in
   html-url.c; the meaning of each unnamed argument should be confirmed
   there before relying on it.  */
struct urlpos *get_urls_file (const char *);
struct urlpos *get_urls_html (const char *, const char *, bool *, struct iri *);

/* Takes a string, two integers and the map context.
   NOTE(review): presumably appends one URL to the list held in the
   context's `head' field and returns the new entry -- confirm.  */
struct urlpos *append_url (const char *, int, int, struct map_context *);

/* NOTE(review): presumably releases a list returned by the functions
   above -- confirm against the definition.  */
void free_urlpos (struct urlpos *);

/* Takes no arguments and returns nothing.
   NOTE(review): presumably module-level cleanup -- confirm.  */
void cleanup_html_url (void);
|
2008-04-22 03:15:48 -04:00
|
|
|
|
|
|
|
#endif /* HTML_URL_H */
|