/* Declarations for html-parse.c.
   Copyright (C) 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006,
   2007, 2008, 2009, 2010 Free Software Foundation, Inc.

This file is part of GNU Wget.

GNU Wget is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.

GNU Wget is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Wget. If not, see <http://www.gnu.org/licenses/>.

Additional permission under GNU GPL version 3 section 7

If you modify this program, or any covered work, by linking or
combining it with the OpenSSL project's OpenSSL library (or a
modified version of that library), containing parts covered by the
terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
grants you additional permission to convey the resulting work.
Corresponding Source for a non-source form of such a combination
shall include the source code for the parts of OpenSSL used as well
as that of the covered work. */

/* Include guard: the matching #endif is at the end of this header, so
   including the header more than once is harmless. */
#ifndef HTML_PARSE_H
#define HTML_PARSE_H

/* A single attribute, stored as a name/value pair together with the
   location of the value's raw text. */
struct attr_pair {
  char *name;                   /* attribute name */
  char *value;                  /* attribute value */

  /* Needed for URL conversion; the places where the value begins and
     ends, including the quotes and everything. */
  const char *value_raw_beginning;
  int value_raw_size;

  /* Used internally by map_html_tags. */
  int name_pool_index;
  int value_pool_index;
};

/* Description of one tag: its name, whether it is an end-tag, its
   attributes, and pointers delimiting the tag and its contents. */
struct taginfo {
  char *name;                   /* tag name */
  int end_tag_p;                /* whether this is an end-tag */
  int nattrs;                   /* number of attributes */
  struct attr_pair *attrs;      /* attributes */

  const char *start_position;   /* start position of tag */
  const char *end_position;     /* end position of tag */

  const char *contents_begin;   /* delimiters of tag contents */
  const char *contents_end;     /* only valid if end_tag_p */
};

/* Forward declaration: this header only passes pointers to
   struct hash_table, so the complete type is not required here. */
struct hash_table;

/* Flags for map_html_tags: */

/* Use strict comment interpretation. */
#define MHT_STRICT_COMMENTS 1

/* Trim attribute values, e.g. interpret <a href=" foo "> as "foo". */
#define MHT_TRIM_VALUES 2

/* Prototype only; per this header's title the definition lives in
   html-parse.c.  The third argument is a callback that receives a
   struct taginfo pointer and a void pointer.
   NOTE(review): the parameters are unnamed here; presumably the lone
   trailing int carries the MHT_* flags -- confirm against
   html-parse.c before relying on it. */
void map_html_tags (const char *, int,
                    void (*) (struct taginfo *, void *), void *, int,
                    const struct hash_table *, const struct hash_table *);

#endif /* HTML_PARSE_H */