/* Declarations for html-parse.c.
   Copyright (C) 1998 Free Software Foundation, Inc.

This file is part of GNU Wget.

GNU Wget is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.

GNU Wget is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Wget; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

In addition, as a special exception, the Free Software Foundation
gives permission to link the code of its release of Wget with the
OpenSSL project's "OpenSSL" library (or with modified versions of it
that use the same license as the "OpenSSL" library), and distribute
the linked executables. You must obey the GNU General Public License
in all respects for all of the code used other than "OpenSSL". If you
modify this file, you may extend this exception to your version of the
file, but you are not obligated to do so. If you do not wish to do
so, delete this exception statement from your version. */
|
2000-11-19 15:50:10 -05:00
|
|
|
|
2001-11-29 13:55:52 -05:00
|
|
|
#ifndef HTML_PARSE_H
|
|
|
|
#define HTML_PARSE_H
|
|
|
|
|
2000-11-19 15:50:10 -05:00
|
|
|
/* A single attribute: its name and value, plus the bookkeeping that
   goes with them. */
struct attr_pair {
  char *name;                   /* attribute name */
  char *value;                  /* attribute value */

  /* Needed for URL conversion; the places where the value begins and
     ends, including the quotes and everything. */
  const char *value_raw_beginning;
  int value_raw_size;

  /* Used internally by map_html_tags. */
  int name_pool_index;
  int value_pool_index;
};
|
|
|
|
|
|
|
|
/* A single tag: its name, whether it is an end-tag, its attributes,
   and the positions where the tag starts and ends. */
struct taginfo {
  char *name;                   /* tag name */
  int end_tag_p;                /* whether this is an end-tag */
  int nattrs;                   /* number of attributes */
  struct attr_pair *attrs;      /* attributes (presumably NATTRS
                                   entries -- confirm in html-parse.c) */

  const char *start_position;   /* start position of tag */
  const char *end_position;     /* end position of tag */
};
|
|
|
|
|
2003-10-09 11:01:58 -04:00
|
|
|
/* Forward declaration: the prototype in this header refers to struct
   hash_table only through pointers, so the tag alone is enough. */
struct hash_table;
|
|
|
|
|
2003-10-08 12:17:33 -04:00
|
|
|
/* Flags for map_html_tags.  The values are distinct bits. */
#define MHT_STRICT_COMMENTS 1   /* use strict comment interpretation */
#define MHT_TRIM_VALUES     2   /* trim attribute values, e.g. interpret
                                   <a href=" foo "> as "foo" */
|
|
|
|
|
2005-06-19 18:34:58 -04:00
|
|
|
/* Declaration of map_html_tags, which is defined in html-parse.c.

   NOTE(review): this header fixes only the parameter types.  The
   parameter names below are descriptive labels and the roles they
   suggest should be confirmed against the definition:
     - TEXT, SIZE: presumably the text to process and its length;
     - MAPFUN, MAPARG: a callback taking a struct taginfo * and a
       void *, plus presumably the pointer handed to it;
     - FLAGS: presumably a combination of the MHT_* flags;
     - ALLOWED_TAGS, ALLOWED_ATTRIBUTES: read-only hash tables whose
       exact meaning is not visible from this header. */
void map_html_tags (const char *text, int size,
                    void (*mapfun) (struct taginfo *, void *), void *maparg,
                    int flags,
                    const struct hash_table *allowed_tags,
                    const struct hash_table *allowed_attributes);
|
2001-11-29 13:55:52 -05:00
|
|
|
|
|
|
|
#endif /* HTML_PARSE_H */
|