1
0
mirror of https://github.com/moparisthebest/wget synced 2024-07-03 16:38:41 -04:00

Do not assume external links type to be always "text/html".

This commit is contained in:
Manfred Koizar 2010-10-18 10:55:16 +02:00 committed by Giuseppe Scrivano
parent 542c549985
commit cea1f0718d
2 changed files with 19 additions and 6 deletions

View File

@@ -1,3 +1,8 @@
2010-10-18 Manfred Koizar <mkoi-pg@aon.at> (tiny change)
* html-url.c (tag_handle_link): Do not assume external links type
to be always "text/html".
2010-10-16 Giuseppe Scrivano <gscrivano@gnu.org>
* connect.c (socket_ip_address): Initialize `sockaddr' to zero.

View File

@@ -164,6 +164,7 @@ static struct {
to the attributes not mentioned here. We add them manually. */
static const char *additional_attributes[] = {
"rel", /* used by tag_handle_link */
"type", /* used by tag_handle_link */
"http-equiv", /* used by tag_handle_meta */
"name", /* used by tag_handle_meta */
"content", /* used by tag_handle_meta */
@@ -526,14 +527,21 @@ tag_handle_link (int tagid, struct taginfo *tag, struct map_context *ctx)
{
up->link_inline_p = 1;
}
}
else
{
/* The external ones usually point to HTML pages, such as
<link rel="next" href="..."> */
<link rel="next" href="...">
except when the type attribute says otherwise:
<link rel="alternate" type="application/rss+xml" href=".../?feed=rss2" />
*/
char *type = find_attr (tag, "type", NULL);
if (!type || strcasecmp (type, "text/html") == 0)
up->link_expect_html = 1;
}
}
}
}
}
/* Handle the META tag. This requires special handling because of the
refresh feature and because of robot exclusion. */