mirror of
https://github.com/moparisthebest/wget
synced 2024-07-03 16:38:41 -04:00
[svn] Remove redirection cycle detection.
Published in <sxs7kpzhcwa.fsf@florida.arsdigita.de>.
This commit is contained in:
parent
f2bb99d102
commit
6c4c785cc2
@ -1,3 +1,11 @@
|
|||||||
|
2002-01-30 Hrvoje Niksic <hniksic@arsdigita.com>
|
||||||
|
|
||||||
|
* retr.c (retrieve_url): Remove redirection cycle detection. This
|
||||||
|
is because some sites legitimately redirect the user back to the
|
||||||
|
same location, e.g. after an authorization check performed by
|
||||||
|
another page. MAX_REDIRECTIONS is still used to prevent infinite
|
||||||
|
redirection loops.
|
||||||
|
|
||||||
2002-01-26 Hrvoje Niksic <hniksic@arsdigita.com>
|
2002-01-26 Hrvoje Niksic <hniksic@arsdigita.com>
|
||||||
|
|
||||||
* http.c (gethttp): Wrap host name in square brackets if it
|
* http.c (gethttp): Wrap host name in square brackets if it
|
||||||
|
71
src/retr.c
71
src/retr.c
@ -274,26 +274,6 @@ calc_rate (long bytes, long msecs, int *units)
|
|||||||
return dlrate;
|
return dlrate;
|
||||||
}
|
}
|
||||||
|
|
||||||
static int
|
|
||||||
register_redirections_mapper (void *key, void *value, void *arg)
|
|
||||||
{
|
|
||||||
const char *redirected_from = (const char *)key;
|
|
||||||
const char *redirected_to = (const char *)arg;
|
|
||||||
if (0 != strcmp (redirected_from, redirected_to))
|
|
||||||
register_redirection (redirected_from, redirected_to);
|
|
||||||
return 0;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Register the redirections that lead to the successful download of
|
|
||||||
this URL. This is necessary so that the link converter can convert
|
|
||||||
redirected URLs to the local file. */
|
|
||||||
|
|
||||||
static void
|
|
||||||
register_all_redirections (struct hash_table *redirections, const char *final)
|
|
||||||
{
|
|
||||||
hash_table_map (redirections, register_redirections_mapper, (void *)final);
|
|
||||||
}
|
|
||||||
|
|
||||||
#define USE_PROXY_P(u) (opt.use_proxy && getproxy((u)->scheme) \
|
#define USE_PROXY_P(u) (opt.use_proxy && getproxy((u)->scheme) \
|
||||||
&& no_proxy_match((u)->host, \
|
&& no_proxy_match((u)->host, \
|
||||||
(const char **)opt.no_proxy))
|
(const char **)opt.no_proxy))
|
||||||
@ -320,7 +300,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
struct url *u;
|
struct url *u;
|
||||||
int up_error_code; /* url parse error code */
|
int up_error_code; /* url parse error code */
|
||||||
char *local_file;
|
char *local_file;
|
||||||
struct hash_table *redirections = NULL;
|
|
||||||
int redirection_count = 0;
|
int redirection_count = 0;
|
||||||
|
|
||||||
/* If dt is NULL, just ignore it. */
|
/* If dt is NULL, just ignore it. */
|
||||||
@ -336,8 +315,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
if (!u)
|
if (!u)
|
||||||
{
|
{
|
||||||
logprintf (LOG_NOTQUIET, "%s: %s.\n", url, url_error (up_error_code));
|
logprintf (LOG_NOTQUIET, "%s: %s.\n", url, url_error (up_error_code));
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
return URLERROR;
|
return URLERROR;
|
||||||
}
|
}
|
||||||
@ -362,8 +339,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
{
|
{
|
||||||
logputs (LOG_NOTQUIET, _("Could not find proxy host.\n"));
|
logputs (LOG_NOTQUIET, _("Could not find proxy host.\n"));
|
||||||
url_free (u);
|
url_free (u);
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
return PROXERR;
|
return PROXERR;
|
||||||
}
|
}
|
||||||
@ -374,8 +349,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
{
|
{
|
||||||
logprintf (LOG_NOTQUIET, _("Error parsing proxy URL %s: %s.\n"),
|
logprintf (LOG_NOTQUIET, _("Error parsing proxy URL %s: %s.\n"),
|
||||||
proxy, url_error (up_error_code));
|
proxy, url_error (up_error_code));
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
return PROXERR;
|
return PROXERR;
|
||||||
}
|
}
|
||||||
@ -383,8 +356,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
{
|
{
|
||||||
logprintf (LOG_NOTQUIET, _("Error in proxy URL %s: Must be HTTP.\n"), proxy);
|
logprintf (LOG_NOTQUIET, _("Error in proxy URL %s: Must be HTTP.\n"), proxy);
|
||||||
url_free (proxy_url);
|
url_free (proxy_url);
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
return PROXERR;
|
return PROXERR;
|
||||||
}
|
}
|
||||||
@ -406,7 +377,7 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
retrieval, so we save recursion to oldrec, and restore it
|
retrieval, so we save recursion to oldrec, and restore it
|
||||||
later. */
|
later. */
|
||||||
int oldrec = opt.recursive;
|
int oldrec = opt.recursive;
|
||||||
if (redirections)
|
if (redirection_count)
|
||||||
opt.recursive = 0;
|
opt.recursive = 0;
|
||||||
result = ftp_loop (u, dt);
|
result = ftp_loop (u, dt);
|
||||||
opt.recursive = oldrec;
|
opt.recursive = oldrec;
|
||||||
@ -415,7 +386,7 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
FTP. In these cases we must decide whether the text is HTML
|
FTP. In these cases we must decide whether the text is HTML
|
||||||
according to the suffix. The HTML suffixes are `.html' and
|
according to the suffix. The HTML suffixes are `.html' and
|
||||||
`.htm', case-insensitive. */
|
`.htm', case-insensitive. */
|
||||||
if (redirections && local_file && u->scheme == SCHEME_FTP)
|
if (redirection_count && local_file && u->scheme == SCHEME_FTP)
|
||||||
{
|
{
|
||||||
char *suf = suffix (local_file);
|
char *suf = suffix (local_file);
|
||||||
if (suf && (!strcasecmp (suf, "html") || !strcasecmp (suf, "htm")))
|
if (suf && (!strcasecmp (suf, "html") || !strcasecmp (suf, "htm")))
|
||||||
@ -448,8 +419,6 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
logprintf (LOG_NOTQUIET, "%s: %s.\n", mynewloc,
|
logprintf (LOG_NOTQUIET, "%s: %s.\n", mynewloc,
|
||||||
url_error (up_error_code));
|
url_error (up_error_code));
|
||||||
url_free (u);
|
url_free (u);
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
xfree (mynewloc);
|
xfree (mynewloc);
|
||||||
return result;
|
return result;
|
||||||
@ -461,45 +430,18 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
xfree (mynewloc);
|
xfree (mynewloc);
|
||||||
mynewloc = xstrdup (newloc_parsed->url);
|
mynewloc = xstrdup (newloc_parsed->url);
|
||||||
|
|
||||||
if (!redirections)
|
/* Check for max. number of redirections. */
|
||||||
{
|
|
||||||
redirections = make_string_hash_table (0);
|
|
||||||
/* Add current URL immediately so we can detect it as soon
|
|
||||||
as possible in case of a cycle. */
|
|
||||||
string_set_add (redirections, u->url);
|
|
||||||
}
|
|
||||||
|
|
||||||
/* The new location is OK. Check for max. number of
|
|
||||||
redirections. */
|
|
||||||
if (++redirection_count > MAX_REDIRECTIONS)
|
if (++redirection_count > MAX_REDIRECTIONS)
|
||||||
{
|
{
|
||||||
logprintf (LOG_NOTQUIET, _("%d redirections exceeded.\n"),
|
logprintf (LOG_NOTQUIET, _("%d redirections exceeded.\n"),
|
||||||
MAX_REDIRECTIONS);
|
MAX_REDIRECTIONS);
|
||||||
url_free (newloc_parsed);
|
url_free (newloc_parsed);
|
||||||
url_free (u);
|
url_free (u);
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
xfree (mynewloc);
|
xfree (mynewloc);
|
||||||
return WRONGCODE;
|
return WRONGCODE;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*Check for redirection cycle by
|
|
||||||
peeking through the history of redirections. */
|
|
||||||
if (string_set_contains (redirections, newloc_parsed->url))
|
|
||||||
{
|
|
||||||
logprintf (LOG_NOTQUIET, _("%s: Redirection cycle detected.\n"),
|
|
||||||
mynewloc);
|
|
||||||
url_free (newloc_parsed);
|
|
||||||
url_free (u);
|
|
||||||
if (redirections)
|
|
||||||
string_set_free (redirections);
|
|
||||||
xfree (url);
|
|
||||||
xfree (mynewloc);
|
|
||||||
return WRONGCODE;
|
|
||||||
}
|
|
||||||
string_set_add (redirections, newloc_parsed->url);
|
|
||||||
|
|
||||||
xfree (url);
|
xfree (url);
|
||||||
url = mynewloc;
|
url = mynewloc;
|
||||||
url_free (u);
|
url_free (u);
|
||||||
@ -512,8 +454,8 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
if (*dt & RETROKF)
|
if (*dt & RETROKF)
|
||||||
{
|
{
|
||||||
register_download (u->url, local_file);
|
register_download (u->url, local_file);
|
||||||
if (redirections)
|
if (redirection_count && 0 != strcmp (origurl, u->url))
|
||||||
register_all_redirections (redirections, u->url);
|
register_redirection (origurl, u->url);
|
||||||
if (*dt & TEXTHTML)
|
if (*dt & TEXTHTML)
|
||||||
register_html (u->url, local_file);
|
register_html (u->url, local_file);
|
||||||
}
|
}
|
||||||
@ -526,9 +468,8 @@ retrieve_url (const char *origurl, char **file, char **newloc,
|
|||||||
|
|
||||||
url_free (u);
|
url_free (u);
|
||||||
|
|
||||||
if (redirections)
|
if (redirection_count)
|
||||||
{
|
{
|
||||||
string_set_free (redirections);
|
|
||||||
if (newloc)
|
if (newloc)
|
||||||
*newloc = url;
|
*newloc = url;
|
||||||
else
|
else
|
||||||
|
Loading…
Reference in New Issue
Block a user