1
0
mirror of https://github.com/moparisthebest/wget synced 2024-07-03 16:38:41 -04:00
wget/src/ftp.c

1970 lines
53 KiB
C
Raw Normal View History

1999-12-02 02:42:23 -05:00
/* File Transfer Protocol support.
2001-05-27 15:35:15 -04:00
Copyright (C) 1995, 1996, 1997, 1998, 2000, 2001
Free Software Foundation, Inc.
1999-12-02 02:42:23 -05:00
2001-05-27 15:35:15 -04:00
This file is part of GNU Wget.
1999-12-02 02:42:23 -05:00
2001-05-27 15:35:15 -04:00
GNU Wget is free software; you can redistribute it and/or modify
1999-12-02 02:42:23 -05:00
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
2001-05-27 15:35:15 -04:00
GNU Wget is distributed in the hope that it will be useful,
1999-12-02 02:42:23 -05:00
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
2001-05-27 15:35:15 -04:00
along with Wget; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
In addition, as a special exception, the Free Software Foundation
gives permission to link the code of its release of Wget with the
OpenSSL project's "OpenSSL" library (or with modified versions of it
that use the same license as the "OpenSSL" library), and distribute
the linked executables. You must obey the GNU General Public License
in all respects for all of the code used other than "OpenSSL". If you
modify this file, you may extend this exception to your version of the
file, but you are not obligated to do so. If you do not wish to do
so, delete this exception statement from your version. */
1999-12-02 02:42:23 -05:00
#include <config.h>
#include <stdio.h>
#include <stdlib.h>
#ifdef HAVE_STRING_H
# include <string.h>
#else
# include <strings.h>
#endif
#ifdef HAVE_UNISTD_H
# include <unistd.h>
#endif
#include <sys/types.h>
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include "wget.h"
#include "utils.h"
#include "url.h"
#include "rbuf.h"
#include "retr.h"
#include "ftp.h"
#include "connect.h"
#include "host.h"
#include "netrc.h"
#include "convert.h" /* for downloaded_file */
1999-12-02 02:42:23 -05:00
#ifndef errno
extern int errno;
#endif
extern LARGE_INT total_downloaded_bytes;
1999-12-02 02:42:23 -05:00
/* File where the "ls -al" listing will be saved. */
#define LIST_FILENAME ".listing"
extern char ftp_last_respline[];
/* Per-session FTP state that is handed to getftp() and updated by
   ftp_loop_internal() between attempts, so that an already
   established control connection can be reused. */
typedef struct
{
int st; /* connection status bits; this file tests and sets
           ON_YOUR_OWN and DONE_CWD here */
int cmd; /* command bits telling getftp() what to do (DO_LOGIN,
            DO_CWD, DO_RETR, DO_LIST, LEAVE_PENDING, NO_TRUNCATE) */
struct rbuf rbuf; /* control connection buffer; getftp() takes the
                     control socket from it when DO_LOGIN is not set */
double dltime; /* time of the download in msecs; reset to 0 by
                  getftp() and filled in by get_contents() */
enum stype rs; /* remote system reported by ftp server (set via
                  ftp_syst) */
char *id; /* initial directory, as returned by ftp_pwd; "/" is
             assumed when the server does not support PWD */
char *target; /* target file name (local file the data is written to) */
struct url *proxy; /* FTWK-style proxy; when non-NULL, getftp()
                      connects to this host and logs in as
                      user@target-host */
} ccon;
1999-12-02 02:42:23 -05:00
/* Look for regexp "( *[0-9]+ *byte" (literal parenthesis) anywhere in
   the string S, and return the number converted to long, if found, 0
   otherwise.

   S is a server response line and therefore untrusted: a digit run
   too large to fit in a long is treated as "no match" for that
   parenthesized group (the search then continues with the next
   group) instead of being accumulated past LONG_MAX, which would be
   signed overflow, i.e. undefined behavior.  */
static long
ftp_expected_bytes (const char *s)
{
  long res;

  while (1)
    {
      int overflow = 0;

      /* Advance to the next opening parenthesis.  */
      while (*s && *s != '(')
        ++s;
      if (!*s)
        return 0;
      /* Skip the parenthesis itself and any whitespace following it.  */
      for (++s; *s && ISSPACE (*s); s++)
        ;
      if (!*s)
        return 0;
      if (!ISDIGIT (*s))
        continue;
      /* Accumulate the decimal number, refusing to step past LONG_MAX.
         The remaining digits are still consumed so that the scan
         position ends up where it would have without the check.  */
      res = 0;
      do
        {
          int digit = *s - '0';
          if (res > (LONG_MAX - digit) / 10)
            overflow = 1;
          else
            res = digit + 10 * res;
          ++s;
        }
      while (*s && ISDIGIT (*s));
      if (!*s)
        return 0;
      while (*s && ISSPACE (*s))
        ++s;
      if (!*s)
        return 0;
      if (overflow)
        continue;
      /* Cheap first-character test before the full comparison.  */
      if (TOLOWER (*s) != 'b')
        continue;
      if (strncasecmp (s, "byte", 4))
        continue;
      else
        break;
    }
  return res;
}
2003-10-29 13:23:56 -05:00
#ifdef ENABLE_IPV6
/* Return the address family (sa_family) of the peer that the
   connected socket FD is talking to.  FD must be non-negative.  The
   process is aborted if getpeername() fails.  */
static int
getfamily (int fd)
{
  struct sockaddr_storage peer;
  socklen_t peer_len = sizeof (peer);

  assert (fd >= 0);

  /* Mauro Tortonesi: HOW DO WE HANDLE THIS ERROR? */
  if (getpeername (fd, (struct sockaddr *) &peer, &peer_len) < 0)
    abort ();

  return ((struct sockaddr *) &peer)->sa_family;
}
/*
 * Set up a passive data connection with the FTP server reached
 * through RBUF, storing the address and port to connect to in ADDR
 * and PORT.  This is a thin dispatcher over ftp_epsv, ftp_lpsv and
 * ftp_pasv: an IPv6 control connection tries EPSV first and falls
 * back to LPSV when EPSV yields FTPNOPASV; an IPv4 control connection
 * simply issues the good old PASV.  The status of the last command
 * attempted is returned.
 */
static uerr_t
ftp_do_pasv (struct rbuf *rbuf, ip_address *addr, int *port)
{
  uerr_t result;
  int af = getfamily (rbuf->fd);

  assert (af == AF_INET || af == AF_INET6);

  if (af != AF_INET6)
    {
      /* IPv4 control connection: plain PASV. */
      if (!opt.server_response)
        logputs (LOG_VERBOSE, "==> PASV ... ");
      return ftp_pasv (rbuf, addr, port);
    }

  /* IPv6 control connection: EPSV first ... */
  if (!opt.server_response)
    logputs (LOG_VERBOSE, "==> EPSV ... ");
  result = ftp_epsv (rbuf, addr, port);
  if (result != FTPNOPASV)
    return result;

  /* ... and LPSV if EPSV is not supported. */
  if (!opt.server_response)
    logputs (LOG_VERBOSE, "==> LPSV ... ");
  return ftp_lpsv (rbuf, addr, port);
}
/*
* This function sets up an active data connection with the FTP server.
* It is merely a wrapper around ftp_eprt, ftp_lprt and ftp_port.
*/
static uerr_t
ftp_do_port (struct rbuf *rbuf, int *local_sock)
2003-10-29 13:23:56 -05:00
{
uerr_t err;
int family;
assert (rbuf != NULL);
assert (rbuf_initialized_p (rbuf));
family = getfamily (rbuf->fd);
assert (family == AF_INET || family == AF_INET6);
/* If our control connection is over IPv6, then we first try EPRT and then
* LPRT if the former is not supported. If the control connection is over
* IPv4, we simply issue the good old PORT request. */
if (family == AF_INET6)
{
if (!opt.server_response)
logputs (LOG_VERBOSE, "==> EPRT ... ");
err = ftp_eprt (rbuf, local_sock);
2003-10-29 13:23:56 -05:00
/* If EPRT is not supported try LPRT */
if (err == FTPPORTERR)
{
if (!opt.server_response)
logputs (LOG_VERBOSE, "==> LPRT ... ");
err = ftp_lprt (rbuf, local_sock);
2003-10-29 13:23:56 -05:00
}
}
else
{
if (!opt.server_response)
logputs (LOG_VERBOSE, "==> PORT ... ");
err = ftp_port (rbuf, local_sock);
2003-10-29 13:23:56 -05:00
}
return err;
}
#else
/* Build without IPv6 support: a passive data connection is always
   requested with PASV.  The command is announced on the verbose log
   unless raw server responses are being printed.  */
static uerr_t
ftp_do_pasv (struct rbuf *rbuf, ip_address *addr, int *port)
{
  uerr_t status;

  if (!opt.server_response)
    logputs (LOG_VERBOSE, "==> PASV ... ");
  status = ftp_pasv (rbuf, addr, port);
  return status;
}
/* Build without IPv6 support: an active data connection is always
   requested with PORT.  The command is announced on the verbose log
   unless raw server responses are being printed.  */
static uerr_t
ftp_do_port (struct rbuf *rbuf, int *local_sock)
{
  uerr_t status;

  if (!opt.server_response)
    logputs (LOG_VERBOSE, "==> PORT ... ");
  status = ftp_port (rbuf, local_sock);
  return status;
}
2003-10-29 13:23:56 -05:00
#endif
1999-12-02 02:42:23 -05:00
/* Retrieves a file with denoted parameters through opening an FTP
   connection to the server.  It always closes the data connection,
   and closes the control connection in case of error.

   U describes the remote file; CON carries the control connection
   state and the command bits (CON->cmd) that select which steps are
   performed: DO_LOGIN (connect and log in), DO_CWD (change to
   U->dir), and either DO_RETR (fetch U->file) or DO_LIST (fetch a
   directory listing) -- never both.  The data is written to
   CON->target, or to opt.dfp when that is set and this is not a
   listing.

   *LEN is the expected length if known (0 otherwise); it is passed on
   to ftp_size and get_contents, which may update it.  RESTVAL, when
   non-zero, is the offset at which to restart the download (REST).

   Returns RETRFINISHED on success, FTPRETRINT when the transfer was
   interrupted or its outcome is uncertain, or the error code of the
   step that failed.  */
static uerr_t
getftp (struct url *u, long *len, long restval, ccon *con)
{
  int csock, dtsock, local_sock, res;
  uerr_t err;
  FILE *fp;
  char *user, *passwd, *respline;
  char *tms, *tmrate;
  int cmd;
  int pasv_mode_open = 0;
  long expected_bytes = 0L;

  assert (con != NULL);
  assert (con->target != NULL);

  /* Read the command bits only after CON has been checked, so that
     the assertion above is actually able to catch a NULL CON.  */
  cmd = con->cmd;

  /* Debug-check of the sanity of the request by making sure that LIST
     and RETR are never both requested (since we can handle only one
     at a time).  */
  assert (!((cmd & DO_LIST) && (cmd & DO_RETR)));
  /* Make sure that at least *something* is requested.  */
  assert ((cmd & (DO_LIST | DO_CWD | DO_RETR | DO_LOGIN)) != 0);

  user = u->user;
  passwd = u->passwd;
  search_netrc (u->host, (const char **)&user, (const char **)&passwd, 1);
  user = user ? user : opt.ftp_acc;
  passwd = passwd ? passwd : opt.ftp_pass;
  assert (user && passwd);

  dtsock = -1;
  local_sock = -1;
  con->dltime = 0;

  if (!(cmd & DO_LOGIN))
    csock = RBUF_FD (&con->rbuf);
  else				/* cmd & DO_LOGIN */
    {
      char type_char;
      char *host = con->proxy ? con->proxy->host : u->host;
      int port = con->proxy ? con->proxy->port : u->port;
      char *logname = user;

      if (con->proxy)
	{
	  /* If proxy is in use, log in as username@target-site. */
	  logname = xmalloc (strlen (user) + 1 + strlen (u->host) + 1);
	  sprintf (logname, "%s@%s", user, u->host);
	}

      /* Login to the server: */

      /* First: Establish the control connection.  */
      csock = connect_to_host (host, port);
      if (csock == E_HOST || csock < 0)
	{
	  /* Work out the error code first (it depends on errno), then
	     release the proxy login name, which would otherwise leak
	     on this early return.  */
	  uerr_t conn_err = (csock == E_HOST
			     ? HOSTERR : CONNECT_ERROR (errno));
	  if (con->proxy)
	    xfree (logname);
	  return conn_err;
	}

      if (cmd & LEAVE_PENDING)
	rbuf_initialize (&con->rbuf, csock);
      else
	rbuf_uninitialize (&con->rbuf);

      /* Since this is a new connection, we may safely discard
	 anything left in the buffer.  */
      rbuf_discard (&con->rbuf);

      /* Second: Login with proper USER/PASS sequence.  */
      logprintf (LOG_VERBOSE, _("Logging in as %s ... "), user);
      if (opt.server_response)
	logputs (LOG_ALWAYS, "\n");
      err = ftp_login (&con->rbuf, logname, passwd);

      if (con->proxy)
	xfree (logname);

      /* FTPRERR, FTPSRVERR, WRITEFAILED, FTPLOGREFUSED, FTPLOGINC */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPSRVERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("Error in server greeting.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case WRITEFAILED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Write failed, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPLOGREFUSED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("The server refuses login.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return FTPLOGREFUSED;
	  break;
	case FTPLOGINC:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("Login incorrect.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return FTPLOGINC;
	  break;
	case FTPOK:
	  if (!opt.server_response)
	    logputs (LOG_VERBOSE, _("Logged in!\n"));
	  break;
	default:
	  abort ();
	  exit (1);
	  break;
	}

      /* Third: Get the system type */
      if (!opt.server_response)
	logprintf (LOG_VERBOSE, "==> SYST ... ");
      err = ftp_syst (&con->rbuf, &con->rs);
      /* FTPRERR */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPSRVERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Server error, can't determine system type.\n"));
	  break;
	case FTPOK:
	  /* Everything is OK.  */
	  break;
	default:
	  abort ();
	  break;
	}
      if (!opt.server_response && err != FTPSRVERR)
	logputs (LOG_VERBOSE, _("done.    "));

      /* Fourth: Find the initial ftp directory */
      if (!opt.server_response)
	logprintf (LOG_VERBOSE, "==> PWD ... ");
      err = ftp_pwd(&con->rbuf, &con->id);
      /* FTPRERR */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPSRVERR :
	  /* PWD unsupported -- assume "/". */
	  FREE_MAYBE (con->id);
	  con->id = xstrdup ("/");
	  break;
	case FTPOK:
	  /* Everything is OK.  */
	  break;
	default:
	  abort ();
	  break;
	}
      /* VMS will report something like "PUB$DEVICE:[INITIAL.FOLDER]".
	 Convert it to "/INITIAL/FOLDER" */
      if (con->rs == ST_VMS)
	{
	  char *path = strchr (con->id, '[');
	  char *pathend = path ? strchr (path + 1, ']') : NULL;
	  if (!path || !pathend)
	    DEBUGP (("Initial VMS directory not in the form [...]!\n"));
	  else
	    {
	      char *idir = con->id;
	      DEBUGP (("Preprocessing the initial VMS directory\n"));
	      DEBUGP (("  old = '%s'\n", con->id));
	      /* We do the conversion in-place by copying the stuff
		 between [ and ] to the beginning, and changing dots
		 to slashes at the same time.  */
	      *idir++ = '/';
	      for (++path; path < pathend; path++, idir++)
		*idir = *path == '.' ? '/' : *path;
	      *idir = '\0';
	      DEBUGP (("  new = '%s'\n\n", con->id));
	    }
	}
      if (!opt.server_response)
	logputs (LOG_VERBOSE, _("done.\n"));

      /* Fifth: Set the FTP type.  */
      type_char = ftp_process_type (u->params);
      if (!opt.server_response)
	logprintf (LOG_VERBOSE, "==> TYPE %c ... ", type_char);
      err = ftp_type (&con->rbuf, type_char);
      /* FTPRERR, WRITEFAILED, FTPUNKNOWNTYPE */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case WRITEFAILED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Write failed, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPUNKNOWNTYPE:
	  logputs (LOG_VERBOSE, "\n");
	  logprintf (LOG_NOTQUIET,
		     _("Unknown type `%c', closing control connection.\n"),
		     type_char);
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	case FTPOK:
	  /* Everything is OK.  */
	  break;
	default:
	  abort ();
	  break;
	}
      if (!opt.server_response)
	logputs (LOG_VERBOSE, _("done.  "));
    } /* do login */

  if (cmd & DO_CWD)
    {
      if (!*u->dir)
	logputs (LOG_VERBOSE, _("==> CWD not needed.\n"));
      else
	{
	  char *target = u->dir;

	  DEBUGP (("changing working directory\n"));

	  /* Change working directory.  To change to a non-absolute
	     Unix directory, we need to prepend initial directory
	     (con->id) to it.  Absolute directories "just work".

	     A relative directory is one that does not begin with '/'
	     and, on non-Unix OS'es, one that doesn't begin with
	     "[a-z]:".

	     This is not done for OS400, which doesn't use
	     "/"-delimited directories, nor does it support directory
	     hierarchies.  "CWD foo" followed by "CWD bar" leaves us
	     in "bar", not in "foo/bar", as would be customary
	     elsewhere.  */

	  if (target[0] != '/'
	      && !(con->rs != ST_UNIX
		   && ISALPHA (target[0])
		   && target[1] == ':')
	      && con->rs != ST_OS400)
	    {
	      int idlen = strlen (con->id);
	      char *ntarget, *p;

	      /* Strip trailing slash(es) from con->id. */
	      while (idlen > 0 && con->id[idlen - 1] == '/')
		--idlen;
	      p = ntarget = (char *)alloca (idlen + 1 + strlen (u->dir) + 1);
	      memcpy (p, con->id, idlen);
	      p += idlen;
	      *p++ = '/';
	      strcpy (p, target);

	      DEBUGP (("Prepended initial PWD to relative path:\n"));
	      DEBUGP (("   pwd: '%s'\n   old: '%s'\n  new: '%s'\n",
		       con->id, target, ntarget));
	      target = ntarget;
	    }

	  /* If the FTP host runs VMS, we will have to convert the absolute
	     directory path in UNIX notation to absolute directory path in
	     VMS notation as VMS FTP servers do not like UNIX notation of
	     absolute paths.  "VMS notation" is [dir.subdir.subsubdir]. */

	  if (con->rs == ST_VMS)
	    {
	      char *tmpp;
	      char *ntarget = (char *)alloca (strlen (target) + 2);
	      /* We use a converted initial dir, so directories in
		 TARGET will be separated with slashes, something like
		 "/INITIAL/FOLDER/DIR/SUBDIR".  Convert that to
		 "[INITIAL.FOLDER.DIR.SUBDIR]".  */
	      strcpy (ntarget, target);
	      assert (*ntarget == '/');
	      *ntarget = '[';
	      for (tmpp = ntarget + 1; *tmpp; tmpp++)
		if (*tmpp == '/')
		  *tmpp = '.';
	      *tmpp++ = ']';
	      *tmpp = '\0';
	      DEBUGP (("Changed file name to VMS syntax:\n"));
	      DEBUGP (("  Unix: '%s'\n  VMS: '%s'\n", target, ntarget));
	      target = ntarget;
	    }

	  if (!opt.server_response)
	    logprintf (LOG_VERBOSE, "==> CWD %s ... ", target);
	  err = ftp_cwd (&con->rbuf, target);
	  /* FTPRERR, WRITEFAILED, FTPNSFOD */
	  switch (err)
	    {
	    case FTPRERR:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	      CLOSE (csock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case WRITEFAILED:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET,
		       _("Write failed, closing control connection.\n"));
	      CLOSE (csock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case FTPNSFOD:
	      logputs (LOG_VERBOSE, "\n");
	      logprintf (LOG_NOTQUIET, _("No such directory `%s'.\n\n"),
			 u->dir);
	      CLOSE (csock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case FTPOK:
	      /* fine and dandy */
	      break;
	    default:
	      abort ();
	      break;
	    }
	  if (!opt.server_response)
	    logputs (LOG_VERBOSE, _("done.\n"));
	}
    }
  else /* do not CWD */
    logputs (LOG_VERBOSE, _("==> CWD not required.\n"));

  /* When restarting a download whose length is not yet known, ask the
     server for the size first.  */
  if ((cmd & DO_RETR) && restval && *len == 0)
    {
      if (opt.verbose)
	{
	  if (!opt.server_response)
	    logprintf (LOG_VERBOSE, "==> SIZE %s ... ", u->file);
	}

      err = ftp_size(&con->rbuf, u->file, len);
      /* FTPRERR */
      switch (err)
	{
	case FTPRERR:
	case FTPSRVERR :
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPOK:
	  /* Everything is OK.  */
	  break;
	default:
	  abort ();
	  break;
	}
      if (!opt.server_response)
	logputs (LOG_VERBOSE, _("done.\n"));
    }

  /* If anything is to be retrieved, PORT (or PASV) must be sent.  */
  if (cmd & (DO_LIST | DO_RETR))
    {
      if (opt.ftp_pasv > 0)
	{
	  ip_address passive_addr;
	  int passive_port;
	  err = ftp_do_pasv (&con->rbuf, &passive_addr, &passive_port);
	  /* FTPRERR, WRITEFAILED, FTPNOPASV, FTPINVPASV */
	  switch (err)
	    {
	    case FTPRERR:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	      CLOSE (csock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case WRITEFAILED:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET,
		       _("Write failed, closing control connection.\n"));
	      CLOSE (csock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case FTPNOPASV:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("Cannot initiate PASV transfer.\n"));
	      break;
	    case FTPINVPASV:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("Cannot parse PASV response.\n"));
	      break;
	    case FTPOK:
	      /* fine and dandy */
	      break;
	    default:
	      abort ();
	      break;
	    }	/* switch(err) */
	  if (err==FTPOK)
	    {
	      DEBUGP (("trying to connect to %s port %d\n",
		       pretty_print_address (&passive_addr),
		       passive_port));
	      dtsock = connect_to_ip (&passive_addr, passive_port, NULL);
	      if (dtsock < 0)
		{
		  int save_errno = errno;
		  CLOSE (csock);
		  rbuf_uninitialize (&con->rbuf);
		  logprintf (LOG_VERBOSE, _("couldn't connect to %s port %hu: %s\n"),
			     pretty_print_address (&passive_addr), passive_port,
			     strerror (save_errno));
		  return CONNECT_ERROR (save_errno);
		}

	      pasv_mode_open = 1;  /* Flag to avoid accept port */
	      if (!opt.server_response)
		logputs (LOG_VERBOSE, _("done.    "));
	    } /* err==FTP_OK */
	}

      if (!pasv_mode_open)   /* Try to use a port command if PASV failed */
	{
	  err = ftp_do_port (&con->rbuf, &local_sock);
	  /* FTPRERR, WRITEFAILED, bindport (CONSOCKERR, CONPORTERR, BINDERR,
	     LISTENERR), HOSTERR, FTPPORTERR */
	  switch (err)
	    {
	    case FTPRERR:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	      CLOSE (csock);
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case WRITEFAILED:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET,
		       _("Write failed, closing control connection.\n"));
	      CLOSE (csock);
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case CONSOCKERR:
	      logputs (LOG_VERBOSE, "\n");
	      logprintf (LOG_NOTQUIET, "socket: %s\n", strerror (errno));
	      CLOSE (csock);
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case CONPORTERR: case BINDERR: case LISTENERR:
	      /* What now?  These problems are local...  */
	      logputs (LOG_VERBOSE, "\n");
	      logprintf (LOG_NOTQUIET, _("Bind error (%s).\n"),
			 strerror (errno));
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      return err;
	      break;
	    case FTPPORTERR:
	      logputs (LOG_VERBOSE, "\n");
	      logputs (LOG_NOTQUIET, _("Invalid PORT.\n"));
	      CLOSE (csock);
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      rbuf_uninitialize (&con->rbuf);
	      return err;
	      break;
	    case FTPOK:
	      /* fine and dandy */
	      break;
	    default:
	      abort ();
	      break;
	    } /* port switch */
	  if (!opt.server_response)
	    logputs (LOG_VERBOSE, _("done.    "));
	} /* !pasv_mode_open */
    } /* cmd & (DO_LIST | DO_RETR) */

  /* Restart if needed.  */
  if (restval && (cmd & DO_RETR))
    {
      if (!opt.server_response)
	logprintf (LOG_VERBOSE, "==> REST %ld ... ", restval);
      err = ftp_rest (&con->rbuf, restval);

      /* FTPRERR, WRITEFAILED, FTPRESTFAIL */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case WRITEFAILED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Write failed, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPRESTFAIL:
	  /* If `-c' is specified and the file already existed when
	     Wget was started, it would be a bad idea for us to start
	     downloading it from scratch, effectively truncating it.  */
	  if (opt.always_rest && (cmd & NO_TRUNCATE))
	    {
	      logprintf (LOG_NOTQUIET,
			 _("\nREST failed; will not truncate `%s'.\n"),
			 con->target);
	      CLOSE (csock);
	      CLOSE (dtsock);
	      CLOSE (local_sock);
	      rbuf_uninitialize (&con->rbuf);
	      return CONTNOTSUPPORTED;
	    }
	  logputs (LOG_VERBOSE, _("\nREST failed, starting from scratch.\n"));
	  restval = 0L;
	  break;
	case FTPOK:
	  /* fine and dandy */
	  break;
	default:
	  abort ();
	  break;
	}
      if (err != FTPRESTFAIL && !opt.server_response)
	logputs (LOG_VERBOSE, _("done.    "));
    } /* restval && cmd & DO_RETR */

  if (cmd & DO_RETR)
    {
      /* If we're in spider mode, don't really retrieve anything.  The
	 fact that we got to this point should be proof enough that
	 the file exists, vaguely akin to HTTP's concept of a "HEAD"
	 request.  */
      if (opt.spider)
	{
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return RETRFINISHED;
	}

      if (opt.verbose)
	{
	  if (!opt.server_response)
	    {
	      if (restval)
		logputs (LOG_VERBOSE, "\n");
	      logprintf (LOG_VERBOSE, "==> RETR %s ... ", u->file);
	    }
	}

      err = ftp_retr (&con->rbuf, u->file);
      /* FTPRERR, WRITEFAILED, FTPNSFOD */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case WRITEFAILED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Write failed, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPNSFOD:
	  logputs (LOG_VERBOSE, "\n");
	  logprintf (LOG_NOTQUIET, _("No such file `%s'.\n\n"), u->file);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  return err;
	  break;
	case FTPOK:
	  /* fine and dandy */
	  break;
	default:
	  abort ();
	  break;
	}

      if (!opt.server_response)
	logputs (LOG_VERBOSE, _("done.\n"));
      expected_bytes = ftp_expected_bytes (ftp_last_respline);
    } /* do retrieve */

  if (cmd & DO_LIST)
    {
      if (!opt.server_response)
	logputs (LOG_VERBOSE, "==> LIST ... ");
      /* As Maciej W. Rozycki (macro@ds2.pg.gda.pl) says, `LIST'
	 without arguments is better than `LIST .'; confirmed by
	 RFC959.  */
      err = ftp_list (&con->rbuf, NULL);
      /* FTPRERR, WRITEFAILED */
      switch (err)
	{
	case FTPRERR:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET, _("\
Error in server response, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case WRITEFAILED:
	  logputs (LOG_VERBOSE, "\n");
	  logputs (LOG_NOTQUIET,
		   _("Write failed, closing control connection.\n"));
	  CLOSE (csock);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  rbuf_uninitialize (&con->rbuf);
	  return err;
	  break;
	case FTPNSFOD:
	  logputs (LOG_VERBOSE, "\n");
	  logprintf (LOG_NOTQUIET, _("No such file or directory `%s'.\n\n"),
		     ".");
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  return err;
	  break;
	case FTPOK:
	  /* fine and dandy */
	  break;
	default:
	  abort ();
	  break;
	}
      if (!opt.server_response)
	logputs (LOG_VERBOSE, _("done.\n"));
      expected_bytes = ftp_expected_bytes (ftp_last_respline);
    } /* cmd & DO_LIST */

  /* If no transmission was required, then everything is OK.  */
  if (!(cmd & (DO_LIST | DO_RETR)) || (opt.spider && !(cmd & DO_LIST)))
    return RETRFINISHED;

  /* Some FTP servers return the total length of file after REST
     command, others just return the remaining size. */
  if (*len && restval && expected_bytes
      && (expected_bytes == *len - restval))
    {
      DEBUGP (("Lying FTP server found, adjusting.\n"));
      expected_bytes = *len;
    }

  if (!pasv_mode_open)  /* we are not using passive mode so we need
			   to accept */
    {
      /* Open the data transmission socket by calling acceptport().  */
      err = acceptport (local_sock, &dtsock);
      /* Possible errors: ACCEPTERR.  */
      if (err == ACCEPTERR)
	{
	  /* Report first (CLOSE may disturb errno), then release the
	     listening socket, which nobody else holds a reference to
	     and which would otherwise leak on this return.  */
	  logprintf (LOG_NOTQUIET, "accept: %s\n", strerror (errno));
	  CLOSE (local_sock);
	  return err;
	}
    }

  /* Open the file -- if opt.dfp is set, use it instead.  */
  if (!opt.dfp || con->cmd & DO_LIST)
    {
      mkalldirs (con->target);
      if (opt.backups)
	rotate_backups (con->target);
      /* #### Is this correct? */
      chmod (con->target, 0600);

      fp = fopen (con->target, restval ? "ab" : "wb");
      if (!fp)
	{
	  logprintf (LOG_NOTQUIET, "%s: %s\n", con->target, strerror (errno));
	  CLOSE (csock);
	  rbuf_uninitialize (&con->rbuf);
	  CLOSE (dtsock);
	  CLOSE (local_sock);
	  return FOPENERR;
	}
    }
  else
    {
      extern int global_download_count;
      fp = opt.dfp;

      /* Rewind the output document if the download starts over and if
	 this is the first download.  See gethttp() for a longer
	 explanation.  */
      if (!restval && global_download_count == 0 && opt.dfp != stdout)
	{
	  /* This will silently fail for streams that don't correspond
	     to regular files, but that's OK.  */
	  rewind (fp);
	  /* ftruncate is needed because opt.dfp is opened in append
	     mode if opt.always_rest is set.  */
	  ftruncate (fileno (fp), 0);
	  clearerr (fp);
	}
    }

  if (*len)
    {
      logprintf (LOG_VERBOSE, _("Length: %s"), legible (*len));
      if (restval)
	logprintf (LOG_VERBOSE, _(" [%s to go]"), legible (*len - restval));
      logputs (LOG_VERBOSE, "\n");
      expected_bytes = *len;	/* for get_contents/show_progress */
    }
  else if (expected_bytes)
    {
      logprintf (LOG_VERBOSE, _("Length: %s"), legible (expected_bytes));
      if (restval)
	logprintf (LOG_VERBOSE, _(" [%s to go]"),
		   legible (expected_bytes - restval));
      logputs (LOG_VERBOSE, _(" (unauthoritative)\n"));
    }

  /* Get the contents of the document.  */
  res = get_contents (dtsock, fp, len, restval, expected_bytes, &con->rbuf,
		      0, &con->dltime);
  tms = time_str (NULL);
  tmrate = retr_rate (*len - restval, con->dltime, 0);
  /* Close data connection socket.  */
  CLOSE (dtsock);
  CLOSE (local_sock);
  /* Close the local file.  */
  {
    /* Close or flush the file.  We have to be careful to check for
       error here.  Checking the result of fwrite() is not enough --
       errors could go unnoticed!  */
    int flush_res;
    if (!opt.dfp || con->cmd & DO_LIST)
      flush_res = fclose (fp);
    else
      flush_res = fflush (fp);
    if (flush_res == EOF)
      res = -2;
  }

  /* If get_contents couldn't write to fp, bail out.  */
  if (res == -2)
    {
      logprintf (LOG_NOTQUIET, _("%s: %s, closing control connection.\n"),
		 con->target, strerror (errno));
      CLOSE (csock);
      rbuf_uninitialize (&con->rbuf);
      return FWRITEERR;
    }
  else if (res == -1)
    {
      logprintf (LOG_NOTQUIET, _("%s (%s) - Data connection: %s; "),
		 tms, tmrate, strerror (errno));
      if (opt.server_response)
	logputs (LOG_ALWAYS, "\n");
    }

  /* Get the server to tell us if everything is retrieved.  */
  err = ftp_response (&con->rbuf, &respline);
  /* ...and empty the buffer.  */
  rbuf_discard (&con->rbuf);
  if (err != FTPOK)
    {
      xfree (respline);
      /* The control connection is decidedly closed.  Print the time
	 only if it hasn't already been printed.  */
      if (res != -1)
	logprintf (LOG_NOTQUIET, "%s (%s) - ", tms, tmrate);
      logputs (LOG_NOTQUIET, _("Control connection closed.\n"));
      /* If there is an error on the control connection, close it, but
	 return FTPRETRINT, since there is a possibility that the
	 whole file was retrieved nevertheless (but that is for
	 ftp_loop_internal to decide).  */
      CLOSE (csock);
      rbuf_uninitialize (&con->rbuf);
      return FTPRETRINT;
    } /* err != FTPOK */
  /* If retrieval failed for any reason, return FTPRETRINT, but do not
     close socket, since the control connection is still alive.  If
     there is something wrong with the control connection, it will
     become apparent later.  */
  if (*respline != '2')
    {
      xfree (respline);
      if (res != -1)
	logprintf (LOG_NOTQUIET, "%s (%s) - ", tms, tmrate);
      logputs (LOG_NOTQUIET, _("Data transfer aborted.\n"));
      return FTPRETRINT;
    }
  xfree (respline);

  if (res == -1)
    {
      /* What now?  The data connection was erroneous, whereas the
	 response says everything is OK.  We shall play it safe.  */
      return FTPRETRINT;
    }

  if (!(cmd & LEAVE_PENDING))
    {
      /* I should probably send 'QUIT' and check for a reply, but this
	 is faster.  #### Is it OK, though?  */
      CLOSE (csock);
      rbuf_uninitialize (&con->rbuf);
    }
  /* If it was a listing, and opt.server_response is true,
     print it out.  */
  if (opt.server_response && (con->cmd & DO_LIST))
    {
      mkalldirs (con->target);
      fp = fopen (con->target, "r");
      if (!fp)
	logprintf (LOG_ALWAYS, "%s: %s\n", con->target, strerror (errno));
      else
	{
	  char *line;
	  /* The lines are being read with read_whole_line because of
	     no-buffering on opt.lfile.  */
	  while ((line = read_whole_line (fp)))
	    {
	      logprintf (LOG_ALWAYS, "%s\n", line);
	      xfree (line);
	    }
	  fclose (fp);
	}
    } /* con->cmd & DO_LIST && server_response */

  return RETRFINISHED;
}
/* A one-file FTP loop. This is the part where FTP retrieval is
retried, and retried, and retried, and...
This loop either gets commands from con, or (if ON_YOUR_OWN is
set), makes them up to retrieve the file given by the URL. */
static uerr_t
ftp_loop_internal (struct url *u, struct fileinfo *f, ccon *con)
1999-12-02 02:42:23 -05:00
{
int count, orig_lp;
1999-12-02 02:42:23 -05:00
long restval, len;
char *tms, *locf;
char *tmrate = NULL;
1999-12-02 02:42:23 -05:00
uerr_t err;
struct stat st;
if (!con->target)
con->target = url_file_name (u);
1999-12-02 02:42:23 -05:00
if (opt.noclobber && file_exists_p (con->target))
1999-12-02 02:42:23 -05:00
{
logprintf (LOG_VERBOSE,
_("File `%s' already there, not retrieving.\n"), con->target);
1999-12-02 02:42:23 -05:00
/* If the file is there, we suppose it's retrieved OK. */
return RETROK;
}
/* Remove it if it's a link. */
remove_link (con->target);
1999-12-02 02:42:23 -05:00
if (!opt.output_document)
locf = con->target;
1999-12-02 02:42:23 -05:00
else
locf = opt.output_document;
count = 0;
if (con->st & ON_YOUR_OWN)
con->st = ON_YOUR_OWN;
orig_lp = con->cmd & LEAVE_PENDING ? 1 : 0;
/* THE loop. */
do
{
/* Increment the pass counter. */
++count;
2000-12-05 19:24:40 -05:00
sleep_between_retrievals (count);
1999-12-02 02:42:23 -05:00
if (con->st & ON_YOUR_OWN)
{
con->cmd = 0;
con->cmd |= (DO_RETR | LEAVE_PENDING);
if (rbuf_initialized_p (&con->rbuf))
con->cmd &= ~ (DO_LOGIN | DO_CWD);
else
con->cmd |= (DO_LOGIN | DO_CWD);
}
else /* not on your own */
{
if (rbuf_initialized_p (&con->rbuf))
con->cmd &= ~DO_LOGIN;
else
con->cmd |= DO_LOGIN;
if (con->st & DONE_CWD)
con->cmd &= ~DO_CWD;
else
con->cmd |= DO_CWD;
}
1999-12-02 02:42:23 -05:00
/* Assume no restarting. */
restval = 0L;
if ((count > 1 || opt.always_rest)
&& !(con->cmd & DO_LIST)
&& file_exists_p (locf))
if (stat (locf, &st) == 0 && S_ISREG (st.st_mode))
1999-12-02 02:42:23 -05:00
restval = st.st_size;
/* In `-c' is used, check whether the file we're writing to
exists and is of non-zero length. If so, we'll refuse to
truncate it if the server doesn't support continued
downloads. */
if (opt.always_rest && restval > 0)
con->cmd |= NO_TRUNCATE;
1999-12-02 02:42:23 -05:00
/* Get the current time string. */
tms = time_str (NULL);
/* Print fetch message, if opt.verbose. */
if (opt.verbose)
{
char *hurl = url_string (u, 1);
1999-12-02 02:42:23 -05:00
char tmp[15];
strcpy (tmp, " ");
if (count > 1)
sprintf (tmp, _("(try:%2d)"), count);
logprintf (LOG_VERBOSE, "--%s-- %s\n %s => `%s'\n",
tms, hurl, tmp, locf);
#ifdef WINDOWS
ws_changetitle (hurl, 1);
#endif
xfree (hurl);
1999-12-02 02:42:23 -05:00
}
/* Send getftp the proper length, if fileinfo was provided. */
if (f)
len = f->size;
else
len = 0;
err = getftp (u, &len, restval, con);
if (!rbuf_initialized_p (&con->rbuf))
con->st &= ~DONE_CWD;
else
con->st |= DONE_CWD;
switch (err)
{
2003-10-29 18:13:25 -05:00
case HOSTERR: case CONIMPOSSIBLE: case FWRITEERR: case FOPENERR:
case FTPNSFOD: case FTPLOGINC: case FTPNOPASV: case CONTNOTSUPPORTED:
1999-12-02 02:42:23 -05:00
/* Fatal errors, give up. */
return err;
break;
case CONSOCKERR: case CONERROR: case FTPSRVERR: case FTPRERR:
case WRITEFAILED: case FTPUNKNOWNTYPE: case CONPORTERR:
case BINDERR: case LISTENERR: case ACCEPTERR:
case FTPPORTERR: case FTPLOGREFUSED: case FTPINVPASV:
printwhat (count, opt.ntry);
/* non-fatal errors */
continue;
break;
case FTPRETRINT:
/* If the control connection was closed, the retrieval
will be considered OK if f->size == len. */
if (!f || len != f->size)
{
printwhat (count, opt.ntry);
continue;
}
break;
case RETRFINISHED:
/* Great! */
break;
default:
/* Not as great. */
abort ();
}
/* Time? */
tms = time_str (NULL);
if (!opt.spider)
tmrate = retr_rate (len - restval, con->dltime, 0);
/* If we get out of the switch above without continue'ing, we've
successfully downloaded a file. Remember this fact. */
downloaded_file (FILE_DOWNLOADED_NORMALLY, locf);
1999-12-02 02:42:23 -05:00
if (con->st & ON_YOUR_OWN)
{
CLOSE (RBUF_FD (&con->rbuf));
rbuf_uninitialize (&con->rbuf);
}
if (!opt.spider)
logprintf (LOG_VERBOSE, _("%s (%s) - `%s' saved [%ld]\n\n"),
tms, tmrate, locf, len);
if (!opt.verbose && !opt.quiet)
{
/* Need to hide the password from the URL. The `if' is here
so that we don't do the needless allocation every
time. */
char *hurl = url_string (u, 1);
logprintf (LOG_NONVERBOSE, "%s URL: %s [%ld] -> \"%s\" [%d]\n",
tms, hurl, len, locf, count);
xfree (hurl);
}
if ((con->cmd & DO_LIST))
/* This is a directory listing file. */
{
if (!opt.remove_listing)
/* --dont-remove-listing was specified, so do count this towards the
number of bytes and files downloaded. */
{
total_downloaded_bytes += len;
opt.numurls++;
}
/* Deletion of listing files is not controlled by --delete-after, but
by the more specific option --dont-remove-listing, and the code
to do this deletion is in another function. */
}
else if (!opt.spider)
/* This is not a directory listing file. */
1999-12-02 02:42:23 -05:00
{
/* Unlike directory listing files, don't pretend normal files weren't
downloaded if they're going to be deleted. People seeding proxies,
for instance, may want to know how many bytes and files they've
downloaded through it. */
total_downloaded_bytes += len;
opt.numurls++;
if (opt.delete_after)
{
DEBUGP (("Removing file due to --delete-after in"
" ftp_loop_internal():\n"));
logprintf (LOG_VERBOSE, _("Removing %s.\n"), locf);
if (unlink (locf))
logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
}
1999-12-02 02:42:23 -05:00
}
2003-10-29 13:23:56 -05:00
1999-12-02 02:42:23 -05:00
/* Restore the original leave-pendingness. */
if (orig_lp)
con->cmd |= LEAVE_PENDING;
else
con->cmd &= ~LEAVE_PENDING;
return RETROK;
} while (!opt.ntry || (count < opt.ntry));
if (rbuf_initialized_p (&con->rbuf) && (con->st & ON_YOUR_OWN))
{
CLOSE (RBUF_FD (&con->rbuf));
rbuf_uninitialize (&con->rbuf);
}
return TRYLIMEXC;
}
/* Download and parse the listing of the directory specified in
   u->dir.

   The listing is fetched with ftp_loop_internal into a temporary
   file.  Its name is built by taking the local file name of the URL
   and replacing the last component with LIST_FILENAME.  While the
   download runs, CON->target points at that temporary name; the
   previous value is put back afterwards.

   On RETROK, *F receives whatever ftp_parse_ls makes of the file; on
   any other status *F is set to NULL.  When opt.remove_listing is
   set the temporary file is unlinked regardless of the status.
   DO_LIST is cleared from CON->cmd before returning.

   Returns the status reported by ftp_loop_internal.  */
uerr_t
ftp_get_listing (struct url *u, ccon *con, struct fileinfo **f)
{
  char *saved_target = con->target;
  char *url_fname;              /* local file name for the URL */
  char *listing_path;           /* temporary listing file */
  uerr_t status;

  /* Ask for a LIST (not a RETR) and keep the connection open.  */
  con->st &= ~ON_YOUR_OWN;
  con->cmd = (con->cmd | DO_LIST | LEAVE_PENDING) & ~DO_RETR;

  url_fname = url_file_name (u);
  listing_path = file_merge (url_fname, LIST_FILENAME);
  xfree (url_fname);
  DEBUGP ((_("Using `%s' as listing tmp file.\n"), listing_path));

  /* Redirect the download to the listing file for this one call.  */
  con->target = listing_path;
  status = ftp_loop_internal (u, NULL, con);
  con->target = saved_target;

  *f = (status == RETROK) ? ftp_parse_ls (listing_path, con->rs) : NULL;

  if (opt.remove_listing)
    {
      if (unlink (listing_path) == 0)
        logprintf (LOG_VERBOSE, _("Removed `%s'.\n"), listing_path);
      else
        logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
    }

  xfree (listing_path);
  con->cmd &= ~DO_LIST;
  return status;
}
/* Prototypes for static functions that are used before they are
   defined further down in this file.  */

/* Recursive retrieval.  */
static uerr_t ftp_retrieve_glob PARAMS ((struct url *, ccon *, int));
static uerr_t ftp_retrieve_dirs PARAMS ((struct url *, struct fileinfo *,
                                         ccon *));

/* Maintenance of the fileinfo linked list.  */
static void freefileinfo PARAMS ((struct fileinfo *f));
static struct fileinfo *delelement PARAMS ((struct fileinfo *,
                                            struct fileinfo **));
/* Retrieve a list of files given in struct fileinfo linked list. If
a file is a symbolic link, do not retrieve it, but rather try to
set up a similar link on the local disk, if the symlinks are
supported (unless opt.retr_symlinks is set, in which case symlinks
are downloaded like plain files).
If opt.recursive is set, after all files have been retrieved,
ftp_retrieve_dirs will be called to retrieve the directories.

U is the URL of the directory being processed; its file component is
temporarily replaced by each entry's name and restored afterwards.
F is the head of the list and must not be NULL (asserted).
CON is the connection state; CON->target is temporarily pointed at
the local name of each entry and restored afterwards.

Returns RECLEVELEXC if the recursion depth limit is exceeded on
entry, QUOTEXC if the download quota is found exceeded before an
entry is processed, and otherwise the status of the last
ftp_loop_internal call or, when recursing, of ftp_retrieve_dirs. */
static uerr_t
ftp_retrieve_list (struct url *u, struct fileinfo *f, ccon *con)
1999-12-02 02:42:23 -05:00
{
/* Nesting level of this function.  It is static, so the value is
shared by the nested calls reached through ftp_retrieve_dirs and
ftp_retrieve_glob; every return path below decrements it again. */
static int depth = 0;
uerr_t err;
struct fileinfo *orig;
long local_size;
time_t tml;
int dlthis;
/* Increase the depth. */
++depth;
if (opt.reclevel != INFINITE_RECURSION && depth > opt.reclevel)
1999-12-02 02:42:23 -05:00
{
DEBUGP ((_("Recursion depth %d exceeded max. depth %d.\n"),
depth, opt.reclevel));
--depth;
return RECLEVELEXC;
}
assert (f != NULL);
/* Remember the head of the list for the directory pass at the end. */
orig = f;
con->st &= ~ON_YOUR_OWN;
/* Request a CWD only if one has not been done yet. */
if (!(con->st & DONE_CWD))
con->cmd |= DO_CWD;
else
con->cmd &= ~DO_CWD;
con->cmd |= (DO_RETR | LEAVE_PENDING);
/* Request a login only if the control connection is not set up. */
if (!rbuf_initialized_p (&con->rbuf))
con->cmd |= DO_LOGIN;
else
con->cmd &= ~DO_LOGIN;
err = RETROK; /* in case it's not used */
while (f)
{
char *old_target, *ofile;
/* Stop as soon as the quota is exceeded.  Nothing has been
allocated for this entry yet, so there is nothing to release. */
if (opt.quota && total_downloaded_bytes > opt.quota)
1999-12-02 02:42:23 -05:00
{
--depth;
return QUOTEXC;
}
/* Point U and CON->target at the current entry.  Both are restored
at the bottom of the loop body. */
old_target = con->target;
ofile = xstrdup (u->file);
url_set_file (u, f->name);
con->target = url_file_name (u);
1999-12-02 02:42:23 -05:00
err = RETROK;
/* dlthis is cleared below when the entry turns out to be up to date. */
dlthis = 1;
if (opt.timestamping && f->type == FT_PLAINFILE)
{
1999-12-02 02:42:23 -05:00
struct stat st;
/* If conversion of HTML files retrieved via FTP is ever implemented,
we'll need to stat() <file>.orig here when -K has been specified.
I'm not implementing it now since files on an FTP server are much
more likely than files on an HTTP server to legitimately have a
.orig suffix. */
/* Only compare when a local copy exists (stat succeeded). */
if (!stat (con->target, &st))
1999-12-02 02:42:23 -05:00
{
int eq_size;
int cor_val;
1999-12-02 02:42:23 -05:00
/* Take the local size and modification time from the file. */
local_size = st.st_size;
tml = st.st_mtime;
#ifdef WINDOWS
/* Modification time granularity is 2 seconds for Windows, so
increase local time by 1 second for later comparison. */
tml++;
#endif
/* Compare file sizes only for servers that tell us correct
values. Assume sizes being equal for servers that lie
about file size. */
cor_val = (con->rs == ST_UNIX || con->rs == ST_WINNT);
eq_size = cor_val ? (local_size == f->size) : 1 ;
if (f->tstamp <= tml && eq_size)
1999-12-02 02:42:23 -05:00
{
/* Remote file is not newer, and the sizes are equal (or are
assumed equal): skip the download. */
logprintf (LOG_VERBOSE, _("\
Remote file no newer than local file `%s' -- not retrieving.\n"), con->target);
1999-12-02 02:42:23 -05:00
dlthis = 0;
}
else if (eq_size)
{
/* Remote file is newer; sizes match or cannot be compared. */
logprintf (LOG_VERBOSE, _("\
Remote file is newer than local file `%s' -- retrieving.\n\n"),
con->target);
}
else
{
/* Sizes do not match */
logprintf (LOG_VERBOSE, _("\
The sizes do not match (local %ld) -- retrieving.\n\n"), local_size);
}
}
1999-12-02 02:42:23 -05:00
} /* opt.timestamping && f->type == FT_PLAINFILE */
switch (f->type)
{
case FT_SYMLINK:
/* If opt.retr_symlinks is defined, we treat symlinks as
if they were normal files. There is currently no way
to distinguish whether they might be directories, and
follow them. */
if (!opt.retr_symlinks)
{
#ifdef HAVE_SYMLINK
if (!f->linkto)
logputs (LOG_NOTQUIET,
_("Invalid name of the symlink, skipping.\n"));
else
{
struct stat st;
/* Check whether we already have the correct
symbolic link. */
int rc = lstat (con->target, &st);
1999-12-02 02:42:23 -05:00
if (rc == 0)
{
/* Buffer size: one byte more than the expected target, so a
longer existing target yields n != len - 1 below. */
size_t len = strlen (f->linkto) + 1;
if (S_ISLNK (st.st_mode))
{
char *link_target = (char *)alloca (len);
/* NOTE(review): readlink's result is stored in a size_t.  Assuming
the POSIX failure value of -1, it converts to a value that cannot
equal len - 1, so a failed readlink falls through to re-creating
the link. */
size_t n = readlink (con->target, link_target, len);
1999-12-02 02:42:23 -05:00
if ((n == len - 1)
&& (memcmp (link_target, f->linkto, n) == 0))
{
logprintf (LOG_VERBOSE, _("\
Already have correct symlink %s -> %s\n\n"),
con->target, f->linkto);
1999-12-02 02:42:23 -05:00
dlthis = 0;
/* This break leaves the enclosing switch, not the while loop. */
break;
}
}
}
logprintf (LOG_VERBOSE, _("Creating symlink %s -> %s\n"),
con->target, f->linkto);
1999-12-02 02:42:23 -05:00
/* Unlink before creating symlink! */
unlink (con->target);
if (symlink (f->linkto, con->target) == -1)
1999-12-02 02:42:23 -05:00
logprintf (LOG_NOTQUIET, "symlink: %s\n",
strerror (errno));
logputs (LOG_VERBOSE, "\n");
} /* have f->linkto */
#else /* not HAVE_SYMLINK */
logprintf (LOG_NOTQUIET,
_("Symlinks not supported, skipping symlink `%s'.\n"),
con->target);
1999-12-02 02:42:23 -05:00
#endif /* not HAVE_SYMLINK */
}
else /* opt.retr_symlinks */
{
if (dlthis)
err = ftp_loop_internal (u, f, con);
} /* opt.retr_symlinks */
break;
case FT_DIRECTORY:
/* Directories are handled after the loop by ftp_retrieve_dirs;
here they are only reported when not recursing. */
if (!opt.recursive)
logprintf (LOG_NOTQUIET, _("Skipping directory `%s'.\n"),
f->name);
break;
case FT_PLAINFILE:
/* Call the retrieve loop. */
if (dlthis)
err = ftp_loop_internal (u, f, con);
break;
case FT_UNKNOWN:
logprintf (LOG_NOTQUIET, _("%s: unknown/unsupported file type.\n"),
f->name);
break;
} /* switch */
/* Set the time-stamp information to the local file. Symlinks
are not to be stamped because it sets the stamp on the
original. :( */
if (!(f->type == FT_SYMLINK && !opt.retr_symlinks)
1999-12-02 02:42:23 -05:00
&& f->tstamp != -1
&& dlthis
&& file_exists_p (con->target))
1999-12-02 02:42:23 -05:00
{
/* #### This code repeats in http.c and ftp.c. Move it to a
function! */
/* File to stamp: with opt.output_document set, that document, and
only if opt.od_known_regular is set; otherwise the local target. */
const char *fl = NULL;
if (opt.output_document)
{
if (opt.od_known_regular)
fl = opt.output_document;
}
else
fl = con->target;
if (fl)
touch (fl, f->tstamp);
1999-12-02 02:42:23 -05:00
}
else if (f->tstamp == -1)
logprintf (LOG_NOTQUIET, _("%s: corrupt time-stamp.\n"), con->target);
1999-12-02 02:42:23 -05:00
2000-06-01 07:20:05 -04:00
/* Apply the listed permissions to plain files that were downloaded.
NOTE(review): the else branch also runs for non-plain entries and
for skipped downloads, so the debug message does not necessarily
mean the permissions were unrecognized. */
if (f->perms && f->type == FT_PLAINFILE && dlthis)
chmod (con->target, f->perms);
1999-12-02 02:42:23 -05:00
else
DEBUGP (("Unrecognized permissions for %s.\n", con->target));
/* Undo the per-entry changes to CON->target and U. */
xfree (con->target);
con->target = old_target;
url_set_file (u, ofile);
xfree (ofile);
1999-12-02 02:42:23 -05:00
/* Break on fatals. */
if (err == QUOTEXC || err == HOSTERR || err == FWRITEERR)
break;
/* Do not request CWD or login again for the remaining entries. */
con->cmd &= ~ (DO_CWD | DO_LOGIN);
f = f->next;
}
1999-12-02 02:42:23 -05:00
/* Descend into the directories of the list only when recursing and
while the depth limit has not been reached. */
if (opt.recursive &&
!(opt.reclevel != INFINITE_RECURSION && depth >= opt.reclevel))
1999-12-02 02:42:23 -05:00
err = ftp_retrieve_dirs (u, orig, con);
else if (opt.recursive)
DEBUGP ((_("Will not retrieve dirs since depth is %d (max %d).\n"),
depth, opt.reclevel));
--depth;
return err;
}
/* Retrieve the directories given in a file list.  This function works
   by simply going through the linked list and calling
   ftp_retrieve_glob (with GETALL) on each directory entry.  The
   function knows about excluded directories: entries for which accdir
   rejects the composed path are skipped.

   U is the URL of the directory the list F belongs to.  U->dir is
   temporarily replaced by the path of each subdirectory and restored
   after the nested retrieval.  CON is the connection state; DONE_CWD
   is cleared before each descent.

   The status of the nested ftp_retrieve_glob calls is not propagated.
   Returns QUOTEXC if the download quota is exceeded when the walk
   ends, RETROK otherwise.  */
static uerr_t
ftp_retrieve_dirs (struct url *u, struct fileinfo *f, ccon *con)
{
  char *container = NULL;       /* stack buffer holding the new path */
  int container_size = 0;       /* current capacity of CONTAINER */

  for (; f; f = f->next)
    {
      int size;
      char *odir, *newdir;

      if (opt.quota && total_downloaded_bytes > opt.quota)
        break;
      if (f->type != FT_DIRECTORY)
        continue;

      /* Allocate the new path off the stack, but reallocate only if a
         larger string is needed.  The capacity has to be recorded
         here; otherwise the comparison is always true and every
         directory entry consumes a fresh chunk of stack.  */
      size = strlen (u->dir) + 1 + strlen (f->name) + 1;
      if (size > container_size)
        {
          container = (char *)alloca (size);
          container_size = size;
        }
      newdir = container;

      odir = u->dir;
      if (*odir == '\0'
          || (*odir == '/' && *(odir + 1) == '\0'))
        /* If ODIR is empty or just "/", simply append f->name to
           ODIR.  (In the former case, to preserve u->dir being
           relative; in the latter case, to avoid double slash.)  */
        sprintf (newdir, "%s%s", odir, f->name);
      else
        /* Else, use a separator. */
        sprintf (newdir, "%s/%s", odir, f->name);

      DEBUGP (("Composing new CWD relative to the initial directory.\n"));
      DEBUGP (("  odir = '%s'\n  f->name = '%s'\n  newdir = '%s'\n\n",
               odir, f->name, newdir));
      if (!accdir (newdir, ALLABS))
        {
          logprintf (LOG_VERBOSE, _("\
Not descending to `%s' as it is excluded/not-included.\n"), newdir);
          continue;
        }

      /* The working directory changes, so a new CWD is needed.  */
      con->st &= ~DONE_CWD;

      odir = xstrdup (u->dir);  /* because url_set_dir will free
                                   u->dir. */
      url_set_dir (u, newdir);
      ftp_retrieve_glob (u, con, GETALL);
      url_set_dir (u, odir);
      xfree (odir);

      /* Set the time-stamp?  */
    }

  if (opt.quota && total_downloaded_bytes > opt.quota)
    return QUOTEXC;
  else
    return RETROK;
}
/* Return non-zero if the file name S could escape the directory it is
   supposed to live in: it has a leading '/', it contains "../"
   anywhere, or its last component is ".." (the whole name is "..",
   or it ends in "/..").  The last case has no trailing slash, so the
   "../" search alone does not see it.

   S must be a valid NUL-terminated string; the empty string is
   considered safe.  */
static int
has_insecure_name_p (const char *s)
{
  size_t len;

  if (*s == '/')
    return 1;

  if (strstr (s, "../") != NULL)
    return 1;

  /* A trailing ".." component: exactly ".." or "<something>/..".  */
  len = strlen (s);
  if (len >= 2
      && s[len - 1] == '.' && s[len - 2] == '.'
      && (len == 2 || s[len - 3] == '/'))
    return 1;

  return 0;
}
1999-12-02 02:42:23 -05:00
/* A near-top-level function to retrieve the files in a directory.
   The function calls ftp_get_listing, to get a linked list of files.
   Then it weeds out the file names that do not match the pattern.
   ftp_retrieve_list is called with this updated list as an argument.

   If the argument ACTION is GETONE, just download the file (but first
   get the listing, so that the time-stamp is heeded); if it's GLOBALL,
   use globbing; if it's GETALL, download the whole directory.

   Returns:
     - the status of ftp_get_listing if the listing cannot be fetched;
     - RETRBADPATTERN if fnmatch reports an error;
     - the status of ftp_loop_internal if nothing is left in the list
       and ACTION is not GLOBALL (the file is then tried directly);
     - QUOTEXC if the download quota is exceeded afterwards;
     - RETROK otherwise.  The status of ftp_retrieve_list is not
       propagated.  */
static uerr_t
ftp_retrieve_glob (struct url *u, ccon *con, int action)
{
  struct fileinfo *f, *start;
  uerr_t res;

  con->cmd |= LEAVE_PENDING;

  res = ftp_get_listing (u, con, &start);
  if (res != RETROK)
    return res;

  /* First: weed out that do not conform the global rules given in
     opt.accepts and opt.rejects.  Directories are always kept.  */
  if (opt.accepts || opt.rejects)
    {
      f = start;
      while (f)
        {
          if (f->type != FT_DIRECTORY && !acceptable (f->name))
            {
              logprintf (LOG_VERBOSE, _("Rejecting `%s'.\n"), f->name);
              f = delelement (f, &start);
            }
          else
            f = f->next;
        }
    }

  /* Remove all files with possible harmful names */
  f = start;
  while (f)
    {
      if (has_insecure_name_p (f->name))
        {
          logprintf (LOG_VERBOSE, _("Rejecting `%s'.\n"), f->name);
          f = delelement (f, &start);
        }
      else
        f = f->next;
    }

  /* Now weed out the files that do not match our globbing pattern.
     If we are dealing with a globbing pattern, that is.  */
  if (*u->file && (action == GLOBALL || action == GETONE))
    {
      int matchres = 0;

      f = start;
      while (f)
        {
          matchres = fnmatch (u->file, f->name, 0);
          if (matchres == -1)
            {
              /* Report the pattern that failed.  con->target must not
                 be printed here: it is NULL when we are called from
                 ftp_loop, and it is not the pattern anyway.  */
              logprintf (LOG_NOTQUIET, "%s: %s\n", u->file,
                         strerror (errno));
              break;
            }
          if (matchres == FNM_NOMATCH)
            f = delelement (f, &start); /* delete the element from the list */
          else
            f = f->next;        /* leave the element in the list */
        }
      if (matchres == -1)
        {
          freefileinfo (start);
          return RETRBADPATTERN;
        }
    }

  if (start)
    {
      /* Just get everything.  */
      ftp_retrieve_list (u, start, con);
    }
  else if (action == GLOBALL)
    {
      /* No luck.  */
      /* #### This message SUCKS.  We should see what was the
         reason that nothing was retrieved.  */
      logprintf (LOG_VERBOSE, _("No matches on pattern `%s'.\n"), u->file);
    }
  else /* GETONE or GETALL */
    {
      /* Let's try retrieving it anyway.  START is NULL here, so
         there is no list to free before returning.  */
      con->st |= ON_YOUR_OWN;
      return ftp_loop_internal (u, NULL, con);
    }

  freefileinfo (start);
  if (opt.quota && total_downloaded_bytes > opt.quota)
    return QUOTEXC;
  else
    /* #### Should we return the status of ftp_retrieve_list here?  */
    return RETROK;
}
/* The wrapper that calls an appropriate routine according to contents
of URL. Inherently, its capabilities are limited on what can be
encoded into a URL. */
uerr_t
ftp_loop (struct url *u, int *dt, struct url *proxy)
1999-12-02 02:42:23 -05:00
{
ccon con; /* FTP connection */
uerr_t res;
*dt = 0;
memset (&con, 0, sizeof (con));
1999-12-02 02:42:23 -05:00
rbuf_uninitialize (&con.rbuf);
con.st = ON_YOUR_OWN;
con.rs = ST_UNIX;
con.id = NULL;
con.proxy = proxy;
1999-12-02 02:42:23 -05:00
res = RETROK; /* in case it's not used */
/* If the file name is empty, the user probably wants a directory
index. We'll provide one, properly HTML-ized. Unless
opt.htmlify is 0, of course. :-) */
if (!*u->file && !opt.recursive)
{
struct fileinfo *f;
res = ftp_get_listing (u, &con, &f);
1999-12-02 02:42:23 -05:00
if (res == RETROK)
1999-12-02 02:42:23 -05:00
{
if (opt.htmlify && !opt.spider)
1999-12-02 02:42:23 -05:00
{
char *filename = (opt.output_document
? xstrdup (opt.output_document)
: (con.target ? xstrdup (con.target)
: url_file_name (u)));
1999-12-02 02:42:23 -05:00
res = ftp_index (filename, u, f);
if (res == FTPOK && opt.verbose)
{
if (!opt.output_document)
{
struct stat st;
long sz;
if (stat (filename, &st) == 0)
sz = st.st_size;
else
sz = -1;
logprintf (LOG_NOTQUIET,
_("Wrote HTML-ized index to `%s' [%ld].\n"),
filename, sz);
}
else
logprintf (LOG_NOTQUIET,
_("Wrote HTML-ized index to `%s'.\n"),
filename);
}
xfree (filename);
1999-12-02 02:42:23 -05:00
}
freefileinfo (f);
}
}
else
{
int wild = has_wildcards_p (u->file);
if ((opt.ftp_glob && wild) || opt.recursive || opt.timestamping)
{
/* ftp_retrieve_glob is a catch-all function that gets called
if we need globbing, time-stamping or recursion. Its
third argument is just what we really need. */
res = ftp_retrieve_glob (u, &con,
(opt.ftp_glob && wild) ? GLOBALL : GETONE);
1999-12-02 02:42:23 -05:00
}
else
res = ftp_loop_internal (u, NULL, &con);
}
if (res == FTPOK)
res = RETROK;
if (res == RETROK)
*dt |= RETROKF;
/* If a connection was left, quench it. */
if (rbuf_initialized_p (&con.rbuf))
CLOSE (RBUF_FD (&con.rbuf));
FREE_MAYBE (con.id);
con.id = NULL;
FREE_MAYBE (con.target);
con.target = NULL;
1999-12-02 02:42:23 -05:00
return res;
}
/* Remove element F from the doubly-linked fileinfo list and release
   it, together with its name and (if present) its link target.

   START points to the caller's head-of-list pointer; it is updated
   when F was the first element.  Returns the element that followed
   F, or NULL if F was the last one.  */
static struct fileinfo *
delelement (struct fileinfo *f, struct fileinfo **start)
{
  struct fileinfo *before = f->prev;
  struct fileinfo *after = f->next;

  /* Splice the neighbours together around F.  */
  if (before)
    before->next = after;
  else
    *start = after;
  if (after)
    after->prev = before;

  /* F is detached now; release it.  */
  xfree (f->name);
  FREE_MAYBE (f->linkto);
  xfree (f);

  return after;
}
/* Release every element of the fileinfo list starting at F, along
   with each element's name and, when set, its link target.  A NULL
   F is accepted and does nothing.  */
static void
freefileinfo (struct fileinfo *f)
{
  struct fileinfo *following;

  for (; f != NULL; f = following)
    {
      /* Fetch the successor before the element goes away.  */
      following = f->next;

      xfree (f->name);
      if (f->linkto)
        xfree (f->linkto);
      xfree (f);
    }
}