wget/src/main.c

968 lines
29 KiB
C
Raw Normal View History

1999-12-02 02:42:23 -05:00
/* Command line parsing.
   Copyright (C) 1995, 1996, 1997, 1998, 2000, 2001, 2002
   Free Software Foundation, Inc.

This file is part of GNU Wget.

GNU Wget is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.

GNU Wget is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with Wget; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

In addition, as a special exception, the Free Software Foundation
gives permission to link the code of its release of Wget with the
OpenSSL project's "OpenSSL" library (or with modified versions of it
that use the same license as the "OpenSSL" library), and distribute
the linked executables.  You must obey the GNU General Public License
in all respects for all of the code used other than "OpenSSL".  If you
modify this file, you may extend this exception to your version of the
file, but you are not obligated to do so.  If you do not wish to do
so, delete this exception statement from your version.  */
1999-12-02 02:42:23 -05:00
#include <config.h>
#include <stdio.h>
#include <stdlib.h>
#ifdef HAVE_UNISTD_H
# include <unistd.h>
#endif /* HAVE_UNISTD_H */
#include <sys/types.h>
#ifdef HAVE_STRING_H
# include <string.h>
#else
# include <strings.h>
#endif /* HAVE_STRING_H */
#ifdef HAVE_SIGNAL_H
# include <signal.h>
#endif
#ifdef HAVE_NLS
#ifdef HAVE_LOCALE_H
# include <locale.h>
#endif /* HAVE_LOCALE_H */
#endif /* HAVE_NLS */
#include <errno.h>
1999-12-02 02:42:23 -05:00
#include "wget.h"
#include "utils.h"
#include "init.h"
#include "retr.h"
#include "recur.h"
#include "host.h"
2001-04-08 18:25:24 -04:00
#include "cookies.h"
#include "url.h"
#include "progress.h" /* for progress_handle_sigwinch */
1999-12-02 02:42:23 -05:00
#ifdef HAVE_SSL
# include "gen_sslfunc.h"
#endif
/* On GNU system this will include system-wide getopt.h. */
#include "getopt.h"
1999-12-02 02:42:23 -05:00
/* Character separating directory components in a path.  main() uses it
   to strip the directory part from argv[0].  The default applies only
   when no earlier header has already defined PATH_SEPARATOR.  */
#ifndef PATH_SEPARATOR
# define PATH_SEPARATOR '/'
#endif
/* Version string, defined outside this file; printed by print_help().  */
extern char *version_string;
/* Declare errno by hand only when <errno.h> did not supply it as a
   macro.  */
#ifndef errno
extern int errno;
#endif
/* The program-wide options structure (this is its definition).
   NOTE(review): presumably filled in by initialize() and setoptval()
   called from main() -- confirm in init.c.  */
struct options opt;
/* Cookie jar object defined in another translation unit.
   NOTE(review): its use is not visible in this part of the file.  */
extern struct cookie_jar *wget_cookie_jar;
1999-12-02 02:42:23 -05:00
/* Logging entry points implemented in log.c, declared here by hand
   rather than through a header.  PARAMS wraps the parameter list (it
   comes from the project headers).
   NOTE(review): the meaning of each argument is not visible from this
   file -- see log.c before relying on it.  */
void log_init PARAMS ((const char *, int));
void log_close PARAMS ((void));
void log_request_redirect_output PARAMS ((const char *));
1999-12-02 02:42:23 -05:00
/* Forward declaration of a file-local signal handler; it takes a
   single int (presumably the signal number -- TODO confirm against
   the definition, which is outside this part of the file).  */
static RETSIGTYPE redirect_output_signal PARAMS ((int));
/* Name of the running executable without its directory part.  Set at
   the start of main() from argv[0] and used in usage and error
   messages.  */
const char *exec_name;
/* Initialize I18N.  The initialization amounts to invoking
   setlocale(), bindtextdomain() and textdomain().

   Takes no arguments and returns nothing.  Does nothing if NLS is
   disabled or missing (i.e. when HAVE_NLS is not defined).  */
static void
i18n_initialize (void)
{
  /* If HAVE_NLS is defined, assume the existence of the three
     functions invoked here.  */
#ifdef HAVE_NLS
  /* Set the current locale.  */
  /* Here we use LC_MESSAGES instead of LC_ALL, for two reasons.
     First, message catalogs are all of I18N Wget uses anyway.
     Second, setting LC_ALL has a dangerous potential of messing
     things up.  For example, when in a foreign locale, Solaris
     strptime() fails to handle international dates correctly, which
     makes http_atotm() malfunction.  */
#ifdef LC_MESSAGES
  setlocale (LC_MESSAGES, "");
  /* LC_CTYPE is taken from the environment as well.  */
  setlocale (LC_CTYPE, "");
#else
  /* No LC_MESSAGES category on this platform: fall back to LC_ALL.  */
  setlocale (LC_ALL, "");
#endif
  /* Set the text message domain.  */
  bindtextdomain ("wget", LOCALEDIR);
  textdomain ("wget");
#endif /* HAVE_NLS */
}
/* Write the one-line usage synopsis to standard output.  The program
   is named by EXEC_NAME, and the format string is passed through _()
   so that it can be translated.  */
static void
print_usage (void)
{
  fprintf (stdout, _("Usage: %s [OPTION]... [URL]...\n"), exec_name);
}
/* Print the help message, describing all the available options.  If
   you add an option, be sure to update this list.

   Output goes to standard output: first a banner with VERSION_STRING,
   then the usage line from print_usage(), then one block of text per
   option group.  The HTTPS (SSL) group is printed only when HAVE_SSL
   is defined.  Every block is passed through _() for translation.  */
static void
print_help (void)
{
  printf (_("GNU Wget %s, a non-interactive network retriever.\n"),
          version_string);
  print_usage ();
  /* The text is split into several parts because some old compilers
     and preprocessors (Ultrix) cannot cope with one huge string
     literal.  It also makes translation much easier.  */
  fputs (_("\
\n\
Mandatory arguments to long options are mandatory for short options too.\n\
\n"), stdout);
  fputs (_("\
Startup:\n\
-V, --version display the version of Wget and exit.\n\
-h, --help print this help.\n\
-b, --background go to background after startup.\n\
-e, --execute=COMMAND execute a `.wgetrc\'-style command.\n\
\n"), stdout);
  fputs (_("\
Logging and input file:\n\
-o, --output-file=FILE log messages to FILE.\n\
-a, --append-output=FILE append messages to FILE.\n\
-d, --debug print debug output.\n\
-q, --quiet quiet (no output).\n\
-v, --verbose be verbose (this is the default).\n\
-nv, --non-verbose turn off verboseness, without being quiet.\n\
-i, --input-file=FILE download URLs found in FILE.\n\
-F, --force-html treat input file as HTML.\n\
-B, --base=URL prepends URL to relative links in -F -i file.\n\
\n"), stdout);
  fputs (_("\
Download:\n\
-t, --tries=NUMBER set number of retries to NUMBER (0 unlimits).\n\
--retry-connrefused retry even if connection is refused.\n\
-O --output-document=FILE write documents to FILE.\n\
-nc, --no-clobber don\'t clobber existing files or use .# suffixes.\n\
-c, --continue resume getting a partially-downloaded file.\n\
--progress=TYPE select progress gauge type.\n\
-N, --timestamping don\'t re-retrieve files unless newer than local.\n\
-S, --server-response print server response.\n\
--spider don\'t download anything.\n\
-T, --timeout=SECONDS set all timeout values to SECONDS.\n\
--dns-timeout=SECS set the DNS lookup timeout to SECS.\n\
--connect-timeout=SECS set the connect timeout to SECS.\n\
--read-timeout=SECS set the read timeout to SECS.\n\
-w, --wait=SECONDS wait SECONDS between retrievals.\n\
--waitretry=SECONDS wait 1...SECONDS between retries of a retrieval.\n\
--random-wait wait from 0...2*WAIT secs between retrievals.\n\
-Y, --proxy=on/off turn proxy on or off.\n\
-Q, --quota=NUMBER set retrieval quota to NUMBER.\n\
--bind-address=ADDRESS bind to ADDRESS (hostname or IP) on local host.\n\
--limit-rate=RATE limit download rate to RATE.\n\
--dns-cache=off disable caching DNS lookups.\n\
--restrict-file-names=OS restrict chars in file names to ones OS allows.\n\
\n"), stdout);
  fputs (_("\
Directories:\n\
-nd, --no-directories don\'t create directories.\n\
-x, --force-directories force creation of directories.\n\
-nH, --no-host-directories don\'t create host directories.\n\
-P, --directory-prefix=PREFIX save files to PREFIX/...\n\
--cut-dirs=NUMBER ignore NUMBER remote directory components.\n\
\n"), stdout);
  fputs (_("\
HTTP options:\n\
--http-user=USER set http user to USER.\n\
--http-passwd=PASS set http password to PASS.\n\
-C, --cache=on/off (dis)allow server-cached data (normally allowed).\n\
-E, --html-extension save all text/html documents with .html extension.\n\
--ignore-length ignore `Content-Length\' header field.\n\
--header=STRING insert STRING among the headers.\n\
--proxy-user=USER set USER as proxy username.\n\
--proxy-passwd=PASS set PASS as proxy password.\n\
--referer=URL include `Referer: URL\' header in HTTP request.\n\
-s, --save-headers save the HTTP headers to file.\n\
-U, --user-agent=AGENT identify as AGENT instead of Wget/VERSION.\n\
--no-http-keep-alive disable HTTP keep-alive (persistent connections).\n\
--cookies=off don't use cookies.\n\
--load-cookies=FILE load cookies from FILE before session.\n\
--save-cookies=FILE save cookies to FILE after session.\n\
--post-data=STRING use the POST method; send STRING as the data.\n\
--post-file=FILE use the POST method; send contents of FILE.\n\
\n"), stdout);
#ifdef HAVE_SSL
  /* Shown only in builds with SSL support.  */
  fputs (_("\
HTTPS (SSL) options:\n\
--sslcertfile=FILE optional client certificate.\n\
--sslcertkey=KEYFILE optional keyfile for this certificate.\n\
--egd-file=FILE file name of the EGD socket.\n\
--sslcadir=DIR dir where hash list of CA's are stored.\n\
--sslcafile=FILE file with bundle of CA's\n\
--sslcerttype=0/1 Client-Cert type 0=PEM (default) / 1=ASN1 (DER)\n\
--sslcheckcert=0/1 Check the server cert against given CA\n\
--sslprotocol=0-3 choose SSL protocol; 0=automatic,\n\
1=SSLv2 2=SSLv3 3=TLSv1\n\
\n"), stdout);
#endif
  fputs (_("\
FTP options:\n\
-nr, --dont-remove-listing don\'t remove `.listing\' files.\n\
-g, --glob=on/off turn file name globbing on or off.\n\
--passive-ftp use the \"passive\" transfer mode.\n\
--retr-symlinks when recursing, get linked-to files (not dirs).\n\
\n"), stdout);
  fputs (_("\
Recursive retrieval:\n\
-r, --recursive recursive download.\n\
-l, --level=NUMBER maximum recursion depth (inf or 0 for infinite).\n\
--delete-after delete files locally after downloading them.\n\
-k, --convert-links convert non-relative links to relative.\n\
-K, --backup-converted before converting file X, back up as X.orig.\n\
-m, --mirror shortcut option equivalent to -r -N -l inf -nr.\n\
-p, --page-requisites get all images, etc. needed to display HTML page.\n\
--strict-comments turn on strict (SGML) handling of HTML comments.\n\
\n"), stdout);
  fputs (_("\
Recursive accept/reject:\n\
-A, --accept=LIST comma-separated list of accepted extensions.\n\
-R, --reject=LIST comma-separated list of rejected extensions.\n\
-D, --domains=LIST comma-separated list of accepted domains.\n\
--exclude-domains=LIST comma-separated list of rejected domains.\n\
--follow-ftp follow FTP links from HTML documents.\n\
--follow-tags=LIST comma-separated list of followed HTML tags.\n\
-G, --ignore-tags=LIST comma-separated list of ignored HTML tags.\n\
-H, --span-hosts go to foreign hosts when recursive.\n\
-L, --relative follow relative links only.\n\
-I, --include-directories=LIST list of allowed directories.\n\
-X, --exclude-directories=LIST list of excluded directories.\n\
-np, --no-parent don\'t ascend to the parent directory.\n\
\n"), stdout);
  fputs (_("Mail bug reports and suggestions to <bug-wget@gnu.org>.\n"),
         stdout);
}
int
main (int argc, char *const *argv)
{
char **url, **t;
int i, c, nurl, status, append_to_log;
static struct option long_options[] =
{
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
/* Options without arguments: */
1999-12-02 02:42:23 -05:00
{ "background", no_argument, NULL, 'b' },
2001-04-08 18:25:24 -04:00
{ "backup-converted", no_argument, NULL, 'K' },
1999-12-02 02:42:23 -05:00
{ "continue", no_argument, NULL, 'c' },
{ "convert-links", no_argument, NULL, 'k' },
{ "debug", no_argument, NULL, 'd' },
{ "delete-after", no_argument, NULL, 136 },
{ "dont-remove-listing", no_argument, NULL, 149 },
{ "follow-ftp", no_argument, NULL, 142 },
1999-12-02 02:42:23 -05:00
{ "force-directories", no_argument, NULL, 'x' },
{ "force-hier", no_argument, NULL, 'x' }, /* obsolete */
{ "force-html", no_argument, NULL, 'F'},
{ "help", no_argument, NULL, 'h' },
{ "html-extension", no_argument, NULL, 'E' },
{ "ignore-length", no_argument, NULL, 138 },
1999-12-02 02:42:23 -05:00
{ "mirror", no_argument, NULL, 'm' },
{ "no-clobber", no_argument, NULL, 141 },
{ "no-directories", no_argument, NULL, 147 },
{ "no-host-directories", no_argument, NULL, 148 },
{ "no-host-lookup", no_argument, NULL, 150 },
{ "no-http-keep-alive", no_argument, NULL, 156 },
{ "no-parent", no_argument, NULL, 133 },
{ "non-verbose", no_argument, NULL, 146 },
{ "passive-ftp", no_argument, NULL, 139 },
{ "page-requisites", no_argument, NULL, 'p' },
1999-12-02 02:42:23 -05:00
{ "quiet", no_argument, NULL, 'q' },
{ "random-wait", no_argument, NULL, 165 },
1999-12-02 02:42:23 -05:00
{ "recursive", no_argument, NULL, 'r' },
{ "relative", no_argument, NULL, 'L' },
{ "retr-symlinks", no_argument, NULL, 137 },
{ "retry-connrefused", no_argument, NULL, 174 },
1999-12-02 02:42:23 -05:00
{ "save-headers", no_argument, NULL, 's' },
{ "server-response", no_argument, NULL, 'S' },
{ "span-hosts", no_argument, NULL, 'H' },
{ "spider", no_argument, NULL, 132 },
{ "strict-comments", no_argument, NULL, 177 },
1999-12-02 02:42:23 -05:00
{ "timestamping", no_argument, NULL, 'N' },
{ "verbose", no_argument, NULL, 'v' },
{ "version", no_argument, NULL, 'V' },
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
/* Options accepting an argument: */
1999-12-02 02:42:23 -05:00
{ "accept", required_argument, NULL, 'A' },
{ "append-output", required_argument, NULL, 'a' },
{ "backups", required_argument, NULL, 151 }, /* undocumented */
1999-12-02 02:42:23 -05:00
{ "base", required_argument, NULL, 'B' },
{ "bind-address", required_argument, NULL, 155 },
1999-12-02 02:42:23 -05:00
{ "cache", required_argument, NULL, 'C' },
{ "connect-timeout", required_argument, NULL, 180 },
{ "cookies", required_argument, NULL, 160 },
{ "cut-dirs", required_argument, NULL, 145 },
{ "dns-timeout", required_argument, NULL, 178 },
1999-12-02 02:42:23 -05:00
{ "directory-prefix", required_argument, NULL, 'P' },
2003-09-10 15:41:54 -04:00
{ "dns-cache", required_argument, NULL, 175 },
1999-12-02 02:42:23 -05:00
{ "domains", required_argument, NULL, 'D' },
{ "dot-style", required_argument, NULL, 134 },
1999-12-02 02:42:23 -05:00
{ "execute", required_argument, NULL, 'e' },
{ "exclude-directories", required_argument, NULL, 'X' },
{ "exclude-domains", required_argument, NULL, 140 },
{ "follow-tags", required_argument, NULL, 153 },
1999-12-02 02:42:23 -05:00
{ "glob", required_argument, NULL, 'g' },
{ "header", required_argument, NULL, 131 },
{ "htmlify", required_argument, NULL, 135 },
{ "http-passwd", required_argument, NULL, 130 },
{ "http-user", required_argument, NULL, 129 },
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
{ "ignore-tags", required_argument, NULL, 'G' },
1999-12-02 02:42:23 -05:00
{ "include-directories", required_argument, NULL, 'I' },
{ "input-file", required_argument, NULL, 'i' },
{ "level", required_argument, NULL, 'l' },
{ "limit-rate", required_argument, NULL, 164 },
{ "load-cookies", required_argument, NULL, 161 },
1999-12-02 02:42:23 -05:00
{ "no", required_argument, NULL, 'n' },
{ "output-document", required_argument, NULL, 'O' },
{ "output-file", required_argument, NULL, 'o' },
{ "post-data", required_argument, NULL, 167 },
{ "post-file", required_argument, NULL, 168 },
{ "progress", required_argument, NULL, 163 },
1999-12-02 02:42:23 -05:00
{ "proxy", required_argument, NULL, 'Y' },
{ "proxy-passwd", required_argument, NULL, 144 },
{ "proxy-user", required_argument, NULL, 143 },
1999-12-02 02:42:23 -05:00
{ "quota", required_argument, NULL, 'Q' },
{ "read-timeout", required_argument, NULL, 179 },
1999-12-02 02:42:23 -05:00
{ "reject", required_argument, NULL, 'R' },
{ "restrict-file-names", required_argument, NULL, 176 },
{ "save-cookies", required_argument, NULL, 162 },
1999-12-02 02:42:23 -05:00
{ "timeout", required_argument, NULL, 'T' },
{ "tries", required_argument, NULL, 't' },
{ "user-agent", required_argument, NULL, 'U' },
{ "referer", required_argument, NULL, 157 },
1999-12-02 02:42:23 -05:00
{ "use-proxy", required_argument, NULL, 'Y' },
#ifdef HAVE_SSL
{ "sslcertfile", required_argument, NULL, 158 },
{ "sslcertkey", required_argument, NULL, 159 },
{ "egd-file", required_argument, NULL, 166 },
{ "sslcadir", required_argument, NULL, 169},
{ "sslcafile", required_argument, NULL, 170},
{ "sslcerttype", required_argument, NULL, 171},
{ "sslcheckcert", required_argument, NULL, 172},
{ "sslprotocol", required_argument, NULL, 173},
#endif /* HAVE_SSL */
1999-12-02 02:42:23 -05:00
{ "wait", required_argument, NULL, 'w' },
{ "waitretry", required_argument, NULL, 152 },
1999-12-02 02:42:23 -05:00
{ 0, 0, 0, 0 }
};
i18n_initialize ();
append_to_log = 0;
/* Construct the name of the executable, without the directory part. */
exec_name = strrchr (argv[0], PATH_SEPARATOR);
if (!exec_name)
exec_name = argv[0];
else
++exec_name;
#ifdef WINDOWS
windows_main_junk (&argc, (char **) argv, (char **) &exec_name);
#endif
initialize (); /* sets option defaults; reads the system wgetrc and .wgetrc */
1999-12-02 02:42:23 -05:00
/* [Is the order of the option letters significant? If not, they should be
alphabetized, like the long_options. The only thing I know for sure is
that the options with required arguments must be followed by a ':'.
-- Dan Harkless <wget@harkless.org>] */
1999-12-02 02:42:23 -05:00
while ((c = getopt_long (argc, argv, "\
2001-04-01 17:26:28 -04:00
hpVqvdkKsxmNWrHSLcFbEY:G:g:T:U:O:l:n:i:o:a:t:D:A:R:P:B:e:Q:X:I:w:C:",
1999-12-02 02:42:23 -05:00
long_options, (int *)0)) != EOF)
{
switch (c)
{
/* Options without arguments: */
case 132:
setoptval ("spider", "on");
1999-12-02 02:42:23 -05:00
break;
case 133:
setoptval ("noparent", "on");
1999-12-02 02:42:23 -05:00
break;
case 136:
setoptval ("deleteafter", "on");
1999-12-02 02:42:23 -05:00
break;
case 137:
setoptval ("retrsymlinks", "on");
1999-12-02 02:42:23 -05:00
break;
case 138:
setoptval ("ignorelength", "on");
1999-12-02 02:42:23 -05:00
break;
case 139:
setoptval ("passiveftp", "on");
1999-12-02 02:42:23 -05:00
break;
case 141:
setoptval ("noclobber", "on");
1999-12-02 02:42:23 -05:00
break;
case 142:
setoptval ("followftp", "on");
1999-12-02 02:42:23 -05:00
break;
case 145:
setoptval ("cutdirs", optarg);
1999-12-02 02:42:23 -05:00
break;
case 146:
setoptval ("verbose", "off");
1999-12-02 02:42:23 -05:00
break;
case 147:
setoptval ("dirstruct", "off");
1999-12-02 02:42:23 -05:00
break;
case 148:
setoptval ("addhostdir", "off");
1999-12-02 02:42:23 -05:00
break;
case 149:
setoptval ("removelisting", "off");
1999-12-02 02:42:23 -05:00
break;
case 155:
setoptval ("bindaddress", optarg);
break;
case 156:
setoptval ("httpkeepalive", "off");
break;
case 165:
setoptval ("randomwait", "on");
break;
1999-12-02 02:42:23 -05:00
case 'b':
setoptval ("background", "on");
1999-12-02 02:42:23 -05:00
break;
case 'c':
setoptval ("continue", "on");
1999-12-02 02:42:23 -05:00
break;
case 'd':
#ifdef DEBUG
setoptval ("debug", "on");
1999-12-02 02:42:23 -05:00
#else /* not DEBUG */
fprintf (stderr, _("%s: debug support not compiled in.\n"),
exec_name);
#endif /* not DEBUG */
break;
case 'E':
setoptval ("htmlextension", "on");
1999-12-02 02:42:23 -05:00
break;
case 'F':
setoptval ("forcehtml", "on");
1999-12-02 02:42:23 -05:00
break;
case 'H':
setoptval ("spanhosts", "on");
1999-12-02 02:42:23 -05:00
break;
case 'h':
print_help ();
#ifdef WINDOWS
ws_help (exec_name);
#endif
exit (0);
break;
case 'K':
setoptval ("backupconverted", "on");
break;
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
case 'k':
setoptval ("convertlinks", "on");
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
break;
1999-12-02 02:42:23 -05:00
case 'L':
setoptval ("relativeonly", "on");
1999-12-02 02:42:23 -05:00
break;
case 'm':
setoptval ("mirror", "on");
1999-12-02 02:42:23 -05:00
break;
case 'N':
setoptval ("timestamping", "on");
1999-12-02 02:42:23 -05:00
break;
case 'p':
setoptval ("pagerequisites", "on");
break;
1999-12-02 02:42:23 -05:00
case 'S':
setoptval ("serverresponse", "on");
1999-12-02 02:42:23 -05:00
break;
case 's':
setoptval ("saveheaders", "on");
1999-12-02 02:42:23 -05:00
break;
case 'q':
setoptval ("quiet", "on");
1999-12-02 02:42:23 -05:00
break;
case 'r':
setoptval ("recursive", "on");
1999-12-02 02:42:23 -05:00
break;
case 'V':
printf ("GNU Wget %s\n\n", version_string);
printf ("%s", _("\
Copyright (C) 1995, 1996, 1997, 1998, 2000, 2001 Free Software Foundation, Inc.\n"));
printf ("%s", _("\
1999-12-02 02:42:23 -05:00
This program is distributed in the hope that it will be useful,\n\
but WITHOUT ANY WARRANTY; without even the implied warranty of\n\
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\n\
GNU General Public License for more details.\n"));
printf (_("\nOriginally written by Hrvoje Niksic <hniksic@arsdigita.com>.\n"));
1999-12-02 02:42:23 -05:00
exit (0);
break;
case 'v':
setoptval ("verbose", "on");
1999-12-02 02:42:23 -05:00
break;
case 'x':
setoptval ("dirstruct", "on");
1999-12-02 02:42:23 -05:00
break;
case 174:
setoptval ("retryconnrefused", "on");
break;
case 177:
setoptval ("strictcomments", "on");
break;
1999-12-02 02:42:23 -05:00
/* Options accepting an argument: */
case 129:
setoptval ("httpuser", optarg);
1999-12-02 02:42:23 -05:00
break;
case 130:
setoptval ("httppasswd", optarg);
1999-12-02 02:42:23 -05:00
break;
case 131:
setoptval ("header", optarg);
1999-12-02 02:42:23 -05:00
break;
case 134:
setoptval ("dotstyle", optarg);
1999-12-02 02:42:23 -05:00
break;
case 135:
setoptval ("htmlify", optarg);
1999-12-02 02:42:23 -05:00
break;
case 140:
setoptval ("excludedomains", optarg);
1999-12-02 02:42:23 -05:00
break;
case 143:
setoptval ("proxyuser", optarg);
1999-12-02 02:42:23 -05:00
break;
case 144:
setoptval ("proxypasswd", optarg);
1999-12-02 02:42:23 -05:00
break;
case 151:
setoptval ("backups", optarg);
1999-12-02 02:42:23 -05:00
break;
case 152:
setoptval ("waitretry", optarg);
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
break;
case 153:
setoptval ("followtags", optarg);
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
break;
2001-04-08 18:25:24 -04:00
case 160:
setoptval ("cookies", optarg);
2001-04-08 18:25:24 -04:00
break;
case 161:
setoptval ("loadcookies", optarg);
2001-04-08 18:25:24 -04:00
break;
case 162:
setoptval ("savecookies", optarg);
2001-04-08 18:25:24 -04:00
break;
case 163:
setoptval ("progress", optarg);
break;
case 164:
setoptval ("limitrate", optarg);
break;
case 157:
setoptval ("referer", optarg);
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
break;
#ifdef HAVE_SSL
case 158:
setoptval ("sslcertfile", optarg);
break;
case 159:
setoptval ("sslcertkey", optarg);
break;
case 166:
setoptval ("egdfile", optarg);
break;
case 169:
setoptval ("sslcadir", optarg);
break;
case 170:
setoptval ("sslcafile", optarg);
break;
case 171:
setoptval ("sslcerttype", optarg);
break;
case 172:
setoptval ("sslcheckcert", optarg);
break;
case 173:
setoptval ("sslprotocol", optarg);
break;
#endif /* HAVE_SSL */
case 167:
setoptval ("postdata", optarg);
break;
case 168:
setoptval ("postfile", optarg);
break;
2003-09-10 15:41:54 -04:00
case 175:
setoptval ("dnscache", optarg);
2003-09-10 15:41:54 -04:00
break;
case 176:
setoptval ("restrictfilenames", optarg);
break;
case 178:
setoptval ("dnstimeout", optarg);
break;
case 179:
setoptval ("readtimeout", optarg);
break;
case 180:
setoptval ("connecttimeout", optarg);
break;
1999-12-02 02:42:23 -05:00
case 'A':
setoptval ("accept", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'a':
setoptval ("logfile", optarg);
1999-12-02 02:42:23 -05:00
append_to_log = 1;
break;
case 'B':
setoptval ("base", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'C':
setoptval ("cache", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'D':
setoptval ("domains", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'e':
run_command (optarg);
1999-12-02 02:42:23 -05:00
break;
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
case 'G':
setoptval ("ignoretags", optarg);
[svn] * TODO: Removed done item: we now have an option (-G) that makes it easy to download a single HTML document and all its constituents. * po/*.{gmo,po,pot}: Regenerated after adding new options. * po/hr.po: Hrvoje forgot '\n's on his translations of my altered messages, causing msgfmt to balk and `make install' to fail. * wget.texi (Recursive Retrieval Options): In -K description, added a link to the discussion of interaction with -N. (Recursive Accept/Reject Options): Did some alphabetizing and added descriptions of new --follow-tags and -G / --ignore-tags options. (Following Links): Changed "the loads of" to "loads of". (Wgetrc Commands): Added descriptions of new follow_tags and ignore_tags commands. * html.c (idmatch): Implemented checking of my new --follow-tags and --ignore-tags options. * init.c (commands): Added comment reminding people adding new entries doing allocation to add corresponding freeing in cleanup(). (commands): Added new followtags and ignoretags commands. (cleanup): Free storage for new followtags and ignoretags. * main.c: Use of "comma-separated list" was random -- normalized it. Did some alphabetization. Added comments pointing out "Options without arguments" and "Options accepting an argument" sections of long_options[]. Added new options --follow-tags and -G / --ignore-tags. Added comment that Damir's --referer is currently undocumented. Added comment that Heiko's --waitretry is partially undocumented (mentioned in --help but not in wget.texi). Moved improperly sorted 24, 129, and 'G' cases. * options.h (struct options): Added new fields follow_tags and ignore_tags. * wget.h: Added "#define EQ 0" so we can say "strcmp(a, b) == EQ".
2000-03-11 01:48:06 -05:00
break;
1999-12-02 02:42:23 -05:00
case 'g':
setoptval ("glob", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'I':
setoptval ("includedirectories", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'i':
setoptval ("input", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'l':
setoptval ("reclevel", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'n':
{
/* #### What we really want here is --no-foo. */
1999-12-02 02:42:23 -05:00
char *p;
for (p = optarg; *p; p++)
switch (*p)
{
case 'v':
setoptval ("verbose", "off");
1999-12-02 02:42:23 -05:00
break;
case 'H':
setoptval ("addhostdir", "off");
1999-12-02 02:42:23 -05:00
break;
case 'd':
setoptval ("dirstruct", "off");
1999-12-02 02:42:23 -05:00
break;
case 'c':
setoptval ("noclobber", "on");
1999-12-02 02:42:23 -05:00
break;
case 'r':
setoptval ("removelisting", "off");
1999-12-02 02:42:23 -05:00
break;
case 'p':
setoptval ("noparent", "on");
1999-12-02 02:42:23 -05:00
break;
case 'k':
setoptval ("httpkeepalive", "off");
break;
1999-12-02 02:42:23 -05:00
default:
printf (_("%s: illegal option -- `-n%c'\n"), exec_name, *p);
print_usage ();
printf ("\n");
printf (_("Try `%s --help\' for more options.\n"), exec_name);
exit (1);
}
break;
}
case 'O':
setoptval ("outputdocument", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'o':
setoptval ("logfile", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'P':
setoptval ("dirprefix", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'Q':
setoptval ("quota", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'R':
setoptval ("reject", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'T':
setoptval ("timeout", optarg);
1999-12-02 02:42:23 -05:00
break;
case 't':
setoptval ("tries", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'U':
setoptval ("useragent", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'w':
setoptval ("wait", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'X':
setoptval ("excludedirectories", optarg);
1999-12-02 02:42:23 -05:00
break;
case 'Y':
setoptval ("useproxy", optarg);
1999-12-02 02:42:23 -05:00
break;
case '?':
print_usage ();
printf ("\n");
printf (_("Try `%s --help' for more options.\n"), exec_name);
exit (0);
break;
}
}
/* All user options have now been processed, so it's now safe to do
interoption dependency checks. */
if (opt.reclevel == 0)
opt.reclevel = INFINITE_RECURSION; /* see wget.h for commentary on this */
if (opt.page_requisites && !opt.recursive)
{
opt.recursive = TRUE;
opt.reclevel = 0;
if (!opt.no_dirstruct)
opt.dirstruct = TRUE; /* usually handled by cmd_spec_recursive() */
}
1999-12-02 02:42:23 -05:00
if (opt.verbose == -1)
opt.verbose = !opt.quiet;
/* Sanity checks. */
if (opt.verbose && opt.quiet)
{
printf (_("Can't be verbose and quiet at the same time.\n"));
print_usage ();
exit (1);
}
if (opt.timestamping && opt.noclobber)
{
printf (_("\
Can't timestamp and not clobber old files at the same time.\n"));
print_usage ();
exit (1);
}
nurl = argc - optind;
if (!nurl && !opt.input_filename)
{
/* No URL specified. */
printf (_("%s: missing URL\n"), exec_name);
print_usage ();
printf ("\n");
/* #### Something nicer should be printed here -- similar to the
pre-1.5 `--help' page. */
printf (_("Try `%s --help' for more options.\n"), exec_name);
exit (1);
}
if (opt.background)
fork_to_background ();
/* Initialize progress. Have to do this after the options are
processed so we know where the log file is. */
if (opt.verbose)
set_progress_implementation (opt.progress_type);
1999-12-02 02:42:23 -05:00
/* Allocate basic pointer. */
url = ALLOCA_ARRAY (char *, nurl + 1);
/* Fill in the arguments. */
for (i = 0; i < nurl; i++, optind++)
{
char *rewritten = rewrite_shorthand_url (argv[optind]);
if (rewritten)
url[i] = rewritten;
else
url[i] = xstrdup (argv[optind]);
1999-12-02 02:42:23 -05:00
}
url[i] = NULL;
/* Change the title of console window on Windows. #### I think this
statement should belong to retrieve_url(). --hniksic. */
#ifdef WINDOWS
ws_changetitle (*url, nurl);
#endif
/* Initialize logging. */
log_init (opt.lfilename, append_to_log);
DEBUGP (("DEBUG output created by Wget %s on %s.\n\n", version_string,
OS_TYPE));
2001-04-08 18:25:24 -04:00
1999-12-02 02:42:23 -05:00
/* Open the output filename if necessary. */
if (opt.output_document)
{
if (HYPHENP (opt.output_document))
opt.dfp = stdout;
else
{
struct stat st;
opt.dfp = fopen (opt.output_document, opt.always_rest ? "ab" : "wb");
1999-12-02 02:42:23 -05:00
if (opt.dfp == NULL)
{
perror (opt.output_document);
exit (1);
}
if (fstat (fileno (opt.dfp), &st) == 0 && S_ISREG (st.st_mode))
opt.od_known_regular = 1;
1999-12-02 02:42:23 -05:00
}
}
#ifdef WINDOWS
ws_startup ();
#endif
/* Setup the signal handler to redirect output when hangup is
received. */
#ifdef HAVE_SIGNAL
if (signal(SIGHUP, SIG_IGN) != SIG_IGN)
signal(SIGHUP, redirect_output_signal);
/* ...and do the same for SIGUSR1. */
signal (SIGUSR1, redirect_output_signal);
/* Writing to a closed socket normally signals SIGPIPE, and the
process exits. What we want is to ignore SIGPIPE and just check
for the return value of write(). */
signal (SIGPIPE, SIG_IGN);
#ifdef SIGWINCH
signal (SIGWINCH, progress_handle_sigwinch);
#endif
1999-12-02 02:42:23 -05:00
#endif /* HAVE_SIGNAL */
#ifdef HAVE_SSL
/* Must call this before resolving any URLs because it has the power
to disable `https'. */
ssl_init_prng ();
#endif
1999-12-02 02:42:23 -05:00
status = RETROK; /* initialize it, just-in-case */
/* Retrieve the URLs from argument list. */
for (t = url; *t; t++)
{
char *filename = NULL, *redirected_URL = NULL;
1999-12-02 02:42:23 -05:00
int dt;
if (opt.recursive && url_scheme (*t) != SCHEME_FTP)
status = retrieve_tree (*t);
else
status = retrieve_url (*t, &filename, &redirected_URL, NULL, &dt);
if (opt.delete_after && file_exists_p(filename))
{
DEBUGP (("Removing file due to --delete-after in main():\n"));
logprintf (LOG_VERBOSE, _("Removing %s.\n"), filename);
if (unlink (filename))
logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
}
FREE_MAYBE (redirected_URL);
1999-12-02 02:42:23 -05:00
FREE_MAYBE (filename);
}
/* And then from the input file, if any. */
if (opt.input_filename)
{
int count;
status = retrieve_from_file (opt.input_filename, opt.force_html, &count);
if (!count)
logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"),
opt.input_filename);
}
/* Print the downloaded sum. */
if (opt.recursive
|| nurl > 1
|| (opt.input_filename && opt.downloaded != 0))
{
logprintf (LOG_NOTQUIET,
_("\nFINISHED --%s--\nDownloaded: %s bytes in %d files\n"),
time_str (NULL),
(opt.downloaded_overflow ?
"<overflow>" : legible_very_long (opt.downloaded)),
opt.numurls);
1999-12-02 02:42:23 -05:00
/* Print quota warning, if exceeded. */
if (downloaded_exceeds_quota ())
1999-12-02 02:42:23 -05:00
logprintf (LOG_NOTQUIET,
_("Download quota (%s bytes) EXCEEDED!\n"),
legible (opt.quota));
}
2001-04-08 18:25:24 -04:00
if (opt.cookies_output && wget_cookie_jar)
cookie_jar_save (wget_cookie_jar, opt.cookies_output);
2001-04-08 18:25:24 -04:00
if (opt.convert_links && !opt.delete_after)
1999-12-02 02:42:23 -05:00
{
convert_all_links ();
}
1999-12-02 02:42:23 -05:00
log_close ();
for (i = 0; i < nurl; i++)
xfree (url[i]);
1999-12-02 02:42:23 -05:00
cleanup ();
#ifdef DEBUG_MALLOC
print_malloc_debug_stats ();
#endif
1999-12-02 02:42:23 -05:00
if (status == RETROK)
return 0;
else
return 1;
}
#ifdef HAVE_SIGNAL
1999-12-02 02:42:23 -05:00
/* Hangup signal handler. When wget receives SIGHUP or SIGUSR1, it
will proceed operation as usual, trying to write into a log file.
If that is impossible, the output will be turned off.
#### It is unsafe to do call libc functions from a signal handler.
What we should do is, set a global variable, and have the code in
log.c pick it up. */
1999-12-02 02:42:23 -05:00
static RETSIGTYPE
redirect_output_signal (int sig)
{
char *signal_name = (sig == SIGHUP ? "SIGHUP" :
(sig == SIGUSR1 ? "SIGUSR1" :
"WTF?!"));
log_request_redirect_output (signal_name);
progress_schedule_redirect ();
signal (sig, redirect_output_signal);
1999-12-02 02:42:23 -05:00
}
#endif /* HAVE_SIGNAL */