X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Fmain.c;h=42389839181433fb1cacbaacf644509c972ae436;hp=ec8ed32576aeb125d766f6a149cd16f19ad86ede;hb=9dadbf6fe9577a6a6b7e7bab4e4b782fc1a6f86c;hpb=74fbb03b10f6148b5a0cf5b8831b1872e55df7f6 diff --git a/src/main.c b/src/main.c index ec8ed325..5c0b3315 100644 --- a/src/main.c +++ b/src/main.c @@ -1,11 +1,12 @@ /* Command line parsing. - Copyright (C) 2003, 2004, 2005 Free Software Foundation, Inc. + Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, + 2004, 2005, 2006, 2007, 2008, 2009 Free Software Foundation, Inc. This file is part of GNU Wget. GNU Wget is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by -the Free Software Foundation; either version 2 of the License, or +the Free Software Foundation; either version 3 of the License, or (at your option) any later version. GNU Wget is distributed in the hope that it will be useful, @@ -14,20 +15,20 @@ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License -along with Wget; if not, write to the Free Software -Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. +along with Wget. If not, see . -In addition, as a special exception, the Free Software Foundation -gives permission to link the code of its release of Wget with the -OpenSSL project's "OpenSSL" library (or with modified versions of it -that use the same license as the "OpenSSL" library), and distribute -the linked executables. You must obey the GNU General Public License -in all respects for all of the code used other than "OpenSSL". If you -modify this file, you may extend this exception to your version of the -file, but you are not obligated to do so. If you do not wish to do -so, delete this exception statement from your version. */ +Additional permission under GNU GPL version 3 section 7 -#include +If you modify this program, or any covered work, by linking or +combining it with the OpenSSL project's OpenSSL library (or a +modified version of that library), containing parts covered by the +terms of the OpenSSL or SSLeay licenses, the Free Software Foundation +grants you additional permission to convey the resulting work. +Corresponding Source for a non-source form of such a combination +shall include the source code for the parts of OpenSSL used as well +as that of the covered work. */ + +#include "wget.h" #include #include @@ -36,24 +37,31 @@ so, delete this exception statement from your version. */ #endif /* HAVE_UNISTD_H */ #include #include -#if defined(HAVE_NLS) && defined(HAVE_LOCALE_H) +#ifdef ENABLE_NLS # include #endif #include #include +#include -#include "wget.h" #include "utils.h" #include "init.h" #include "retr.h" #include "recur.h" #include "host.h" #include "url.h" -#include "progress.h" /* for progress_handle_sigwinch */ +#include "progress.h" /* for progress_handle_sigwinch */ #include "convert.h" +#include "spider.h" +#include "http.h" /* for save_cookies */ + +#include +#include +#include -/* On GNU system this will include system-wide getopt.h. */ -#include "getopt.h" +#ifdef __VMS +#include "vms.h" +#endif /* __VMS */ #ifndef PATH_SEPARATOR # define PATH_SEPARATOR '/' @@ -61,15 +69,27 @@ so, delete this exception statement from your version. */ struct options opt; -extern LARGE_INT total_downloaded_bytes; +/* defined in version.c */ extern char *version_string; +extern char *compilation_string; +extern char *system_getrc; +extern char *link_string; +/* defined in build_info.c */ +extern char *compiled_features[]; +/* Used for --version output in print_version */ +#define MAX_CHARS_PER_LINE 72 +#define TABULATION 4 -extern struct cookie_jar *wget_cookie_jar; - +#if defined(SIGHUP) || defined(SIGUSR1) static void redirect_output_signal (int); +#endif const char *exec_name; + +/* Number of successfully downloaded URLs */ +int numurls = 0; +#ifndef TESTING /* Initialize I18N/L10N. That amounts to invoking setlocale, and setting up gettext's message catalog using bindtextdomain and textdomain. Does nothing if NLS is disabled or missing. */ @@ -77,27 +97,14 @@ const char *exec_name; static void i18n_initialize (void) { - /* HAVE_NLS implies existence of functions invoked here. */ -#ifdef HAVE_NLS + /* ENABLE_NLS implies existence of functions invoked here. */ +#ifdef ENABLE_NLS /* Set the current locale. */ - /* Where possible, sets only LC_MESSAGES and LC_CTYPE. Other - categories, such as numeric, time, or collation, break code that - parses data received from the network and relies on C-locale - behavior of libc functions. For example, Solaris strptime fails - to recognize English month names in non-English locales, which - breaks http_atotm. Some implementations of fnmatch perform - unwanted case folding in non-C locales. ctype macros, while they - were used, provided another example against LC_ALL. */ -#if defined(LC_MESSAGES) && defined(LC_CTYPE) - setlocale (LC_MESSAGES, ""); - setlocale (LC_CTYPE, ""); /* safe because we use safe-ctype */ -#else setlocale (LC_ALL, ""); -#endif /* Set the text message domain. */ bindtextdomain ("wget", LOCALEDIR); textdomain ("wget"); -#endif /* HAVE_NLS */ +#endif /* ENABLE_NLS */ } /* Definition of command-line options. */ @@ -133,14 +140,17 @@ struct cmdline_option { OPT__NO, OPT__PARENT } type; - const void *data; /* for standard options */ - int argtype; /* for non-standard options */ + const void *data; /* for standard options */ + int argtype; /* for non-standard options */ }; -struct cmdline_option option_data[] = +static struct cmdline_option option_data[] = { { "accept", 'A', OPT_VALUE, "accept", -1 }, + { "adjust-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 }, { "append-output", 'a', OPT__APPEND_OUTPUT, NULL, required_argument }, + { "ask-password", 0, OPT_BOOLEAN, "askpassword", -1 }, + { "auth-no-challenge", 0, OPT_BOOLEAN, "authnochallenge", -1 }, { "background", 'b', OPT_BOOLEAN, "background", -1 }, { "backup-converted", 'K', OPT_BOOLEAN, "backupconverted", -1 }, { "backups", 0, OPT_BOOLEAN, "backups", -1 }, @@ -156,9 +166,11 @@ struct cmdline_option option_data[] = { "connect-timeout", 0, OPT_VALUE, "connecttimeout", -1 }, { "continue", 'c', OPT_BOOLEAN, "continue", -1 }, { "convert-links", 'k', OPT_BOOLEAN, "convertlinks", -1 }, + { "content-disposition", 0, OPT_BOOLEAN, "contentdisposition", -1 }, { "cookies", 0, OPT_BOOLEAN, "cookies", -1 }, { "cut-dirs", 0, OPT_VALUE, "cutdirs", -1 }, { WHEN_DEBUG ("debug"), 'd', OPT_BOOLEAN, "debug", -1 }, + { "default-page", 0, OPT_VALUE, "defaultpage", -1 }, { "delete-after", 0, OPT_BOOLEAN, "deleteafter", -1 }, { "directories", 0, OPT_BOOLEAN, "dirstruct", -1 }, { "directory-prefix", 'P', OPT_VALUE, "dirprefix", -1 }, @@ -166,7 +178,7 @@ struct cmdline_option option_data[] = { "dns-timeout", 0, OPT_VALUE, "dnstimeout", -1 }, { "domains", 'D', OPT_VALUE, "domains", -1 }, { "dont-remove-listing", 0, OPT__DONT_REMOVE_LISTING, NULL, no_argument }, - { "dot-style", 0, OPT_VALUE, "dotstyle", -1 }, + { "dot-style", 0, OPT_VALUE, "dotstyle", -1 }, /* deprecated */ { "egd-file", 0, OPT_VALUE, "egdfile", -1 }, { "exclude-directories", 'X', OPT_VALUE, "excludedirectories", -1 }, { "exclude-domains", 0, OPT_VALUE, "excludedomains", -1 }, @@ -176,17 +188,21 @@ struct cmdline_option option_data[] = { "force-directories", 'x', OPT_BOOLEAN, "dirstruct", -1 }, { "force-html", 'F', OPT_BOOLEAN, "forcehtml", -1 }, { "ftp-password", 0, OPT_VALUE, "ftppassword", -1 }, +#ifdef __VMS + { "ftp-stmlf", 0, OPT_BOOLEAN, "ftpstmlf", -1 }, +#endif /* def __VMS */ { "ftp-user", 0, OPT_VALUE, "ftpuser", -1 }, { "glob", 0, OPT_BOOLEAN, "glob", -1 }, { "header", 0, OPT_VALUE, "header", -1 }, { "help", 'h', OPT_FUNCALL, (void *)print_help, no_argument }, { "host-directories", 0, OPT_BOOLEAN, "addhostdir", -1 }, - { "html-extension", 'E', OPT_BOOLEAN, "htmlextension", -1 }, + { "html-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 }, { "htmlify", 0, OPT_BOOLEAN, "htmlify", -1 }, { "http-keep-alive", 0, OPT_BOOLEAN, "httpkeepalive", -1 }, { "http-passwd", 0, OPT_VALUE, "httppassword", -1 }, /* deprecated */ { "http-password", 0, OPT_VALUE, "httppassword", -1 }, { "http-user", 0, OPT_VALUE, "httpuser", -1 }, + { "ignore-case", 0, OPT_BOOLEAN, "ignorecase", -1 }, { "ignore-length", 0, OPT_BOOLEAN, "ignorelength", -1 }, { "ignore-tags", 0, OPT_VALUE, "ignoretags", -1 }, { "include-directories", 'I', OPT_VALUE, "includedirectories", -1 }, @@ -195,10 +211,13 @@ struct cmdline_option option_data[] = { "inet6-only", '6', OPT_BOOLEAN, "inet6only", -1 }, #endif { "input-file", 'i', OPT_VALUE, "input", -1 }, + { "iri", 0, OPT_BOOLEAN, "iri", -1 }, { "keep-session-cookies", 0, OPT_BOOLEAN, "keepsessioncookies", -1 }, { "level", 'l', OPT_VALUE, "reclevel", -1 }, { "limit-rate", 0, OPT_VALUE, "limitrate", -1 }, { "load-cookies", 0, OPT_VALUE, "loadcookies", -1 }, + { "local-encoding", 0, OPT_VALUE, "localencoding", -1 }, + { "max-redirect", 0, OPT_VALUE, "maxredirect", -1 }, { "mirror", 'm', OPT_BOOLEAN, "mirror", -1 }, { "no", 'n', OPT__NO, NULL, required_argument }, { "no-clobber", 0, OPT_BOOLEAN, "noclobber", -1 }, @@ -231,6 +250,7 @@ struct cmdline_option option_data[] = { "referer", 0, OPT_VALUE, "referer", -1 }, { "reject", 'R', OPT_VALUE, "reject", -1 }, { "relative", 'L', OPT_BOOLEAN, "relativeonly", -1 }, + { "remote-encoding", 0, OPT_VALUE, "remoteencoding", -1 }, { "remove-listing", 0, OPT_BOOLEAN, "removelisting", -1 }, { "restrict-file-names", 0, OPT_BOOLEAN, "restrictfilenames", -1 }, { "retr-symlinks", 0, OPT_BOOLEAN, "retrsymlinks", -1 }, @@ -252,6 +272,9 @@ struct cmdline_option option_data[] = { "version", 'V', OPT_FUNCALL, (void *) print_version, no_argument }, { "wait", 'w', OPT_VALUE, "wait", -1 }, { "waitretry", 0, OPT_VALUE, "waitretry", -1 }, +#ifdef MSDOS + { "wdebug", 0, OPT_BOOLEAN, "wdebug", -1 }, +#endif }; #undef WHEN_DEBUG @@ -295,58 +318,58 @@ static void init_switches (void) { char *p = short_options; - int i, o = 0; + size_t i, o = 0; for (i = 0; i < countof (option_data); i++) { struct cmdline_option *opt = &option_data[i]; struct option *longopt; if (!opt->long_name) - /* The option is disabled. */ - continue; + /* The option is disabled. */ + continue; longopt = &long_options[o++]; longopt->name = opt->long_name; longopt->val = i; if (opt->short_name) - { - *p++ = opt->short_name; - optmap[opt->short_name - 32] = longopt - long_options; - } + { + *p++ = opt->short_name; + optmap[opt->short_name - 32] = longopt - long_options; + } switch (opt->type) - { - case OPT_VALUE: - longopt->has_arg = required_argument; + { + case OPT_VALUE: + longopt->has_arg = required_argument; if (opt->short_name) - *p++ = ':'; - break; - case OPT_BOOLEAN: - /* Specify an optional argument for long options, so that - --option=off works the same as --no-option, for - compatibility with pre-1.10 Wget. However, don't specify - optional arguments short-option booleans because they - prevent combining of short options. */ - longopt->has_arg = optional_argument; - /* For Boolean options, add the "--no-FOO" variant, which is - identical to "--foo", except it has opposite meaning and - it doesn't allow an argument. */ - longopt = &long_options[o++]; - longopt->name = no_prefix (opt->long_name); - longopt->has_arg = no_argument; - /* Mask the value so we'll be able to recognize that we're - dealing with the false value. */ - longopt->val = i | BOOLEAN_NEG_MARKER; - break; - default: - assert (opt->argtype != -1); - longopt->has_arg = opt->argtype; - if (opt->short_name) - { - if (longopt->has_arg == required_argument) - *p++ = ':'; - /* Don't handle optional_argument */ - } - } + *p++ = ':'; + break; + case OPT_BOOLEAN: + /* Specify an optional argument for long options, so that + --option=off works the same as --no-option, for + compatibility with pre-1.10 Wget. However, don't specify + optional arguments short-option booleans because they + prevent combining of short options. */ + longopt->has_arg = optional_argument; + /* For Boolean options, add the "--no-FOO" variant, which is + identical to "--foo", except it has opposite meaning and + it doesn't allow an argument. */ + longopt = &long_options[o++]; + longopt->name = no_prefix (opt->long_name); + longopt->has_arg = no_argument; + /* Mask the value so we'll be able to recognize that we're + dealing with the false value. */ + longopt->val = i | BOOLEAN_NEG_MARKER; + break; + default: + assert (opt->argtype != -1); + longopt->has_arg = opt->argtype; + if (opt->short_name) + { + if (longopt->has_arg == required_argument) + *p++ = ':'; + /* Don't handle optional_argument */ + } + } } /* Terminate short_options. */ *p = '\0'; @@ -394,6 +417,10 @@ Logging and input file:\n"), #ifdef ENABLE_DEBUG N_("\ -d, --debug print lots of debugging information.\n"), +#endif +#ifdef MSDOS + N_("\ + --wdebug print Watt-32 debug output.\n"), #endif N_("\ -q, --quiet quiet (no output).\n"), @@ -402,11 +429,12 @@ Logging and input file:\n"), N_("\ -nv, --no-verbose turn off verboseness, without being quiet.\n"), N_("\ - -i, --input-file=FILE download URLs found in FILE.\n"), + -i, --input-file=FILE download URLs found in local or external FILE.\n"), N_("\ -F, --force-html treat input file as HTML.\n"), N_("\ - -B, --base=URL prepends URL to relative links in -F -i file.\n"), + -B, --base=URL resolves HTML input-file links (-i -F)\n\ + relative to URL.\n"), "\n", N_("\ @@ -445,8 +473,6 @@ Download:\n"), --waitretry=SECONDS wait 1..SECONDS between retries of a retrieval.\n"), N_("\ --random-wait wait from 0...2*WAIT secs between retrievals.\n"), - N_("\ - -Y, --proxy explicitly turn on proxy.\n"), N_("\ --no-proxy explicitly turn off proxy.\n"), N_("\ @@ -459,6 +485,8 @@ Download:\n"), --no-dns-cache disable caching DNS lookups.\n"), N_("\ --restrict-file-names=OS restrict chars in file names to ones OS allows.\n"), + N_("\ + --ignore-case ignore case when matching files/directories.\n"), #ifdef ENABLE_IPV6 N_("\ -4, --inet4-only connect only to IPv4 addresses.\n"), @@ -472,6 +500,14 @@ Download:\n"), --user=USER set both ftp and http user to USER.\n"), N_("\ --password=PASS set both ftp and http password to PASS.\n"), + N_("\ + --ask-password prompt for passwords.\n"), + N_("\ + --no-iri turn off IRI support.\n"), + N_("\ + --local-encoding=ENC use ENC as the local encoding for IRIs.\n"), + N_("\ + --remote-encoding=ENC use ENC as the default remote encoding.\n"), "\n", N_("\ @@ -498,12 +534,17 @@ HTTP options:\n"), --http-password=PASS set http password to PASS.\n"), N_("\ --no-cache disallow server-cached data.\n"), + N_ ("\ + --default-page=NAME Change the default page name (normally\n\ + this is `index.html'.).\n"), N_("\ - -E, --html-extension save HTML documents with `.html' extension.\n"), + -E, --adjust-extension save HTML/CSS documents with proper extensions.\n"), N_("\ --ignore-length ignore `Content-Length' header field.\n"), N_("\ --header=STRING insert STRING among the headers.\n"), + N_("\ + --max-redirect maximum redirections allowed per page.\n"), N_("\ --proxy-user=USER set USER as proxy username.\n"), N_("\ @@ -528,6 +569,13 @@ HTTP options:\n"), --post-data=STRING use the POST method; send STRING as the data.\n"), N_("\ --post-file=FILE use the POST method; send contents of FILE.\n"), + N_("\ + --content-disposition honor the Content-Disposition header when\n\ + choosing local file names (EXPERIMENTAL).\n"), + N_("\ + --auth-no-challenge send Basic HTTP authentication information\n\ + without first waiting for the server's\n\ + challenge.\n"), "\n", #ifdef HAVE_SSL @@ -559,6 +607,10 @@ HTTPS (SSL/TLS) options:\n"), N_("\ FTP options:\n"), +#ifdef __VMS + N_("\ + --ftp-stmlf Use Stream_LF format for all binary FTP files.\n"), +#endif /* def __VMS */ N_("\ --ftp-user=USER set ftp user to USER.\n"), N_("\ @@ -571,8 +623,6 @@ FTP options:\n"), --no-passive-ftp disable the \"passive\" transfer mode.\n"), N_("\ --retr-symlinks when recursing, get linked-to files (not dir).\n"), - N_("\ - --preserve-permissions preserve remote file permissions.\n"), "\n", N_("\ @@ -584,11 +634,17 @@ Recursive download:\n"), N_("\ --delete-after delete files locally after downloading them.\n"), N_("\ - -k, --convert-links make links in downloaded HTML point to local files.\n"), + -k, --convert-links make links in downloaded HTML or CSS point to\n\ + local files.\n"), +#ifdef __VMS + N_("\ + -K, --backup-converted before converting file X, back up as X_orig.\n"), +#else /* def __VMS */ N_("\ -K, --backup-converted before converting file X, back up as X.orig.\n"), +#endif /* def __VMS [else] */ N_("\ - -m, --mirror shortcut option equivalent to -r -N -l inf -nr.\n"), + -m, --mirror shortcut for -N -r -l inf --no-remove-listing.\n"), N_("\ -p, --page-requisites get all images, etc. needed to display HTML page.\n"), N_("\ @@ -626,10 +682,10 @@ Recursive accept/reject:\n"), N_("Mail bug reports and suggestions to .\n") }; - int i; + size_t i; printf (_("GNU Wget %s, a non-interactive network retriever.\n"), - version_string); + version_string); print_usage (); for (i = 0; i < countof (help); i++) @@ -638,30 +694,181 @@ Recursive accept/reject:\n"), exit (0); } +/* Return a human-readable printed representation of INTERVAL, + measured in seconds. */ + +static char * +secs_to_human_time (double interval) +{ + static char buf[32]; + int secs = (int) (interval + 0.5); + int hours, mins, days; + + days = secs / 86400, secs %= 86400; + hours = secs / 3600, secs %= 3600; + mins = secs / 60, secs %= 60; + + if (days) + sprintf (buf, "%dd %dh %dm %ds", days, hours, mins, secs); + else if (hours) + sprintf (buf, "%dh %dm %ds", hours, mins, secs); + else if (mins) + sprintf (buf, "%dm %ds", mins, secs); + else + sprintf (buf, "%ss", print_decimal (interval)); + + return buf; +} + +static char * +prompt_for_password (void) +{ + if (opt.user) + printf (_("Password for user %s: "), quote (opt.user)); + else + printf (_("Password: ")); + return getpass(""); +} + +/* Function that prints the line argument while limiting it + to at most line_length. prefix is printed on the first line + and an appropriate number of spaces are added on subsequent + lines.*/ +static void +format_and_print_line (const char *prefix, const char *line, + int line_length) +{ + int remaining_chars; + char *line_dup, *token; + + assert (prefix != NULL); + assert (line != NULL); + + line_dup = xstrdup (line); + + if (line_length <= 0) + line_length = MAX_CHARS_PER_LINE - TABULATION; + + printf ("%s", prefix); + remaining_chars = line_length; + /* We break on spaces. */ + token = strtok (line_dup, " "); + while (token != NULL) + { + /* If however a token is much larger than the maximum + line length, all bets are off and we simply print the + token on the next line. */ + if (remaining_chars <= strlen (token)) + { + printf ("\n%*c", TABULATION, ' '); + remaining_chars = line_length - TABULATION; + } + printf ("%s ", token); + remaining_chars -= strlen (token) + 1; /* account for " " */ + token = strtok (NULL, " "); + } + + printf ("\n"); + + xfree (line_dup); +} + static void print_version (void) { - printf ("GNU Wget %s\n\n", version_string); + const char *wgetrc_title = _("Wgetrc: "); + const char *locale_title = _("Locale: "); + const char *compile_title = _("Compile: "); + const char *link_title = _("Link: "); + char *line; + char *env_wgetrc, *user_wgetrc; + int i; + +#ifdef __VMS + printf (_("GNU Wget %s built on VMS %s %s.\n\n"), + version_string, vms_arch(), vms_vers()); +#else /* def __VMS */ + printf (_("GNU Wget %s built on %s.\n\n"), version_string, OS_TYPE); +#endif /* def __VMS */ + /* compiled_features is a char*[]. We limit the characters per + line to MAX_CHARS_PER_LINE and prefix each line with a constant + number of spaces for proper alignment. */ + for (i = 0; compiled_features[i] != NULL; ) + { + int line_length = MAX_CHARS_PER_LINE; + while ((line_length > 0) && (compiled_features[i] != NULL)) + { + printf ("%s ", compiled_features[i]); + line_length -= strlen (compiled_features[i]) + 2; + i++; + } + printf ("\n"); + } + printf ("\n"); + /* Handle the case when $WGETRC is unset and $HOME/.wgetrc is + absent. */ + printf ("%s\n", wgetrc_title); + env_wgetrc = wgetrc_env_file_name (); + if (env_wgetrc && *env_wgetrc) + { + printf (_(" %s (env)\n"), env_wgetrc); + xfree (env_wgetrc); + } + user_wgetrc = wgetrc_user_file_name (); + if (user_wgetrc) + { + printf (_(" %s (user)\n"), user_wgetrc); + xfree (user_wgetrc); + } +#ifdef SYSTEM_WGETRC + printf (_(" %s (system)\n"), SYSTEM_WGETRC); +#endif + + format_and_print_line (locale_title, + LOCALEDIR, + MAX_CHARS_PER_LINE); + + format_and_print_line (compile_title, + compilation_string, + MAX_CHARS_PER_LINE); + + format_and_print_line (link_title, + link_string, + MAX_CHARS_PER_LINE); + + printf ("\n"); + /* TRANSLATORS: When available, an actual copyright character + (cirle-c) should be used in preference to "(C)". */ fputs (_("\ -Copyright (C) 2005 Free Software Foundation, Inc.\n"), stdout); +Copyright (C) 2009 Free Software Foundation, Inc.\n"), stdout); fputs (_("\ -This program is distributed in the hope that it will be useful,\n\ -but WITHOUT ANY WARRANTY; without even the implied warranty of\n\ -MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\n\ -GNU General Public License for more details.\n"), stdout); +License GPLv3+: GNU GPL version 3 or later\n\ +.\n\ +This is free software: you are free to change and redistribute it.\n\ +There is NO WARRANTY, to the extent permitted by law.\n"), stdout); + /* TRANSLATORS: When available, please use the proper diacritics for + names such as this one. See en_US.po for reference. */ fputs (_("\nOriginally written by Hrvoje Niksic .\n"), - stdout); + stdout); + fputs (_("Currently maintained by Micah Cowan .\n"), + stdout); + fputs (_("Please send bug reports and questions to .\n"), + stdout); exit (0); } - + +char *program_name; /* Needed by lib/error.c. */ + int -main (int argc, char *const *argv) +main (int argc, char **argv) { char **url, **t; int i, ret, longindex; int nurl, status; bool append_to_log = false; + program_name = argv[0]; + i18n_initialize (); /* Construct the name of the executable, without the directory part. */ @@ -673,7 +880,7 @@ main (int argc, char *const *argv) #ifdef WINDOWS /* Drop extension (typically .EXE) from executable filename. */ - windows_main (&argc, (char **) argv, (char **) &exec_name); + windows_main ((char **) &exec_name); #endif /* Set option defaults; read the system wgetrc and ~/.wgetrc. */ @@ -682,130 +889,135 @@ main (int argc, char *const *argv) init_switches (); longindex = -1; while ((ret = getopt_long (argc, argv, - short_options, long_options, &longindex)) != -1) + short_options, long_options, &longindex)) != -1) { int val; struct cmdline_option *opt; /* If LONGINDEX is unchanged, it means RET is referring a short - option. */ + option. */ if (longindex == -1) - { - if (ret == '?') - { - print_usage (); - printf ("\n"); - printf (_("Try `%s --help' for more options.\n"), exec_name); - exit (2); - } - /* Find the short option character in the mapping. */ - longindex = optmap[ret - 32]; - } + { + if (ret == '?') + { + print_usage (); + printf ("\n"); + printf (_("Try `%s --help' for more options.\n"), exec_name); + exit (2); + } + /* Find the short option character in the mapping. */ + longindex = optmap[ret - 32]; + } val = long_options[longindex].val; /* Use the retrieved value to locate the option in the - option_data array, and to see if we're dealing with the - negated "--no-FOO" variant of the boolean option "--foo". */ + option_data array, and to see if we're dealing with the + negated "--no-FOO" variant of the boolean option "--foo". */ opt = &option_data[val & ~BOOLEAN_NEG_MARKER]; switch (opt->type) - { - case OPT_VALUE: - setoptval (opt->data, optarg, opt->long_name); - break; - case OPT_BOOLEAN: - if (optarg) - /* The user has specified a value -- use it. */ - setoptval (opt->data, optarg, opt->long_name); - else - { - /* NEG is true for `--no-FOO' style boolean options. */ - bool neg = !!(val & BOOLEAN_NEG_MARKER); - setoptval (opt->data, neg ? "0" : "1", opt->long_name); - } - break; - case OPT_FUNCALL: - { - void (*func) (void) = (void (*) (void)) opt->data; - func (); - } - break; - case OPT__APPEND_OUTPUT: - setoptval ("logfile", optarg, opt->long_name); - append_to_log = true; - break; - case OPT__EXECUTE: - run_command (optarg); - break; - case OPT__NO: - { - /* We support real --no-FOO flags now, but keep these - short options for convenience and backward - compatibility. */ - char *p; - for (p = optarg; *p; p++) - switch (*p) - { - case 'v': - setoptval ("verbose", "0", opt->long_name); - break; - case 'H': - setoptval ("addhostdir", "0", opt->long_name); - break; - case 'd': - setoptval ("dirstruct", "0", opt->long_name); - break; - case 'c': - setoptval ("noclobber", "1", opt->long_name); - break; - case 'p': - setoptval ("noparent", "1", opt->long_name); - break; - default: - printf (_("%s: illegal option -- `-n%c'\n"), exec_name, *p); - print_usage (); - printf ("\n"); - printf (_("Try `%s --help' for more options.\n"), exec_name); - exit (1); - } - break; - } - case OPT__PARENT: - case OPT__CLOBBER: - { - /* The wgetrc commands are named noparent and noclobber, - so we must revert the meaning of the cmdline options - before passing the value to setoptval. */ - bool flag = true; - if (optarg) - flag = (*optarg == '1' || TOLOWER (*optarg) == 'y' - || (TOLOWER (optarg[0]) == 'o' - && TOLOWER (optarg[1]) == 'n')); - setoptval (opt->type == OPT__PARENT ? "noparent" : "noclobber", - flag ? "0" : "1", opt->long_name); - break; - } - case OPT__DONT_REMOVE_LISTING: - setoptval ("removelisting", "0", opt->long_name); - break; - } + { + case OPT_VALUE: + setoptval (opt->data, optarg, opt->long_name); + break; + case OPT_BOOLEAN: + if (optarg) + /* The user has specified a value -- use it. */ + setoptval (opt->data, optarg, opt->long_name); + else + { + /* NEG is true for `--no-FOO' style boolean options. */ + bool neg = !!(val & BOOLEAN_NEG_MARKER); + setoptval (opt->data, neg ? "0" : "1", opt->long_name); + } + break; + case OPT_FUNCALL: + { + void (*func) (void) = (void (*) (void)) opt->data; + func (); + } + break; + case OPT__APPEND_OUTPUT: + setoptval ("logfile", optarg, opt->long_name); + append_to_log = true; + break; + case OPT__EXECUTE: + run_command (optarg); + break; + case OPT__NO: + { + /* We support real --no-FOO flags now, but keep these + short options for convenience and backward + compatibility. */ + char *p; + for (p = optarg; *p; p++) + switch (*p) + { + case 'v': + setoptval ("verbose", "0", opt->long_name); + break; + case 'H': + setoptval ("addhostdir", "0", opt->long_name); + break; + case 'd': + setoptval ("dirstruct", "0", opt->long_name); + break; + case 'c': + setoptval ("noclobber", "1", opt->long_name); + break; + case 'p': + setoptval ("noparent", "1", opt->long_name); + break; + default: + printf (_("%s: illegal option -- `-n%c'\n"), exec_name, *p); + print_usage (); + printf ("\n"); + printf (_("Try `%s --help' for more options.\n"), exec_name); + exit (1); + } + break; + } + case OPT__PARENT: + case OPT__CLOBBER: + { + /* The wgetrc commands are named noparent and noclobber, + so we must revert the meaning of the cmdline options + before passing the value to setoptval. */ + bool flag = true; + if (optarg) + flag = (*optarg == '1' || c_tolower (*optarg) == 'y' + || (c_tolower (optarg[0]) == 'o' + && c_tolower (optarg[1]) == 'n')); + setoptval (opt->type == OPT__PARENT ? "noparent" : "noclobber", + flag ? "0" : "1", opt->long_name); + break; + } + case OPT__DONT_REMOVE_LISTING: + setoptval ("removelisting", "0", opt->long_name); + break; + } longindex = -1; } + nurl = argc - optind; + /* All user options have now been processed, so it's now safe to do interoption dependency checks. */ if (opt.reclevel == 0) - opt.reclevel = INFINITE_RECURSION; /* see recur.h for commentary on this */ + opt.reclevel = INFINITE_RECURSION; /* see recur.h for commentary */ + + if (opt.spider || opt.delete_after) + opt.no_dirstruct = true; if (opt.page_requisites && !opt.recursive) { /* Don't set opt.recursive here because it would confuse the FTP - code. Instead, call retrieve_tree below when either - page_requisites or recursive is requested. */ + code. Instead, call retrieve_tree below when either + page_requisites or recursive is requested. */ opt.reclevel = 0; if (!opt.no_dirstruct) - opt.dirstruct = 1; /* normally handled by cmd_spec_recursive() */ + opt.dirstruct = 1; /* normally handled by cmd_spec_recursive() */ } if (opt.verbose == -1) @@ -833,8 +1045,46 @@ Can't timestamp and not clobber old files at the same time.\n")); exit (1); } #endif + if (opt.output_document) + { + if (opt.convert_links + && (nurl > 1 || opt.page_requisites || opt.recursive)) + { + fputs (_("\ +Cannot specify both -k and -O if multiple URLs are given, or in combination\n\ +with -p or -r. See the manual for details.\n\n"), stdout); + print_usage (); + exit (1); + } + if (opt.page_requisites + || opt.recursive) + { + logprintf (LOG_NOTQUIET, "%s", _("\ +WARNING: combining -O with -r or -p will mean that all downloaded content\n\ +will be placed in the single file you specified.\n\n")); + } + if (opt.timestamping) + { + logprintf (LOG_NOTQUIET, "%s", _("\ +WARNING: timestamping does nothing in combination with -O. See the manual\n\ +for details.\n\n")); + opt.timestamping = false; + } + if (opt.noclobber && file_exists_p(opt.output_document)) + { + /* Check if output file exists; if it does, exit. */ + logprintf (LOG_VERBOSE, _("File `%s' already there; not retrieving.\n"), opt.output_document); + exit(1); + } + } + + if (opt.ask_passwd && opt.passwd) + { + printf (_("Cannot specify both --ask-password and --password.\n")); + print_usage (); + exit (1); + } - nurl = argc - optind; if (!nurl && !opt.input_filename) { /* No URL specified. */ @@ -842,13 +1092,48 @@ Can't timestamp and not clobber old files at the same time.\n")); print_usage (); printf ("\n"); /* #### Something nicer should be printed here -- similar to the - pre-1.5 `--help' page. */ + pre-1.5 `--help' page. */ printf (_("Try `%s --help' for more options.\n"), exec_name); exit (1); } +#ifdef ENABLE_IRI + if (opt.enable_iri) + { + if (opt.locale && !check_encoding_name (opt.locale)) + opt.locale = NULL; + + if (!opt.locale) + opt.locale = find_locale (); + + if (opt.encoding_remote && !check_encoding_name (opt.encoding_remote)) + opt.encoding_remote = NULL; + } +#else + if (opt.enable_iri || opt.locale || opt.encoding_remote) + { + /* sXXXav : be more specific... */ + printf(_("This version does not have support for IRIs\n")); + exit(1); + } +#endif + + if (opt.ask_passwd) + { + opt.passwd = prompt_for_password (); + + if (opt.passwd == NULL || opt.passwd[0] == '\0') + exit (1); + } + +#ifdef MSDOS + if (opt.wdebug) + dbug_init(); + sock_init(); +#else if (opt.background) fork_to_background (); +#endif /* Initialize progress. Have to do this after the options are processed so we know where the log file is. */ @@ -861,41 +1146,85 @@ Can't timestamp and not clobber old files at the same time.\n")); { char *rewritten = rewrite_shorthand_url (argv[optind]); if (rewritten) - url[i] = rewritten; + url[i] = rewritten; else - url[i] = xstrdup (argv[optind]); + url[i] = xstrdup (argv[optind]); } url[i] = NULL; /* Initialize logging. */ log_init (opt.lfilename, append_to_log); - DEBUGP (("DEBUG output created by Wget %s on %s.\n\n", version_string, - OS_TYPE)); + DEBUGP (("DEBUG output created by Wget %s on %s.\n\n", + version_string, OS_TYPE)); /* Open the output filename if necessary. */ + +/* 2005-04-17 SMS. + Note that having the output_stream ("-O") file opened here for an FTP + URL rather than in getftp() (ftp.c) (and the http equivalent) rather + limits the ability in VMS to open the file differently for ASCII + versus binary FTP there. (Of course, doing it here allows a open + failure to be detected immediately, without first connecting to the + server.) +*/ if (opt.output_document) { - extern FILE *output_stream; - extern bool output_stream_regular; - if (HYPHENP (opt.output_document)) - output_stream = stdout; + { +#ifdef WINDOWS + FILE *result; + result = freopen ("CONOUT$", "wb", stdout); + if (result == NULL) + { + logputs (LOG_NOTQUIET, _("\ +WARNING: Can't reopen standard output in binary mode;\n\ + downloaded file may contain inappropriate line endings.\n")); + } +#endif + output_stream = stdout; + } else - { - struct_stat st; - output_stream = fopen (opt.output_document, - opt.always_rest ? "ab" : "wb"); - if (output_stream == NULL) - { - perror (opt.output_document); - exit (1); - } - if (fstat (fileno (output_stream), &st) == 0 && S_ISREG (st.st_mode)) - output_stream_regular = true; - } + { + struct_fstat st; + +#ifdef __VMS +/* Common fopen() optional arguments: + sequential access only, access callback function. +*/ +# define FOPEN_OPT_ARGS , "fop=sqo", "acc", acc_cb, &open_id + int open_id = 7; +#else /* def __VMS */ +# define FOPEN_OPT_ARGS +#endif /* def __VMS [else] */ + + output_stream = fopen (opt.output_document, + opt.always_rest ? "ab" : "wb" + FOPEN_OPT_ARGS); + if (output_stream == NULL) + { + perror (opt.output_document); + exit (1); + } + if (fstat (fileno (output_stream), &st) == 0 && S_ISREG (st.st_mode)) + output_stream_regular = true; + } } +#ifdef __VMS + /* Set global ODS5 flag according to the specified destination (if + any), otherwise according to the current default device. + */ + if (output_stream == NULL) + { + set_ods5_dest( "SYS$DISK"); + } + else if (output_stream != stdout) + { + set_ods5_dest( opt.output_document); + } +#endif /* def __VMS */ + #ifdef WINDOWS ws_startup (); #endif @@ -920,29 +1249,61 @@ Can't timestamp and not clobber old files at the same time.\n")); signal (SIGWINCH, progress_handle_sigwinch); #endif - status = RETROK; /* initialize it, just-in-case */ + status = RETROK; /* initialize it, just-in-case */ /* Retrieve the URLs from argument list. */ for (t = url; *t; t++) { char *filename = NULL, *redirected_URL = NULL; - int dt; - - if ((opt.recursive || opt.page_requisites) - && url_scheme (*t) != SCHEME_FTP) - status = retrieve_tree (*t); + int dt, url_err; + /* Need to do a new struct iri every time, because + * retrieve_url may modify it in some circumstances, + * currently. */ + struct iri *iri = iri_new (); + struct url *url_parsed; + + set_uri_encoding (iri, opt.locale, true); + url_parsed = url_parse (*t, &url_err, iri, true); + + if (!url_parsed) + { + char *error = url_error (*t, url_err); + logprintf (LOG_NOTQUIET, "%s: %s.\n",*t, error); + xfree (error); + status = URLERROR; + } else - status = retrieve_url (*t, &filename, &redirected_URL, NULL, &dt); - - if (opt.delete_after && file_exists_p(filename)) - { - DEBUGP (("Removing file due to --delete-after in main():\n")); - logprintf (LOG_VERBOSE, _("Removing %s.\n"), filename); - if (unlink (filename)) - logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno)); - } - - xfree_null (redirected_URL); - xfree_null (filename); + { + if ((opt.recursive || opt.page_requisites) + && (url_scheme (*t) != SCHEME_FTP || url_uses_proxy (url_parsed))) + { + int old_follow_ftp = opt.follow_ftp; + + /* Turn opt.follow_ftp on in case of recursive FTP retrieval */ + if (url_scheme (*t) == SCHEME_FTP) + opt.follow_ftp = 1; + + status = retrieve_tree (url_parsed, NULL); + + opt.follow_ftp = old_follow_ftp; + } + else + { + status = retrieve_url (url_parsed, *t, &filename, &redirected_URL, + NULL, &dt, opt.recursive, iri); + } + + if (opt.delete_after && file_exists_p(filename)) + { + DEBUGP (("Removing file due to --delete-after in main():\n")); + logprintf (LOG_VERBOSE, _("Removing %s.\n"), filename); + if (unlink (filename)) + logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno)); + } + xfree_null (redirected_URL); + xfree_null (filename); + url_free (url_parsed); + } + iri_free (iri); } /* And then from the input file, if any. */ @@ -951,23 +1312,35 @@ Can't timestamp and not clobber old files at the same time.\n")); int count; status = retrieve_from_file (opt.input_filename, opt.force_html, &count); if (!count) - logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"), - opt.input_filename); + logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"), + opt.input_filename); + } + + /* Print broken links. */ + if (opt.recursive && opt.spider) + { + print_broken_links(); } + /* Print the downloaded sum. */ - if (opt.recursive || opt.page_requisites - || nurl > 1 - || (opt.input_filename && total_downloaded_bytes != 0)) + if ((opt.recursive || opt.page_requisites + || nurl > 1 + || (opt.input_filename && total_downloaded_bytes != 0)) + && + total_downloaded_bytes != 0) { logprintf (LOG_NOTQUIET, - _("\nFINISHED --%s--\nDownloaded: %s bytes in %d files\n"), - time_str (NULL), with_thousand_seps_large (total_downloaded_bytes), - opt.numurls); + _("FINISHED --%s--\nDownloaded: %d files, %s in %s (%s)\n"), + datetime_str (time (NULL)), + numurls, + human_readable (total_downloaded_bytes), + secs_to_human_time (total_download_time), + retr_rate (total_downloaded_bytes, total_download_time)); /* Print quota warning, if exceeded. */ if (opt.quota && total_downloaded_bytes > opt.quota) - logprintf (LOG_NOTQUIET, - _("Download quota (%s bytes) EXCEEDED!\n"), - with_thousand_seps_large (opt.quota)); + logprintf (LOG_NOTQUIET, + _("Download quota of %s EXCEEDED!\n"), + human_readable (opt.quota)); } if (opt.cookies_output) @@ -981,16 +1354,23 @@ Can't timestamp and not clobber old files at the same time.\n")); xfree (url[i]); cleanup (); -#ifdef DEBUG_MALLOC - print_malloc_debug_stats (); -#endif if (status == RETROK) return 0; else return 1; } +#endif /* TESTING */ #if defined(SIGHUP) || defined(SIGUSR1) + +/* So the signal_name check doesn't blow when only one is available. */ +#ifndef SIGHUP +# define SIGHUP -1 +#endif +#ifndef SIGUSR1 +# define SIGUSR1 -1 +#endif + /* Hangup signal handler. When wget receives SIGHUP or SIGUSR1, it will proceed operation as usual, trying to write into a log file. If that is impossible, the output will be turned off. */ @@ -999,10 +1379,14 @@ static void redirect_output_signal (int sig) { const char *signal_name = (sig == SIGHUP ? "SIGHUP" : - (sig == SIGUSR1 ? "SIGUSR1" : - "WTF?!")); + (sig == SIGUSR1 ? "SIGUSR1" : + "WTF?!")); log_request_redirect_output (signal_name); progress_schedule_redirect (); signal (sig, redirect_output_signal); } #endif + +/* + * vim: et ts=2 sw=2 + */