1 /* Command line parsing.
2 Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
3 2005, 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation,
6 This file is part of GNU Wget.
8 GNU Wget is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3 of the License, or
11 (at your option) any later version.
13 GNU Wget is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with Wget. If not, see <http://www.gnu.org/licenses/>.
21 Additional permission under GNU GPL version 3 section 7
23 If you modify this program, or any covered work, by linking or
24 combining it with the OpenSSL project's OpenSSL library (or a
25 modified version of that library), containing parts covered by the
26 terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
27 grants you additional permission to convey the resulting work.
28 Corresponding Source for a non-source form of such a combination
29 shall include the source code for the parts of OpenSSL used as well
30 as that of the covered work. */
53 #include "progress.h" /* for progress_handle_sigwinch */
56 #include "http.h" /* for save_cookies */
72 #ifndef PATH_SEPARATOR
73 # define PATH_SEPARATOR '/'
82 /* defined in version.c */
83 extern char *version_string;
84 extern char *compilation_string;
85 extern char *system_getrc;
86 extern char *link_string;
87 /* defined in build_info.c */
88 extern const char *compiled_features[];
89 /* Used for --version output in print_version */
90 #define MAX_CHARS_PER_LINE 72
93 #if defined(SIGHUP) || defined(SIGUSR1)
94 static void redirect_output_signal (int);
97 const char *exec_name;
99 /* Number of successfully downloaded URLs */
103 /* Initialize I18N/L10N. That amounts to invoking setlocale, and
104 setting up gettext's message catalog using bindtextdomain and
105 textdomain. Does nothing if NLS is disabled or missing. */
108 i18n_initialize (void)
110 /* ENABLE_NLS implies existence of functions invoked here. */
112 /* Set the current locale. */
113 setlocale (LC_ALL, "");
114 /* Set the text message domain. */
115 bindtextdomain ("wget", LOCALEDIR);
117 #endif /* ENABLE_NLS */
120 /* Definition of command-line options. */
122 static void print_help (void);
123 static void print_version (void);
128 # define IF_SSL(x) NULL
132 # define WHEN_DEBUG(x) x
134 # define WHEN_DEBUG(x) NULL
137 struct cmdline_option {
138 const char *long_name;
144 /* Non-standard options that have to be handled specially in
148 OPT__DONT_REMOVE_LISTING,
153 const void *data; /* for standard options */
154 int argtype; /* for non-standard options */
157 static struct cmdline_option option_data[] =
159 { "accept", 'A', OPT_VALUE, "accept", -1 },
160 { "adjust-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 },
161 { "append-output", 'a', OPT__APPEND_OUTPUT, NULL, required_argument },
162 { "ask-password", 0, OPT_BOOLEAN, "askpassword", -1 },
163 { "auth-no-challenge", 0, OPT_BOOLEAN, "authnochallenge", -1 },
164 { "background", 'b', OPT_BOOLEAN, "background", -1 },
165 { "backup-converted", 'K', OPT_BOOLEAN, "backupconverted", -1 },
166 { "backups", 0, OPT_BOOLEAN, "backups", -1 },
167 { "base", 'B', OPT_VALUE, "base", -1 },
168 { "bind-address", 0, OPT_VALUE, "bindaddress", -1 },
169 { IF_SSL ("ca-certificate"), 0, OPT_VALUE, "cacertificate", -1 },
170 { IF_SSL ("ca-directory"), 0, OPT_VALUE, "cadirectory", -1 },
171 { "cache", 0, OPT_BOOLEAN, "cache", -1 },
172 { IF_SSL ("certificate"), 0, OPT_VALUE, "certificate", -1 },
173 { IF_SSL ("certificate-type"), 0, OPT_VALUE, "certificatetype", -1 },
174 { IF_SSL ("check-certificate"), 0, OPT_BOOLEAN, "checkcertificate", -1 },
175 { "clobber", 0, OPT__CLOBBER, NULL, optional_argument },
176 { "config", 0, OPT_VALUE, "chooseconfig", -1 },
177 { "connect-timeout", 0, OPT_VALUE, "connecttimeout", -1 },
178 { "continue", 'c', OPT_BOOLEAN, "continue", -1 },
179 { "convert-links", 'k', OPT_BOOLEAN, "convertlinks", -1 },
180 { "content-disposition", 0, OPT_BOOLEAN, "contentdisposition", -1 },
181 { "cookies", 0, OPT_BOOLEAN, "cookies", -1 },
182 { "cut-dirs", 0, OPT_VALUE, "cutdirs", -1 },
183 { WHEN_DEBUG ("debug"), 'd', OPT_BOOLEAN, "debug", -1 },
184 { "default-page", 0, OPT_VALUE, "defaultpage", -1 },
185 { "delete-after", 0, OPT_BOOLEAN, "deleteafter", -1 },
186 { "directories", 0, OPT_BOOLEAN, "dirstruct", -1 },
187 { "directory-prefix", 'P', OPT_VALUE, "dirprefix", -1 },
188 { "dns-cache", 0, OPT_BOOLEAN, "dnscache", -1 },
189 { "dns-timeout", 0, OPT_VALUE, "dnstimeout", -1 },
190 { "domains", 'D', OPT_VALUE, "domains", -1 },
191 { "dont-remove-listing", 0, OPT__DONT_REMOVE_LISTING, NULL, no_argument },
192 { "dot-style", 0, OPT_VALUE, "dotstyle", -1 }, /* deprecated */
193 { "egd-file", 0, OPT_VALUE, "egdfile", -1 },
194 { "exclude-directories", 'X', OPT_VALUE, "excludedirectories", -1 },
195 { "exclude-domains", 0, OPT_VALUE, "excludedomains", -1 },
196 { "execute", 'e', OPT__EXECUTE, NULL, required_argument },
197 { "follow-ftp", 0, OPT_BOOLEAN, "followftp", -1 },
198 { "follow-tags", 0, OPT_VALUE, "followtags", -1 },
199 { "force-directories", 'x', OPT_BOOLEAN, "dirstruct", -1 },
200 { "force-html", 'F', OPT_BOOLEAN, "forcehtml", -1 },
201 { "ftp-password", 0, OPT_VALUE, "ftppassword", -1 },
203 { "ftp-stmlf", 0, OPT_BOOLEAN, "ftpstmlf", -1 },
204 #endif /* def __VMS */
205 { "ftp-user", 0, OPT_VALUE, "ftpuser", -1 },
206 { "glob", 0, OPT_BOOLEAN, "glob", -1 },
207 { "header", 0, OPT_VALUE, "header", -1 },
208 { "help", 'h', OPT_FUNCALL, (void *)print_help, no_argument },
209 { "host-directories", 0, OPT_BOOLEAN, "addhostdir", -1 },
210 { "html-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 }, /* deprecated */
211 { "htmlify", 0, OPT_BOOLEAN, "htmlify", -1 },
212 { "http-keep-alive", 0, OPT_BOOLEAN, "httpkeepalive", -1 },
213 { "http-passwd", 0, OPT_VALUE, "httppassword", -1 }, /* deprecated */
214 { "http-password", 0, OPT_VALUE, "httppassword", -1 },
215 { "http-user", 0, OPT_VALUE, "httpuser", -1 },
216 { "ignore-case", 0, OPT_BOOLEAN, "ignorecase", -1 },
217 { "ignore-length", 0, OPT_BOOLEAN, "ignorelength", -1 },
218 { "ignore-tags", 0, OPT_VALUE, "ignoretags", -1 },
219 { "include-directories", 'I', OPT_VALUE, "includedirectories", -1 },
221 { "inet4-only", '4', OPT_BOOLEAN, "inet4only", -1 },
222 { "inet6-only", '6', OPT_BOOLEAN, "inet6only", -1 },
224 { "input-file", 'i', OPT_VALUE, "input", -1 },
225 { "iri", 0, OPT_BOOLEAN, "iri", -1 },
226 { "keep-session-cookies", 0, OPT_BOOLEAN, "keepsessioncookies", -1 },
227 { "level", 'l', OPT_VALUE, "reclevel", -1 },
228 { "limit-rate", 0, OPT_VALUE, "limitrate", -1 },
229 { "load-cookies", 0, OPT_VALUE, "loadcookies", -1 },
230 { "local-encoding", 0, OPT_VALUE, "localencoding", -1 },
231 { "max-redirect", 0, OPT_VALUE, "maxredirect", -1 },
232 { "mirror", 'm', OPT_BOOLEAN, "mirror", -1 },
233 { "no", 'n', OPT__NO, NULL, required_argument },
234 { "no-clobber", 0, OPT_BOOLEAN, "noclobber", -1 },
235 { "no-parent", 0, OPT_BOOLEAN, "noparent", -1 },
236 { "output-document", 'O', OPT_VALUE, "outputdocument", -1 },
237 { "output-file", 'o', OPT_VALUE, "logfile", -1 },
238 { "page-requisites", 'p', OPT_BOOLEAN, "pagerequisites", -1 },
239 { "parent", 0, OPT__PARENT, NULL, optional_argument },
240 { "passive-ftp", 0, OPT_BOOLEAN, "passiveftp", -1 },
241 { "password", 0, OPT_VALUE, "password", -1 },
242 { "post-data", 0, OPT_VALUE, "postdata", -1 },
243 { "post-file", 0, OPT_VALUE, "postfile", -1 },
244 { "prefer-family", 0, OPT_VALUE, "preferfamily", -1 },
245 { "preserve-permissions", 0, OPT_BOOLEAN, "preservepermissions", -1 }, /* deprecated */
246 { IF_SSL ("private-key"), 0, OPT_VALUE, "privatekey", -1 },
247 { IF_SSL ("private-key-type"), 0, OPT_VALUE, "privatekeytype", -1 },
248 { "progress", 0, OPT_VALUE, "progress", -1 },
249 { "protocol-directories", 0, OPT_BOOLEAN, "protocoldirectories", -1 },
250 { "proxy", 0, OPT_BOOLEAN, "useproxy", -1 },
251 { "proxy__compat", 'Y', OPT_VALUE, "useproxy", -1 }, /* back-compatible */
252 { "proxy-passwd", 0, OPT_VALUE, "proxypassword", -1 }, /* deprecated */
253 { "proxy-password", 0, OPT_VALUE, "proxypassword", -1 },
254 { "proxy-user", 0, OPT_VALUE, "proxyuser", -1 },
255 { "quiet", 'q', OPT_BOOLEAN, "quiet", -1 },
256 { "quota", 'Q', OPT_VALUE, "quota", -1 },
257 { "random-file", 0, OPT_VALUE, "randomfile", -1 },
258 { "random-wait", 0, OPT_BOOLEAN, "randomwait", -1 },
259 { "read-timeout", 0, OPT_VALUE, "readtimeout", -1 },
260 { "recursive", 'r', OPT_BOOLEAN, "recursive", -1 },
261 { "referer", 0, OPT_VALUE, "referer", -1 },
262 { "reject", 'R', OPT_VALUE, "reject", -1 },
263 { "relative", 'L', OPT_BOOLEAN, "relativeonly", -1 },
264 { "remote-encoding", 0, OPT_VALUE, "remoteencoding", -1 },
265 { "remove-listing", 0, OPT_BOOLEAN, "removelisting", -1 },
266 { "restrict-file-names", 0, OPT_BOOLEAN, "restrictfilenames", -1 },
267 { "retr-symlinks", 0, OPT_BOOLEAN, "retrsymlinks", -1 },
268 { "retry-connrefused", 0, OPT_BOOLEAN, "retryconnrefused", -1 },
269 { "save-cookies", 0, OPT_VALUE, "savecookies", -1 },
270 { "save-headers", 0, OPT_BOOLEAN, "saveheaders", -1 },
271 { IF_SSL ("secure-protocol"), 0, OPT_VALUE, "secureprotocol", -1 },
272 { "server-response", 'S', OPT_BOOLEAN, "serverresponse", -1 },
273 { "span-hosts", 'H', OPT_BOOLEAN, "spanhosts", -1 },
274 { "spider", 0, OPT_BOOLEAN, "spider", -1 },
275 { "strict-comments", 0, OPT_BOOLEAN, "strictcomments", -1 },
276 { "timeout", 'T', OPT_VALUE, "timeout", -1 },
277 { "timestamping", 'N', OPT_BOOLEAN, "timestamping", -1 },
278 { "tries", 't', OPT_VALUE, "tries", -1 },
279 { "unlink", 0, OPT_BOOLEAN, "unlink", -1 },
280 { "trust-server-names", 0, OPT_BOOLEAN, "trustservernames", -1 },
281 { "use-server-timestamps", 0, OPT_BOOLEAN, "useservertimestamps", -1 },
282 { "user", 0, OPT_VALUE, "user", -1 },
283 { "user-agent", 'U', OPT_VALUE, "useragent", -1 },
284 { "verbose", 'v', OPT_BOOLEAN, "verbose", -1 },
285 { "verbose", 0, OPT_BOOLEAN, "verbose", -1 },
286 { "version", 'V', OPT_FUNCALL, (void *) print_version, no_argument },
287 { "wait", 'w', OPT_VALUE, "wait", -1 },
288 { "waitretry", 0, OPT_VALUE, "waitretry", -1 },
290 { "wdebug", 0, OPT_BOOLEAN, "wdebug", -1 },
297 /* Return a string that contains S with "no-" prepended. The string
298 is NUL-terminated and allocated off static storage at Wget
302 no_prefix (const char *s)
304 static char buffer[1024];
305 static char *p = buffer;
308 int size = 3 + strlen (s) + 1; /* "no-STRING\0" */
309 if (p + size >= buffer + sizeof (buffer))
312 cp[0] = 'n', cp[1] = 'o', cp[2] = '-';
318 /* The arguments that that main passes to getopt_long. */
319 static struct option long_options[2 * countof (option_data) + 1];
320 static char short_options[128];
322 /* Mapping between short option chars and option_data indices. */
323 static unsigned char optmap[96];
325 /* Marker for `--no-FOO' values in long_options. */
326 #define BOOLEAN_NEG_MARKER 1024
328 /* Initialize the long_options array used by getopt_long from the data
334 char *p = short_options;
336 for (i = 0; i < countof (option_data); i++)
338 struct cmdline_option *opt = &option_data[i];
339 struct option *longopt;
342 /* The option is disabled. */
345 longopt = &long_options[o++];
346 longopt->name = opt->long_name;
350 *p++ = opt->short_name;
351 optmap[opt->short_name - 32] = longopt - long_options;
356 longopt->has_arg = required_argument;
361 /* Specify an optional argument for long options, so that
362 --option=off works the same as --no-option, for
363 compatibility with pre-1.10 Wget. However, don't specify
364 optional arguments short-option booleans because they
365 prevent combining of short options. */
366 longopt->has_arg = optional_argument;
367 /* For Boolean options, add the "--no-FOO" variant, which is
368 identical to "--foo", except it has opposite meaning and
369 it doesn't allow an argument. */
370 longopt = &long_options[o++];
371 longopt->name = no_prefix (opt->long_name);
372 longopt->has_arg = no_argument;
373 /* Mask the value so we'll be able to recognize that we're
374 dealing with the false value. */
375 longopt->val = i | BOOLEAN_NEG_MARKER;
378 assert (opt->argtype != -1);
379 longopt->has_arg = opt->argtype;
382 if (longopt->has_arg == required_argument)
384 /* Don't handle optional_argument */
388 /* Terminate short_options. */
390 /* No need for xzero(long_options[o]) because its storage is static
391 and it will be zeroed by default. */
392 assert (o <= countof (long_options));
395 /* Print the usage message. */
397 print_usage (int error)
399 return fprintf (error ? stderr : stdout,
400 _("Usage: %s [OPTION]... [URL]...\n"), exec_name);
403 /* Print the help message, describing all the available options. If
404 you add an option, be sure to update this list. */
408 /* We split the help text this way to ease translation of individual
410 static const char *help[] = {
413 Mandatory arguments to long options are mandatory for short options too.\n\n"),
417 -V, --version display the version of Wget and exit.\n"),
419 -h, --help print this help.\n"),
421 -b, --background go to background after startup.\n"),
423 -e, --execute=COMMAND execute a `.wgetrc'-style command.\n"),
427 Logging and input file:\n"),
429 -o, --output-file=FILE log messages to FILE.\n"),
431 -a, --append-output=FILE append messages to FILE.\n"),
434 -d, --debug print lots of debugging information.\n"),
438 --wdebug print Watt-32 debug output.\n"),
441 -q, --quiet quiet (no output).\n"),
443 -v, --verbose be verbose (this is the default).\n"),
445 -nv, --no-verbose turn off verboseness, without being quiet.\n"),
447 -i, --input-file=FILE download URLs found in local or external FILE.\n"),
449 -F, --force-html treat input file as HTML.\n"),
451 -B, --base=URL resolves HTML input-file links (-i -F)\n\
452 relative to URL.\n"),
454 --config=FILE Specify config file to use.\n"),
460 -t, --tries=NUMBER set number of retries to NUMBER (0 unlimits).\n"),
462 --retry-connrefused retry even if connection is refused.\n"),
464 -O, --output-document=FILE write documents to FILE.\n"),
466 -nc, --no-clobber skip downloads that would download to\n\
467 existing files (overwriting them).\n"),
469 -c, --continue resume getting a partially-downloaded file.\n"),
471 --progress=TYPE select progress gauge type.\n"),
473 -N, --timestamping don't re-retrieve files unless newer than\n\
476 --no-use-server-timestamps don't set the local file's timestamp by\n\
477 the one on the server.\n"),
479 -S, --server-response print server response.\n"),
481 --spider don't download anything.\n"),
483 -T, --timeout=SECONDS set all timeout values to SECONDS.\n"),
485 --dns-timeout=SECS set the DNS lookup timeout to SECS.\n"),
487 --connect-timeout=SECS set the connect timeout to SECS.\n"),
489 --read-timeout=SECS set the read timeout to SECS.\n"),
491 -w, --wait=SECONDS wait SECONDS between retrievals.\n"),
493 --waitretry=SECONDS wait 1..SECONDS between retries of a retrieval.\n"),
495 --random-wait wait from 0.5*WAIT...1.5*WAIT secs between retrievals.\n"),
497 --no-proxy explicitly turn off proxy.\n"),
499 -Q, --quota=NUMBER set retrieval quota to NUMBER.\n"),
501 --bind-address=ADDRESS bind to ADDRESS (hostname or IP) on local host.\n"),
503 --limit-rate=RATE limit download rate to RATE.\n"),
505 --no-dns-cache disable caching DNS lookups.\n"),
507 --restrict-file-names=OS restrict chars in file names to ones OS allows.\n"),
509 --ignore-case ignore case when matching files/directories.\n"),
512 -4, --inet4-only connect only to IPv4 addresses.\n"),
514 -6, --inet6-only connect only to IPv6 addresses.\n"),
516 --prefer-family=FAMILY connect first to addresses of specified family,\n\
517 one of IPv6, IPv4, or none.\n"),
520 --user=USER set both ftp and http user to USER.\n"),
522 --password=PASS set both ftp and http password to PASS.\n"),
524 --ask-password prompt for passwords.\n"),
526 --no-iri turn off IRI support.\n"),
528 --local-encoding=ENC use ENC as the local encoding for IRIs.\n"),
530 --remote-encoding=ENC use ENC as the default remote encoding.\n"),
532 --unlink remove file before clobber.\n"),
538 -nd, --no-directories don't create directories.\n"),
540 -x, --force-directories force creation of directories.\n"),
542 -nH, --no-host-directories don't create host directories.\n"),
544 --protocol-directories use protocol name in directories.\n"),
546 -P, --directory-prefix=PREFIX save files to PREFIX/...\n"),
548 --cut-dirs=NUMBER ignore NUMBER remote directory components.\n"),
554 --http-user=USER set http user to USER.\n"),
556 --http-password=PASS set http password to PASS.\n"),
558 --no-cache disallow server-cached data.\n"),
560 --default-page=NAME Change the default page name (normally\n\
561 this is `index.html'.).\n"),
563 -E, --adjust-extension save HTML/CSS documents with proper extensions.\n"),
565 --ignore-length ignore `Content-Length' header field.\n"),
567 --header=STRING insert STRING among the headers.\n"),
569 --max-redirect maximum redirections allowed per page.\n"),
571 --proxy-user=USER set USER as proxy username.\n"),
573 --proxy-password=PASS set PASS as proxy password.\n"),
575 --referer=URL include `Referer: URL' header in HTTP request.\n"),
577 --save-headers save the HTTP headers to file.\n"),
579 -U, --user-agent=AGENT identify as AGENT instead of Wget/VERSION.\n"),
581 --no-http-keep-alive disable HTTP keep-alive (persistent connections).\n"),
583 --no-cookies don't use cookies.\n"),
585 --load-cookies=FILE load cookies from FILE before session.\n"),
587 --save-cookies=FILE save cookies to FILE after session.\n"),
589 --keep-session-cookies load and save session (non-permanent) cookies.\n"),
591 --post-data=STRING use the POST method; send STRING as the data.\n"),
593 --post-file=FILE use the POST method; send contents of FILE.\n"),
595 --content-disposition honor the Content-Disposition header when\n\
596 choosing local file names (EXPERIMENTAL).\n"),
598 --auth-no-challenge send Basic HTTP authentication information\n\
599 without first waiting for the server's\n\
605 HTTPS (SSL/TLS) options:\n"),
607 --secure-protocol=PR choose secure protocol, one of auto, SSLv2,\n\
608 SSLv3, and TLSv1.\n"),
610 --no-check-certificate don't validate the server's certificate.\n"),
612 --certificate=FILE client certificate file.\n"),
614 --certificate-type=TYPE client certificate type, PEM or DER.\n"),
616 --private-key=FILE private key file.\n"),
618 --private-key-type=TYPE private key type, PEM or DER.\n"),
620 --ca-certificate=FILE file with the bundle of CA's.\n"),
622 --ca-directory=DIR directory where hash list of CA's is stored.\n"),
624 --random-file=FILE file with random data for seeding the SSL PRNG.\n"),
626 --egd-file=FILE file naming the EGD socket with random data.\n"),
628 #endif /* HAVE_SSL */
634 --ftp-stmlf Use Stream_LF format for all binary FTP files.\n"),
635 #endif /* def __VMS */
637 --ftp-user=USER set ftp user to USER.\n"),
639 --ftp-password=PASS set ftp password to PASS.\n"),
641 --no-remove-listing don't remove `.listing' files.\n"),
643 --no-glob turn off FTP file name globbing.\n"),
645 --no-passive-ftp disable the \"passive\" transfer mode.\n"),
647 --retr-symlinks when recursing, get linked-to files (not dir).\n"),
651 Recursive download:\n"),
653 -r, --recursive specify recursive download.\n"),
655 -l, --level=NUMBER maximum recursion depth (inf or 0 for infinite).\n"),
657 --delete-after delete files locally after downloading them.\n"),
659 -k, --convert-links make links in downloaded HTML or CSS point to\n\
663 -K, --backup-converted before converting file X, back up as X_orig.\n"),
664 #else /* def __VMS */
666 -K, --backup-converted before converting file X, back up as X.orig.\n"),
667 #endif /* def __VMS [else] */
669 -m, --mirror shortcut for -N -r -l inf --no-remove-listing.\n"),
671 -p, --page-requisites get all images, etc. needed to display HTML page.\n"),
673 --strict-comments turn on strict (SGML) handling of HTML comments.\n"),
677 Recursive accept/reject:\n"),
679 -A, --accept=LIST comma-separated list of accepted extensions.\n"),
681 -R, --reject=LIST comma-separated list of rejected extensions.\n"),
683 -D, --domains=LIST comma-separated list of accepted domains.\n"),
685 --exclude-domains=LIST comma-separated list of rejected domains.\n"),
687 --follow-ftp follow FTP links from HTML documents.\n"),
689 --follow-tags=LIST comma-separated list of followed HTML tags.\n"),
691 --ignore-tags=LIST comma-separated list of ignored HTML tags.\n"),
693 -H, --span-hosts go to foreign hosts when recursive.\n"),
695 -L, --relative follow relative links only.\n"),
697 -I, --include-directories=LIST list of allowed directories.\n"),
699 --trust-server-names use the name specified by the redirection\n\
700 url last component.\n"),
702 -X, --exclude-directories=LIST list of excluded directories.\n"),
704 -np, --no-parent don't ascend to the parent directory.\n"),
707 N_("Mail bug reports and suggestions to <bug-wget@gnu.org>.\n")
712 if (printf (_("GNU Wget %s, a non-interactive network retriever.\n"),
715 if (print_usage (0) < 0)
718 for (i = 0; i < countof (help); i++)
719 if (fputs (_(help[i]), stdout) < 0)
725 /* Return a human-readable printed representation of INTERVAL,
726 measured in seconds. */
729 secs_to_human_time (double interval)
732 int secs = (int) (interval + 0.5);
733 int hours, mins, days;
735 days = secs / 86400, secs %= 86400;
736 hours = secs / 3600, secs %= 3600;
737 mins = secs / 60, secs %= 60;
740 sprintf (buf, "%dd %dh %dm %ds", days, hours, mins, secs);
742 sprintf (buf, "%dh %dm %ds", hours, mins, secs);
744 sprintf (buf, "%dm %ds", mins, secs);
746 sprintf (buf, "%ss", print_decimal (interval));
752 prompt_for_password (void)
755 fprintf (stderr, _("Password for user %s: "), quote (opt.user));
757 fprintf (stderr, _("Password: "));
761 /* Function that prints the line argument while limiting it
762 to at most line_length. prefix is printed on the first line
763 and an appropriate number of spaces are added on subsequent
766 format_and_print_line (const char *prefix, const char *line,
770 char *line_dup, *token;
772 assert (prefix != NULL);
773 assert (line != NULL);
775 line_dup = xstrdup (line);
777 if (line_length <= 0)
778 line_length = MAX_CHARS_PER_LINE - TABULATION;
780 if (printf ("%s", prefix) < 0)
782 remaining_chars = line_length;
783 /* We break on spaces. */
784 token = strtok (line_dup, " ");
785 while (token != NULL)
787 /* If however a token is much larger than the maximum
788 line length, all bets are off and we simply print the
789 token on the next line. */
790 if (remaining_chars <= strlen (token))
792 if (printf ("\n%*c", TABULATION, ' ') < 0)
794 remaining_chars = line_length - TABULATION;
796 if (printf ("%s ", token) < 0)
798 remaining_chars -= strlen (token) + 1; /* account for " " */
799 token = strtok (NULL, " ");
802 if (printf ("\n") < 0)
812 const char *wgetrc_title = _("Wgetrc: ");
813 const char *locale_title = _("Locale: ");
814 const char *compile_title = _("Compile: ");
815 const char *link_title = _("Link: ");
816 char *env_wgetrc, *user_wgetrc;
819 if (printf (_("GNU Wget %s built on %s.\n\n"), version_string, OS_TYPE) < 0)
822 for (i = 0; compiled_features[i] != NULL; )
824 int line_length = MAX_CHARS_PER_LINE;
825 while ((line_length > 0) && (compiled_features[i] != NULL))
827 if (printf ("%s ", compiled_features[i]) < 0)
829 line_length -= strlen (compiled_features[i]) + 2;
832 if (printf ("\n") < 0)
835 if (printf ("\n") < 0)
838 /* Handle the case when $WGETRC is unset and $HOME/.wgetrc is
840 if (printf ("%s\n", wgetrc_title) < 0)
843 env_wgetrc = wgetrc_env_file_name ();
844 if (env_wgetrc && *env_wgetrc)
846 if (printf (_(" %s (env)\n"), env_wgetrc) < 0)
850 user_wgetrc = wgetrc_user_file_name ();
853 if (printf (_(" %s (user)\n"), user_wgetrc) < 0)
858 if (printf (_(" %s (system)\n"), SYSTEM_WGETRC) < 0)
863 if (format_and_print_line (locale_title,
865 MAX_CHARS_PER_LINE) < 0)
867 #endif /* def ENABLE_NLS */
869 if (compilation_string != NULL)
870 if (format_and_print_line (compile_title,
872 MAX_CHARS_PER_LINE) < 0)
875 if (link_string != NULL)
876 if (format_and_print_line (link_title,
878 MAX_CHARS_PER_LINE) < 0)
881 if (printf ("\n") < 0)
884 /* TRANSLATORS: When available, an actual copyright character
885 (circle-c) should be used in preference to "(C)". */
887 Copyright (C) 2011 Free Software Foundation, Inc.\n"), stdout) < 0)
890 License GPLv3+: GNU GPL version 3 or later\n\
891 <http://www.gnu.org/licenses/gpl.html>.\n\
892 This is free software: you are free to change and redistribute it.\n\
893 There is NO WARRANTY, to the extent permitted by law.\n"), stdout) < 0)
895 /* TRANSLATORS: When available, please use the proper diacritics for
896 names such as this one. See en_US.po for reference. */
897 if (fputs (_("\nOriginally written by Hrvoje Niksic <hniksic@xemacs.org>.\n"),
900 if (fputs (_("Please send bug reports and questions to <bug-wget@gnu.org>.\n"),
907 char *program_name; /* Needed by lib/error.c. */
910 main (int argc, char **argv)
913 int i, ret, longindex;
915 bool append_to_log = false;
917 total_downloaded_bytes = 0;
919 program_name = argv[0];
921 struct ptimer *timer = ptimer_new ();
922 double start_time = ptimer_measure (timer);
926 /* Construct the name of the executable, without the directory part. */
928 /* On VMS, lose the "dev:[dir]" prefix and the ".EXE;nnn" suffix. */
929 exec_name = vms_basename (argv[0]);
930 #else /* def __VMS */
931 exec_name = strrchr (argv[0], PATH_SEPARATOR);
936 #endif /* def __VMS [else] */
939 /* Drop extension (typically .EXE) from executable filename. */
940 windows_main ((char **) &exec_name);
943 /* Load the hard-coded defaults. */
948 /* This seperate getopt_long is needed to find the user config
949 and parse it before the other user options. */
952 bool use_userconfig = false;
954 while ((retconf = getopt_long (argc, argv,
955 short_options, long_options, &longindex)) != -1)
958 bool userrc_ret = true;
959 struct cmdline_option *config_opt;
960 confval = long_options[longindex].val;
961 config_opt = &option_data[confval & ~BOOLEAN_NEG_MARKER];
962 if (strcmp (config_opt->long_name, "config") == 0)
964 userrc_ret &= run_wgetrc (optarg);
965 use_userconfig = true;
969 printf ("Exiting due to error in %s\n", optarg);
976 /* If the user did not specify a config, read the system wgetrc and ~/.wgetrc. */
977 if (use_userconfig == false)
984 while ((ret = getopt_long (argc, argv,
985 short_options, long_options, &longindex)) != -1)
988 struct cmdline_option *opt;
990 /* If LONGINDEX is unchanged, it means RET is referring a short
998 printf (_("Try `%s --help' for more options.\n"), exec_name);
1001 /* Find the short option character in the mapping. */
1002 longindex = optmap[ret - 32];
1004 val = long_options[longindex].val;
1006 /* Use the retrieved value to locate the option in the
1007 option_data array, and to see if we're dealing with the
1008 negated "--no-FOO" variant of the boolean option "--foo". */
1009 opt = &option_data[val & ~BOOLEAN_NEG_MARKER];
1013 setoptval (opt->data, optarg, opt->long_name);
1017 /* The user has specified a value -- use it. */
1018 setoptval (opt->data, optarg, opt->long_name);
1021 /* NEG is true for `--no-FOO' style boolean options. */
1022 bool neg = !!(val & BOOLEAN_NEG_MARKER);
1023 setoptval (opt->data, neg ? "0" : "1", opt->long_name);
1028 void (*func) (void) = (void (*) (void)) opt->data;
1032 case OPT__APPEND_OUTPUT:
1033 setoptval ("logfile", optarg, opt->long_name);
1034 append_to_log = true;
1037 run_command (optarg);
1041 /* We support real --no-FOO flags now, but keep these
1042 short options for convenience and backward
1045 for (p = optarg; p && *p; p++)
1049 setoptval ("verbose", "0", opt->long_name);
1052 setoptval ("addhostdir", "0", opt->long_name);
1055 setoptval ("dirstruct", "0", opt->long_name);
1058 setoptval ("noclobber", "1", opt->long_name);
1061 setoptval ("noparent", "1", opt->long_name);
1064 fprintf (stderr, _("%s: illegal option -- `-n%c'\n"),
1067 fprintf (stderr, "\n");
1068 fprintf (stderr, _("Try `%s --help' for more options.\n"),
1077 /* The wgetrc commands are named noparent and noclobber,
1078 so we must revert the meaning of the cmdline options
1079 before passing the value to setoptval. */
1082 flag = (*optarg == '1' || c_tolower (*optarg) == 'y'
1083 || (c_tolower (optarg[0]) == 'o'
1084 && c_tolower (optarg[1]) == 'n'));
1085 setoptval (opt->type == OPT__PARENT ? "noparent" : "noclobber",
1086 flag ? "0" : "1", opt->long_name);
1089 case OPT__DONT_REMOVE_LISTING:
1090 setoptval ("removelisting", "0", opt->long_name);
1097 nurl = argc - optind;
1099 /* All user options have now been processed, so it's now safe to do
1100 interoption dependency checks. */
1102 if (opt.noclobber && opt.convert_links)
1105 _("Both --no-clobber and --convert-links were specified,"
1106 "only --convert-links will be used.\n"));
1107 opt.noclobber = false;
1110 if (opt.reclevel == 0)
1111 opt.reclevel = INFINITE_RECURSION; /* see recur.h for commentary */
1113 if (opt.spider || opt.delete_after)
1114 opt.no_dirstruct = true;
1116 if (opt.page_requisites && !opt.recursive)
1118 /* Don't set opt.recursive here because it would confuse the FTP
1119 code. Instead, call retrieve_tree below when either
1120 page_requisites or recursive is requested. */
1122 if (!opt.no_dirstruct)
1123 opt.dirstruct = 1; /* normally handled by cmd_spec_recursive() */
1126 if (opt.verbose == -1)
1127 opt.verbose = !opt.quiet;
1129 /* Sanity checks. */
1130 if (opt.verbose && opt.quiet)
1132 fprintf (stderr, _("Can't be verbose and quiet at the same time.\n"));
1136 if (opt.timestamping && opt.noclobber)
1138 fprintf (stderr, _("\
1139 Can't timestamp and not clobber old files at the same time.\n"));
1144 if (opt.ipv4_only && opt.ipv6_only)
1147 _("Cannot specify both --inet4-only and --inet6-only.\n"));
1152 if (opt.output_document)
1154 if (opt.convert_links
1155 && (nurl > 1 || opt.page_requisites || opt.recursive))
1158 Cannot specify both -k and -O if multiple URLs are given, or in combination\n\
1159 with -p or -r. See the manual for details.\n\n"), stderr);
1163 if (opt.page_requisites
1166 logprintf (LOG_NOTQUIET, "%s", _("\
1167 WARNING: combining -O with -r or -p will mean that all downloaded content\n\
1168 will be placed in the single file you specified.\n\n"));
1170 if (opt.timestamping)
1172 logprintf (LOG_NOTQUIET, "%s", _("\
1173 WARNING: timestamping does nothing in combination with -O. See the manual\n\
1174 for details.\n\n"));
1175 opt.timestamping = false;
1177 if (opt.noclobber && file_exists_p(opt.output_document))
1179 /* Check if output file exists; if it does, exit. */
1180 logprintf (LOG_VERBOSE,
1181 _("File `%s' already there; not retrieving.\n"),
1182 opt.output_document);
1187 if (opt.ask_passwd && opt.passwd)
1190 _("Cannot specify both --ask-password and --password.\n"));
1195 if (!nurl && !opt.input_filename)
1197 /* No URL specified. */
1198 fprintf (stderr, _("%s: missing URL\n"), exec_name);
1201 /* #### Something nicer should be printed here -- similar to the
1202 pre-1.5 `--help' page. */
1203 fprintf (stderr, _("Try `%s --help' for more options.\n"), exec_name);
1210 if (opt.locale && !check_encoding_name (opt.locale))
1214 opt.locale = find_locale ();
1216 if (opt.encoding_remote && !check_encoding_name (opt.encoding_remote))
1217 opt.encoding_remote = NULL;
1220 memset (&dummy_iri, 0, sizeof (dummy_iri));
1221 if (opt.enable_iri || opt.locale || opt.encoding_remote)
1223 /* sXXXav : be more specific... */
1224 fprintf (stderr, _("This version does not have support for IRIs\n"));
1231 opt.passwd = prompt_for_password ();
1233 if (opt.passwd == NULL || opt.passwd[0] == '\0')
1243 fork_to_background ();
1246 /* Initialize progress. Have to do this after the options are
1247 processed so we know where the log file is. */
1249 set_progress_implementation (opt.progress_type);
1251 /* Fill in the arguments. */
1252 url = alloca_array (char *, nurl + 1);
1253 for (i = 0; i < nurl; i++, optind++)
1255 char *rewritten = rewrite_shorthand_url (argv[optind]);
1259 url[i] = xstrdup (argv[optind]);
1263 /* Initialize logging. */
1264 log_init (opt.lfilename, append_to_log);
1266 DEBUGP (("DEBUG output created by Wget %s on %s.\n\n",
1267 version_string, OS_TYPE));
1269 /* Open the output filename if necessary. */
1272 Note that having the output_stream ("-O") file opened here for an FTP
1273 URL rather than in getftp() (ftp.c) (and the http equivalent) rather
1274 limits the ability in VMS to open the file differently for ASCII
1275 versus binary FTP there. (Of course, doing it here allows a open
1276 failure to be detected immediately, without first connecting to the
1279 if (opt.output_document)
1281 if (HYPHENP (opt.output_document))
1284 _setmode (_fileno (stdout), _O_BINARY);
1286 output_stream = stdout;
1293 /* Common fopen() optional arguments:
1294 sequential access only, access callback function.
1296 # define FOPEN_OPT_ARGS , "fop=sqo", "acc", acc_cb, &open_id
1298 #else /* def __VMS */
1299 # define FOPEN_OPT_ARGS
1300 #endif /* def __VMS [else] */
1302 output_stream = fopen (opt.output_document,
1303 opt.always_rest ? "ab" : "wb"
1305 if (output_stream == NULL)
1307 perror (opt.output_document);
1310 if (fstat (fileno (output_stream), &st) == 0 && S_ISREG (st.st_mode))
1311 output_stream_regular = true;
1313 if (!output_stream_regular && opt.convert_links)
1315 fprintf (stderr, _("-k can be used together with -O only if \
1316 outputting to a regular file.\n"));
1323 /* Set global ODS5 flag according to the specified destination (if
1324 any), otherwise according to the current default device.
1326 if (output_stream == NULL)
1327 set_ods5_dest( "SYS$DISK");
1328 else if (output_stream != stdout)
1329 set_ods5_dest( opt.output_document);
1330 #endif /* def __VMS */
1337 /* Setup the signal handler to redirect output when hangup is
1339 if (signal(SIGHUP, SIG_IGN) != SIG_IGN)
1340 signal(SIGHUP, redirect_output_signal);
1342 /* ...and do the same for SIGUSR1. */
1344 signal (SIGUSR1, redirect_output_signal);
1347 /* Writing to a closed socket normally signals SIGPIPE, and the
1348 process exits. What we want is to ignore SIGPIPE and just check
1349 for the return value of write(). */
1350 signal (SIGPIPE, SIG_IGN);
1353 signal (SIGWINCH, progress_handle_sigwinch);
1356 /* Retrieve the URLs from argument list. */
1357 for (t = url; *t; t++)
1359 char *filename = NULL, *redirected_URL = NULL;
1361 /* Need to do a new struct iri every time, because
1362 * retrieve_url may modify it in some circumstances,
1364 struct iri *iri = iri_new ();
1365 struct url *url_parsed;
1367 set_uri_encoding (iri, opt.locale, true);
1368 url_parsed = url_parse (*t, &url_err, iri, true);
1372 char *error = url_error (*t, url_err);
1373 logprintf (LOG_NOTQUIET, "%s: %s.\n",*t, error);
1375 inform_exit_status (URLERROR);
1379 if ((opt.recursive || opt.page_requisites)
1380 && (url_scheme (*t) != SCHEME_FTP || url_uses_proxy (url_parsed)))
1382 int old_follow_ftp = opt.follow_ftp;
1384 /* Turn opt.follow_ftp on in case of recursive FTP retrieval */
1385 if (url_scheme (*t) == SCHEME_FTP)
1388 retrieve_tree (url_parsed, NULL);
1390 opt.follow_ftp = old_follow_ftp;
1394 retrieve_url (url_parsed, *t, &filename, &redirected_URL, NULL,
1395 &dt, opt.recursive, iri, true);
1398 if (opt.delete_after && file_exists_p(filename))
1400 DEBUGP (("Removing file due to --delete-after in main():\n"));
1401 logprintf (LOG_VERBOSE, _("Removing %s.\n"), filename);
1402 if (unlink (filename))
1403 logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
1405 xfree_null (redirected_URL);
1406 xfree_null (filename);
1407 url_free (url_parsed);
1412 /* And then from the input file, if any. */
1413 if (opt.input_filename)
1417 status = retrieve_from_file (opt.input_filename, opt.force_html, &count);
1418 inform_exit_status (status);
1420 logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"),
1421 opt.input_filename);
1424 /* Print broken links. */
1425 if (opt.recursive && opt.spider)
1426 print_broken_links ();
1428 /* Print the downloaded sum. */
1429 if ((opt.recursive || opt.page_requisites
1431 || (opt.input_filename && total_downloaded_bytes != 0))
1433 total_downloaded_bytes != 0)
1435 double end_time = ptimer_measure (timer);
1436 ptimer_destroy (timer);
1438 char *wall_time = xstrdup (secs_to_human_time (end_time - start_time));
1439 char *download_time = xstrdup (secs_to_human_time (total_download_time));
1440 logprintf (LOG_NOTQUIET,
1441 _("FINISHED --%s--\nTotal wall clock time: %s\n"
1442 "Downloaded: %d files, %s in %s (%s)\n"),
1443 datetime_str (time (NULL)),
1446 human_readable (total_downloaded_bytes),
1448 retr_rate (total_downloaded_bytes, total_download_time));
1450 xfree (download_time);
1452 /* Print quota warning, if exceeded. */
1453 if (opt.quota && total_downloaded_bytes > opt.quota)
1454 logprintf (LOG_NOTQUIET,
1455 _("Download quota of %s EXCEEDED!\n"),
1456 human_readable (opt.quota));
1459 if (opt.cookies_output)
1462 if (opt.convert_links && !opt.delete_after)
1463 convert_all_links ();
1466 for (i = 0; i < nurl; i++)
1470 return get_exit_status ();
1472 #endif /* TESTING */
1474 #if defined(SIGHUP) || defined(SIGUSR1)
1476 /* So the signal_name check doesn't blow when only one is available. */
1484 /* Hangup signal handler. When wget receives SIGHUP or SIGUSR1, it
1485 will proceed operation as usual, trying to write into a log file.
1486 If that is impossible, the output will be turned off. */
1489 redirect_output_signal (int sig)
1491 const char *signal_name = (sig == SIGHUP ? "SIGHUP" :
1492 (sig == SIGUSR1 ? "SIGUSR1" :
1494 log_request_redirect_output (signal_name);
1495 progress_schedule_redirect ();
1496 signal (sig, redirect_output_signal);