1 /* Command line parsing.
2 Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
3 2005, 2006, 2007, 2008, 2009, 2010 Free Software Foundation, Inc.
5 This file is part of GNU Wget.
7 GNU Wget is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
12 GNU Wget is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with Wget. If not, see <http://www.gnu.org/licenses/>.
20 Additional permission under GNU GPL version 3 section 7
22 If you modify this program, or any covered work, by linking or
23 combining it with the OpenSSL project's OpenSSL library (or a
24 modified version of that library), containing parts covered by the
25 terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
26 grants you additional permission to convey the resulting work.
27 Corresponding Source for a non-source form of such a combination
28 shall include the source code for the parts of OpenSSL used as well
29 as that of the covered work. */
52 #include "progress.h" /* for progress_handle_sigwinch */
55 #include "http.h" /* for save_cookies */
66 #ifndef PATH_SEPARATOR
67 # define PATH_SEPARATOR '/'
72 /* defined in version.c */
73 extern char *version_string;
74 extern char *compilation_string;
75 extern char *system_getrc;
76 extern char *link_string;
77 /* defined in build_info.c */
78 extern const char *compiled_features[];
79 /* Used for --version output in print_version */
80 #define MAX_CHARS_PER_LINE 72
83 #if defined(SIGHUP) || defined(SIGUSR1)
84 static void redirect_output_signal (int);
87 const char *exec_name;
89 /* Number of successfully downloaded URLs */
93 /* Initialize I18N/L10N. That amounts to invoking setlocale, and
94 setting up gettext's message catalog using bindtextdomain and
95 textdomain. Does nothing if NLS is disabled or missing. */
98 i18n_initialize (void)
100 /* ENABLE_NLS implies existence of functions invoked here. */
102 /* Set the current locale. */
103 setlocale (LC_ALL, "");
104 /* Set the text message domain. */
105 bindtextdomain ("wget", LOCALEDIR);
107 #endif /* ENABLE_NLS */
110 /* Definition of command-line options. */
112 static void print_help (void);
113 static void print_version (void);
118 # define IF_SSL(x) NULL
122 # define WHEN_DEBUG(x) x
124 # define WHEN_DEBUG(x) NULL
127 struct cmdline_option {
128 const char *long_name;
134 /* Non-standard options that have to be handled specially in
138 OPT__DONT_REMOVE_LISTING,
143 const void *data; /* for standard options */
144 int argtype; /* for non-standard options */
147 static struct cmdline_option option_data[] =
149 { "accept", 'A', OPT_VALUE, "accept", -1 },
150 { "adjust-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 },
151 { "append-output", 'a', OPT__APPEND_OUTPUT, NULL, required_argument },
152 { "ask-password", 0, OPT_BOOLEAN, "askpassword", -1 },
153 { "auth-no-challenge", 0, OPT_BOOLEAN, "authnochallenge", -1 },
154 { "background", 'b', OPT_BOOLEAN, "background", -1 },
155 { "backup-converted", 'K', OPT_BOOLEAN, "backupconverted", -1 },
156 { "backups", 0, OPT_BOOLEAN, "backups", -1 },
157 { "base", 'B', OPT_VALUE, "base", -1 },
158 { "bind-address", 0, OPT_VALUE, "bindaddress", -1 },
159 { IF_SSL ("ca-certificate"), 0, OPT_VALUE, "cacertificate", -1 },
160 { IF_SSL ("ca-directory"), 0, OPT_VALUE, "cadirectory", -1 },
161 { "cache", 0, OPT_BOOLEAN, "cache", -1 },
162 { IF_SSL ("certificate"), 0, OPT_VALUE, "certificate", -1 },
163 { IF_SSL ("certificate-type"), 0, OPT_VALUE, "certificatetype", -1 },
164 { IF_SSL ("check-certificate"), 0, OPT_BOOLEAN, "checkcertificate", -1 },
165 { "clobber", 0, OPT__CLOBBER, NULL, optional_argument },
166 { "config", 0, OPT_VALUE, "chooseconfig", -1 },
167 { "connect-timeout", 0, OPT_VALUE, "connecttimeout", -1 },
168 { "continue", 'c', OPT_BOOLEAN, "continue", -1 },
169 { "convert-links", 'k', OPT_BOOLEAN, "convertlinks", -1 },
170 { "content-disposition", 0, OPT_BOOLEAN, "contentdisposition", -1 },
171 { "cookies", 0, OPT_BOOLEAN, "cookies", -1 },
172 { "cut-dirs", 0, OPT_VALUE, "cutdirs", -1 },
173 { WHEN_DEBUG ("debug"), 'd', OPT_BOOLEAN, "debug", -1 },
174 { "default-page", 0, OPT_VALUE, "defaultpage", -1 },
175 { "delete-after", 0, OPT_BOOLEAN, "deleteafter", -1 },
176 { "directories", 0, OPT_BOOLEAN, "dirstruct", -1 },
177 { "directory-prefix", 'P', OPT_VALUE, "dirprefix", -1 },
178 { "dns-cache", 0, OPT_BOOLEAN, "dnscache", -1 },
179 { "dns-timeout", 0, OPT_VALUE, "dnstimeout", -1 },
180 { "domains", 'D', OPT_VALUE, "domains", -1 },
181 { "dont-remove-listing", 0, OPT__DONT_REMOVE_LISTING, NULL, no_argument },
182 { "dot-style", 0, OPT_VALUE, "dotstyle", -1 }, /* deprecated */
183 { "egd-file", 0, OPT_VALUE, "egdfile", -1 },
184 { "exclude-directories", 'X', OPT_VALUE, "excludedirectories", -1 },
185 { "exclude-domains", 0, OPT_VALUE, "excludedomains", -1 },
186 { "execute", 'e', OPT__EXECUTE, NULL, required_argument },
187 { "follow-ftp", 0, OPT_BOOLEAN, "followftp", -1 },
188 { "follow-tags", 0, OPT_VALUE, "followtags", -1 },
189 { "force-directories", 'x', OPT_BOOLEAN, "dirstruct", -1 },
190 { "force-html", 'F', OPT_BOOLEAN, "forcehtml", -1 },
191 { "ftp-password", 0, OPT_VALUE, "ftppassword", -1 },
193 { "ftp-stmlf", 0, OPT_BOOLEAN, "ftpstmlf", -1 },
194 #endif /* def __VMS */
195 { "ftp-user", 0, OPT_VALUE, "ftpuser", -1 },
196 { "glob", 0, OPT_BOOLEAN, "glob", -1 },
197 { "header", 0, OPT_VALUE, "header", -1 },
198 { "help", 'h', OPT_FUNCALL, (void *)print_help, no_argument },
199 { "host-directories", 0, OPT_BOOLEAN, "addhostdir", -1 },
200 { "html-extension", 'E', OPT_BOOLEAN, "adjustextension", -1 }, /* deprecated */
201 { "htmlify", 0, OPT_BOOLEAN, "htmlify", -1 },
202 { "http-keep-alive", 0, OPT_BOOLEAN, "httpkeepalive", -1 },
203 { "http-passwd", 0, OPT_VALUE, "httppassword", -1 }, /* deprecated */
204 { "http-password", 0, OPT_VALUE, "httppassword", -1 },
205 { "http-user", 0, OPT_VALUE, "httpuser", -1 },
206 { "ignore-case", 0, OPT_BOOLEAN, "ignorecase", -1 },
207 { "ignore-length", 0, OPT_BOOLEAN, "ignorelength", -1 },
208 { "ignore-tags", 0, OPT_VALUE, "ignoretags", -1 },
209 { "include-directories", 'I', OPT_VALUE, "includedirectories", -1 },
211 { "inet4-only", '4', OPT_BOOLEAN, "inet4only", -1 },
212 { "inet6-only", '6', OPT_BOOLEAN, "inet6only", -1 },
214 { "input-file", 'i', OPT_VALUE, "input", -1 },
215 { "iri", 0, OPT_BOOLEAN, "iri", -1 },
216 { "keep-session-cookies", 0, OPT_BOOLEAN, "keepsessioncookies", -1 },
217 { "level", 'l', OPT_VALUE, "reclevel", -1 },
218 { "limit-rate", 0, OPT_VALUE, "limitrate", -1 },
219 { "load-cookies", 0, OPT_VALUE, "loadcookies", -1 },
220 { "local-encoding", 0, OPT_VALUE, "localencoding", -1 },
221 { "max-redirect", 0, OPT_VALUE, "maxredirect", -1 },
222 { "mirror", 'm', OPT_BOOLEAN, "mirror", -1 },
223 { "no", 'n', OPT__NO, NULL, required_argument },
224 { "no-clobber", 0, OPT_BOOLEAN, "noclobber", -1 },
225 { "no-parent", 0, OPT_BOOLEAN, "noparent", -1 },
226 { "output-document", 'O', OPT_VALUE, "outputdocument", -1 },
227 { "output-file", 'o', OPT_VALUE, "logfile", -1 },
228 { "page-requisites", 'p', OPT_BOOLEAN, "pagerequisites", -1 },
229 { "parent", 0, OPT__PARENT, NULL, optional_argument },
230 { "passive-ftp", 0, OPT_BOOLEAN, "passiveftp", -1 },
231 { "password", 0, OPT_VALUE, "password", -1 },
232 { "post-data", 0, OPT_VALUE, "postdata", -1 },
233 { "post-file", 0, OPT_VALUE, "postfile", -1 },
234 { "prefer-family", 0, OPT_VALUE, "preferfamily", -1 },
235 { "preserve-permissions", 0, OPT_BOOLEAN, "preservepermissions", -1 }, /* deprecated */
236 { IF_SSL ("private-key"), 0, OPT_VALUE, "privatekey", -1 },
237 { IF_SSL ("private-key-type"), 0, OPT_VALUE, "privatekeytype", -1 },
238 { "progress", 0, OPT_VALUE, "progress", -1 },
239 { "protocol-directories", 0, OPT_BOOLEAN, "protocoldirectories", -1 },
240 { "proxy", 0, OPT_BOOLEAN, "useproxy", -1 },
241 { "proxy__compat", 'Y', OPT_VALUE, "useproxy", -1 }, /* back-compatible */
242 { "proxy-passwd", 0, OPT_VALUE, "proxypassword", -1 }, /* deprecated */
243 { "proxy-password", 0, OPT_VALUE, "proxypassword", -1 },
244 { "proxy-user", 0, OPT_VALUE, "proxyuser", -1 },
245 { "quiet", 'q', OPT_BOOLEAN, "quiet", -1 },
246 { "quota", 'Q', OPT_VALUE, "quota", -1 },
247 { "random-file", 0, OPT_VALUE, "randomfile", -1 },
248 { "random-wait", 0, OPT_BOOLEAN, "randomwait", -1 },
249 { "read-timeout", 0, OPT_VALUE, "readtimeout", -1 },
250 { "recursive", 'r', OPT_BOOLEAN, "recursive", -1 },
251 { "referer", 0, OPT_VALUE, "referer", -1 },
252 { "reject", 'R', OPT_VALUE, "reject", -1 },
253 { "relative", 'L', OPT_BOOLEAN, "relativeonly", -1 },
254 { "remote-encoding", 0, OPT_VALUE, "remoteencoding", -1 },
255 { "remove-listing", 0, OPT_BOOLEAN, "removelisting", -1 },
256 { "restrict-file-names", 0, OPT_BOOLEAN, "restrictfilenames", -1 },
257 { "retr-symlinks", 0, OPT_BOOLEAN, "retrsymlinks", -1 },
258 { "retry-connrefused", 0, OPT_BOOLEAN, "retryconnrefused", -1 },
259 { "save-cookies", 0, OPT_VALUE, "savecookies", -1 },
260 { "save-headers", 0, OPT_BOOLEAN, "saveheaders", -1 },
261 { IF_SSL ("secure-protocol"), 0, OPT_VALUE, "secureprotocol", -1 },
262 { "server-response", 'S', OPT_BOOLEAN, "serverresponse", -1 },
263 { "span-hosts", 'H', OPT_BOOLEAN, "spanhosts", -1 },
264 { "spider", 0, OPT_BOOLEAN, "spider", -1 },
265 { "strict-comments", 0, OPT_BOOLEAN, "strictcomments", -1 },
266 { "timeout", 'T', OPT_VALUE, "timeout", -1 },
267 { "timestamping", 'N', OPT_BOOLEAN, "timestamping", -1 },
268 { "tries", 't', OPT_VALUE, "tries", -1 },
269 { "unlink", 0, OPT_BOOLEAN, "unlink", -1 },
270 { "trust-server-names", 0, OPT_BOOLEAN, "trustservernames", -1 },
271 { "use-server-timestamps", 0, OPT_BOOLEAN, "useservertimestamps", -1 },
272 { "user", 0, OPT_VALUE, "user", -1 },
273 { "user-agent", 'U', OPT_VALUE, "useragent", -1 },
274 { "verbose", 'v', OPT_BOOLEAN, "verbose", -1 },
275 { "verbose", 0, OPT_BOOLEAN, "verbose", -1 },
276 { "version", 'V', OPT_FUNCALL, (void *) print_version, no_argument },
277 { "wait", 'w', OPT_VALUE, "wait", -1 },
278 { "waitretry", 0, OPT_VALUE, "waitretry", -1 },
280 { "wdebug", 0, OPT_BOOLEAN, "wdebug", -1 },
287 /* Return a string that contains S with "no-" prepended. The string
288 is NUL-terminated and allocated off static storage at Wget
292 no_prefix (const char *s)
294 static char buffer[1024];
295 static char *p = buffer;
298 int size = 3 + strlen (s) + 1; /* "no-STRING\0" */
299 if (p + size >= buffer + sizeof (buffer))
302 cp[0] = 'n', cp[1] = 'o', cp[2] = '-';
308 /* The arguments that main passes to getopt_long. */
309 static struct option long_options[2 * countof (option_data) + 1];
310 static char short_options[128];
312 /* Mapping between short option chars and option_data indices. */
313 static unsigned char optmap[96];
315 /* Marker for `--no-FOO' values in long_options. */
316 #define BOOLEAN_NEG_MARKER 1024
318 /* Initialize the long_options array used by getopt_long from the data
324 char *p = short_options;
326 for (i = 0; i < countof (option_data); i++)
328 struct cmdline_option *opt = &option_data[i];
329 struct option *longopt;
332 /* The option is disabled. */
335 longopt = &long_options[o++];
336 longopt->name = opt->long_name;
340 *p++ = opt->short_name;
341 optmap[opt->short_name - 32] = longopt - long_options;
346 longopt->has_arg = required_argument;
351 /* Specify an optional argument for long options, so that
352 --option=off works the same as --no-option, for
353 compatibility with pre-1.10 Wget. However, don't specify
354 optional arguments for short-option booleans because they
355 prevent combining of short options. */
356 longopt->has_arg = optional_argument;
357 /* For Boolean options, add the "--no-FOO" variant, which is
358 identical to "--foo", except it has opposite meaning and
359 it doesn't allow an argument. */
360 longopt = &long_options[o++];
361 longopt->name = no_prefix (opt->long_name);
362 longopt->has_arg = no_argument;
363 /* Mask the value so we'll be able to recognize that we're
364 dealing with the false value. */
365 longopt->val = i | BOOLEAN_NEG_MARKER;
368 assert (opt->argtype != -1);
369 longopt->has_arg = opt->argtype;
372 if (longopt->has_arg == required_argument)
374 /* Don't handle optional_argument */
378 /* Terminate short_options. */
380 /* No need for xzero(long_options[o]) because its storage is static
381 and it will be zeroed by default. */
382 assert (o <= countof (long_options));
385 /* Print the usage message. */
387 print_usage (int error)
389 fprintf (error ? stderr : stdout, _("Usage: %s [OPTION]... [URL]...\n"),
393 /* Print the help message, describing all the available options. If
394 you add an option, be sure to update this list. */
398 /* We split the help text this way to ease translation of individual
400 static const char *help[] = {
403 Mandatory arguments to long options are mandatory for short options too.\n\n"),
407 -V, --version display the version of Wget and exit.\n"),
409 -h, --help print this help.\n"),
411 -b, --background go to background after startup.\n"),
413 -e, --execute=COMMAND execute a `.wgetrc'-style command.\n"),
417 Logging and input file:\n"),
419 -o, --output-file=FILE log messages to FILE.\n"),
421 -a, --append-output=FILE append messages to FILE.\n"),
424 -d, --debug print lots of debugging information.\n"),
428 --wdebug print Watt-32 debug output.\n"),
431 -q, --quiet quiet (no output).\n"),
433 -v, --verbose be verbose (this is the default).\n"),
435 -nv, --no-verbose turn off verboseness, without being quiet.\n"),
437 -i, --input-file=FILE download URLs found in local or external FILE.\n"),
439 -F, --force-html treat input file as HTML.\n"),
441 -B, --base=URL resolves HTML input-file links (-i -F)\n\
442 relative to URL.\n"),
444 --config=FILE Specify config file to use.\n"),
450 -t, --tries=NUMBER set number of retries to NUMBER (0 unlimits).\n"),
452 --retry-connrefused retry even if connection is refused.\n"),
454 -O, --output-document=FILE write documents to FILE.\n"),
456 -nc, --no-clobber skip downloads that would download to\n\
459 -c, --continue resume getting a partially-downloaded file.\n"),
461 --progress=TYPE select progress gauge type.\n"),
463 -N, --timestamping don't re-retrieve files unless newer than\n\
466 --no-use-server-timestamps don't set the local file's timestamp by\n\
467 the one on the server.\n"),
469 -S, --server-response print server response.\n"),
471 --spider don't download anything.\n"),
473 -T, --timeout=SECONDS set all timeout values to SECONDS.\n"),
475 --dns-timeout=SECS set the DNS lookup timeout to SECS.\n"),
477 --connect-timeout=SECS set the connect timeout to SECS.\n"),
479 --read-timeout=SECS set the read timeout to SECS.\n"),
481 -w, --wait=SECONDS wait SECONDS between retrievals.\n"),
483 --waitretry=SECONDS wait 1..SECONDS between retries of a retrieval.\n"),
485 --random-wait wait from 0.5*WAIT...1.5*WAIT secs between retrievals.\n"),
487 --no-proxy explicitly turn off proxy.\n"),
489 -Q, --quota=NUMBER set retrieval quota to NUMBER.\n"),
491 --bind-address=ADDRESS bind to ADDRESS (hostname or IP) on local host.\n"),
493 --limit-rate=RATE limit download rate to RATE.\n"),
495 --no-dns-cache disable caching DNS lookups.\n"),
497 --restrict-file-names=OS restrict chars in file names to ones OS allows.\n"),
499 --ignore-case ignore case when matching files/directories.\n"),
502 -4, --inet4-only connect only to IPv4 addresses.\n"),
504 -6, --inet6-only connect only to IPv6 addresses.\n"),
506 --prefer-family=FAMILY connect first to addresses of specified family,\n\
507 one of IPv6, IPv4, or none.\n"),
510 --user=USER set both ftp and http user to USER.\n"),
512 --password=PASS set both ftp and http password to PASS.\n"),
514 --ask-password prompt for passwords.\n"),
516 --no-iri turn off IRI support.\n"),
518 --local-encoding=ENC use ENC as the local encoding for IRIs.\n"),
520 --remote-encoding=ENC use ENC as the default remote encoding.\n"),
522 --unlink remove file before clobber.\n"),
528 -nd, --no-directories don't create directories.\n"),
530 -x, --force-directories force creation of directories.\n"),
532 -nH, --no-host-directories don't create host directories.\n"),
534 --protocol-directories use protocol name in directories.\n"),
536 -P, --directory-prefix=PREFIX save files to PREFIX/...\n"),
538 --cut-dirs=NUMBER ignore NUMBER remote directory components.\n"),
544 --http-user=USER set http user to USER.\n"),
546 --http-password=PASS set http password to PASS.\n"),
548 --no-cache disallow server-cached data.\n"),
550 --default-page=NAME Change the default page name (normally\n\
551 this is `index.html'.).\n"),
553 -E, --adjust-extension save HTML/CSS documents with proper extensions.\n"),
555 --ignore-length ignore `Content-Length' header field.\n"),
557 --header=STRING insert STRING among the headers.\n"),
559 --max-redirect maximum redirections allowed per page.\n"),
561 --proxy-user=USER set USER as proxy username.\n"),
563 --proxy-password=PASS set PASS as proxy password.\n"),
565 --referer=URL include `Referer: URL' header in HTTP request.\n"),
567 --save-headers save the HTTP headers to file.\n"),
569 -U, --user-agent=AGENT identify as AGENT instead of Wget/VERSION.\n"),
571 --no-http-keep-alive disable HTTP keep-alive (persistent connections).\n"),
573 --no-cookies don't use cookies.\n"),
575 --load-cookies=FILE load cookies from FILE before session.\n"),
577 --save-cookies=FILE save cookies to FILE after session.\n"),
579 --keep-session-cookies load and save session (non-permanent) cookies.\n"),
581 --post-data=STRING use the POST method; send STRING as the data.\n"),
583 --post-file=FILE use the POST method; send contents of FILE.\n"),
585 --content-disposition honor the Content-Disposition header when\n\
586 choosing local file names (EXPERIMENTAL).\n"),
588 --auth-no-challenge send Basic HTTP authentication information\n\
589 without first waiting for the server's\n\
595 HTTPS (SSL/TLS) options:\n"),
597 --secure-protocol=PR choose secure protocol, one of auto, SSLv2,\n\
598 SSLv3, and TLSv1.\n"),
600 --no-check-certificate don't validate the server's certificate.\n"),
602 --certificate=FILE client certificate file.\n"),
604 --certificate-type=TYPE client certificate type, PEM or DER.\n"),
606 --private-key=FILE private key file.\n"),
608 --private-key-type=TYPE private key type, PEM or DER.\n"),
610 --ca-certificate=FILE file with the bundle of CA's.\n"),
612 --ca-directory=DIR directory where hash list of CA's is stored.\n"),
614 --random-file=FILE file with random data for seeding the SSL PRNG.\n"),
616 --egd-file=FILE file naming the EGD socket with random data.\n"),
618 #endif /* HAVE_SSL */
624 --ftp-stmlf Use Stream_LF format for all binary FTP files.\n"),
625 #endif /* def __VMS */
627 --ftp-user=USER set ftp user to USER.\n"),
629 --ftp-password=PASS set ftp password to PASS.\n"),
631 --no-remove-listing don't remove `.listing' files.\n"),
633 --no-glob turn off FTP file name globbing.\n"),
635 --no-passive-ftp disable the \"passive\" transfer mode.\n"),
637 --retr-symlinks when recursing, get linked-to files (not dir).\n"),
641 Recursive download:\n"),
643 -r, --recursive specify recursive download.\n"),
645 -l, --level=NUMBER maximum recursion depth (inf or 0 for infinite).\n"),
647 --delete-after delete files locally after downloading them.\n"),
649 -k, --convert-links make links in downloaded HTML or CSS point to\n\
653 -K, --backup-converted before converting file X, back up as X_orig.\n"),
654 #else /* def __VMS */
656 -K, --backup-converted before converting file X, back up as X.orig.\n"),
657 #endif /* def __VMS [else] */
659 -m, --mirror shortcut for -N -r -l inf --no-remove-listing.\n"),
661 -p, --page-requisites get all images, etc. needed to display HTML page.\n"),
663 --strict-comments turn on strict (SGML) handling of HTML comments.\n"),
667 Recursive accept/reject:\n"),
669 -A, --accept=LIST comma-separated list of accepted extensions.\n"),
671 -R, --reject=LIST comma-separated list of rejected extensions.\n"),
673 -D, --domains=LIST comma-separated list of accepted domains.\n"),
675 --exclude-domains=LIST comma-separated list of rejected domains.\n"),
677 --follow-ftp follow FTP links from HTML documents.\n"),
679 --follow-tags=LIST comma-separated list of followed HTML tags.\n"),
681 --ignore-tags=LIST comma-separated list of ignored HTML tags.\n"),
683 -H, --span-hosts go to foreign hosts when recursive.\n"),
685 -L, --relative follow relative links only.\n"),
687 -I, --include-directories=LIST list of allowed directories.\n"),
689 --trust-server-names use the name specified by the redirection\n\
690 url last component.\n"),
692 -X, --exclude-directories=LIST list of excluded directories.\n"),
694 -np, --no-parent don't ascend to the parent directory.\n"),
697 N_("Mail bug reports and suggestions to <bug-wget@gnu.org>.\n")
702 printf (_("GNU Wget %s, a non-interactive network retriever.\n"),
706 for (i = 0; i < countof (help); i++)
707 fputs (_(help[i]), stdout);
712 /* Return a human-readable printed representation of INTERVAL,
713 measured in seconds. */
716 secs_to_human_time (double interval)
719 int secs = (int) (interval + 0.5);
720 int hours, mins, days;
722 days = secs / 86400, secs %= 86400;
723 hours = secs / 3600, secs %= 3600;
724 mins = secs / 60, secs %= 60;
727 sprintf (buf, "%dd %dh %dm %ds", days, hours, mins, secs);
729 sprintf (buf, "%dh %dm %ds", hours, mins, secs);
731 sprintf (buf, "%dm %ds", mins, secs);
733 sprintf (buf, "%ss", print_decimal (interval));
739 prompt_for_password (void)
742 printf (_("Password for user %s: "), quote (opt.user));
744 printf (_("Password: "));
748 /* Function that prints the line argument while limiting it
749 to at most line_length. prefix is printed on the first line
750 and an appropriate number of spaces are added on subsequent
753 format_and_print_line (const char *prefix, const char *line,
757 char *line_dup, *token;
759 assert (prefix != NULL);
760 assert (line != NULL);
762 line_dup = xstrdup (line);
764 if (line_length <= 0)
765 line_length = MAX_CHARS_PER_LINE - TABULATION;
767 printf ("%s", prefix);
768 remaining_chars = line_length;
769 /* We break on spaces. */
770 token = strtok (line_dup, " ");
771 while (token != NULL)
773 /* If however a token is much larger than the maximum
774 line length, all bets are off and we simply print the
775 token on the next line. */
776 if (remaining_chars <= strlen (token))
778 printf ("\n%*c", TABULATION, ' ');
779 remaining_chars = line_length - TABULATION;
781 printf ("%s ", token);
782 remaining_chars -= strlen (token) + 1; /* account for " " */
783 token = strtok (NULL, " ");
794 const char *wgetrc_title = _("Wgetrc: ");
795 const char *locale_title = _("Locale: ");
796 const char *compile_title = _("Compile: ");
797 const char *link_title = _("Link: ");
798 char *env_wgetrc, *user_wgetrc;
801 printf (_("GNU Wget %s built on %s.\n\n"), version_string, OS_TYPE);
803 for (i = 0; compiled_features[i] != NULL; )
805 int line_length = MAX_CHARS_PER_LINE;
806 while ((line_length > 0) && (compiled_features[i] != NULL))
808 printf ("%s ", compiled_features[i]);
809 line_length -= strlen (compiled_features[i]) + 2;
816 /* Handle the case when $WGETRC is unset and $HOME/.wgetrc is
818 printf ("%s\n", wgetrc_title);
819 env_wgetrc = wgetrc_env_file_name ();
820 if (env_wgetrc && *env_wgetrc)
822 printf (_(" %s (env)\n"), env_wgetrc);
825 user_wgetrc = wgetrc_user_file_name ();
828 printf (_(" %s (user)\n"), user_wgetrc);
832 printf (_(" %s (system)\n"), SYSTEM_WGETRC);
836 format_and_print_line (locale_title,
839 #endif /* def ENABLE_NLS */
841 if (compilation_string != NULL)
842 format_and_print_line (compile_title,
846 if (link_string != NULL)
847 format_and_print_line (link_title,
852 /* TRANSLATORS: When available, an actual copyright character
853 (circle-c) should be used in preference to "(C)". */
855 Copyright (C) 2009 Free Software Foundation, Inc.\n"), stdout);
857 License GPLv3+: GNU GPL version 3 or later\n\
858 <http://www.gnu.org/licenses/gpl.html>.\n\
859 This is free software: you are free to change and redistribute it.\n\
860 There is NO WARRANTY, to the extent permitted by law.\n"), stdout);
861 /* TRANSLATORS: When available, please use the proper diacritics for
862 names such as this one. See en_US.po for reference. */
863 fputs (_("\nOriginally written by Hrvoje Niksic <hniksic@xemacs.org>.\n"),
865 fputs (_("Please send bug reports and questions to <bug-wget@gnu.org>.\n"),
870 char *program_name; /* Needed by lib/error.c. */
873 main (int argc, char **argv)
876 int i, ret, longindex;
878 bool append_to_log = false;
880 program_name = argv[0];
882 struct ptimer *timer = ptimer_new ();
883 double start_time = ptimer_measure (timer);
887 /* Construct the name of the executable, without the directory part. */
889 /* On VMS, lose the "dev:[dir]" prefix and the ".EXE;nnn" suffix. */
890 exec_name = vms_basename (argv[0]);
891 #else /* def __VMS */
892 exec_name = strrchr (argv[0], PATH_SEPARATOR);
897 #endif /* def __VMS [else] */
900 /* Drop extension (typically .EXE) from executable filename. */
901 windows_main ((char **) &exec_name);
904 /* Load the hard-coded defaults. */
909 /* This separate getopt_long is needed to find the user config
910 and parse it before the other user options. */
913 bool use_userconfig = false;
915 while ((retconf = getopt_long (argc, argv,
916 short_options, long_options, &longindex)) != -1)
919 bool userrc_ret = true;
920 struct cmdline_option *config_opt;
921 confval = long_options[longindex].val;
922 config_opt = &option_data[confval & ~BOOLEAN_NEG_MARKER];
923 if (strcmp (config_opt->long_name, "config") == 0)
925 userrc_ret &= run_wgetrc (optarg);
926 use_userconfig = true;
930 printf ("Exiting due to error in %s\n", optarg);
937 /* If the user did not specify a config, read the system wgetrc and ~/.wgetrc. */
938 if (use_userconfig == false)
945 while ((ret = getopt_long (argc, argv,
946 short_options, long_options, &longindex)) != -1)
949 struct cmdline_option *opt;
951 /* If LONGINDEX is unchanged, it means RET is referring to a short
959 printf (_("Try `%s --help' for more options.\n"), exec_name);
962 /* Find the short option character in the mapping. */
963 longindex = optmap[ret - 32];
965 val = long_options[longindex].val;
967 /* Use the retrieved value to locate the option in the
968 option_data array, and to see if we're dealing with the
969 negated "--no-FOO" variant of the boolean option "--foo". */
970 opt = &option_data[val & ~BOOLEAN_NEG_MARKER];
974 setoptval (opt->data, optarg, opt->long_name);
978 /* The user has specified a value -- use it. */
979 setoptval (opt->data, optarg, opt->long_name);
982 /* NEG is true for `--no-FOO' style boolean options. */
983 bool neg = !!(val & BOOLEAN_NEG_MARKER);
984 setoptval (opt->data, neg ? "0" : "1", opt->long_name);
989 void (*func) (void) = (void (*) (void)) opt->data;
993 case OPT__APPEND_OUTPUT:
994 setoptval ("logfile", optarg, opt->long_name);
995 append_to_log = true;
998 run_command (optarg);
1002 /* We support real --no-FOO flags now, but keep these
1003 short options for convenience and backward
1006 for (p = optarg; p && *p; p++)
1010 setoptval ("verbose", "0", opt->long_name);
1013 setoptval ("addhostdir", "0", opt->long_name);
1016 setoptval ("dirstruct", "0", opt->long_name);
1019 setoptval ("noclobber", "1", opt->long_name);
1022 setoptval ("noparent", "1", opt->long_name);
1025 fprintf (stderr, _("%s: illegal option -- `-n%c'\n"),
1028 fprintf (stderr, "\n");
1029 fprintf (stderr, _("Try `%s --help' for more options.\n"),
1038 /* The wgetrc commands are named noparent and noclobber,
1039 so we must reverse the meaning of the cmdline options
1040 before passing the value to setoptval. */
1043 flag = (*optarg == '1' || c_tolower (*optarg) == 'y'
1044 || (c_tolower (optarg[0]) == 'o'
1045 && c_tolower (optarg[1]) == 'n'));
1046 setoptval (opt->type == OPT__PARENT ? "noparent" : "noclobber",
1047 flag ? "0" : "1", opt->long_name);
1050 case OPT__DONT_REMOVE_LISTING:
1051 setoptval ("removelisting", "0", opt->long_name);
1058 nurl = argc - optind;
1060 /* All user options have now been processed, so it's now safe to do
1061 interoption dependency checks. */
1063 if (opt.reclevel == 0)
1064 opt.reclevel = INFINITE_RECURSION; /* see recur.h for commentary */
1066 if (opt.spider || opt.delete_after)
1067 opt.no_dirstruct = true;
1069 if (opt.page_requisites && !opt.recursive)
1071 /* Don't set opt.recursive here because it would confuse the FTP
1072 code. Instead, call retrieve_tree below when either
1073 page_requisites or recursive is requested. */
1075 if (!opt.no_dirstruct)
1076 opt.dirstruct = 1; /* normally handled by cmd_spec_recursive() */
1079 if (opt.verbose == -1)
1080 opt.verbose = !opt.quiet;
1082 /* Sanity checks. */
1083 if (opt.verbose && opt.quiet)
1085 fprintf (stderr, _("Can't be verbose and quiet at the same time.\n"));
1089 if (opt.timestamping && opt.noclobber)
1091 fprintf (stderr, _("\
1092 Can't timestamp and not clobber old files at the same time.\n"));
1097 if (opt.ipv4_only && opt.ipv6_only)
1100 _("Cannot specify both --inet4-only and --inet6-only.\n"));
1105 if (opt.output_document)
1107 if (opt.convert_links
1108 && (nurl > 1 || opt.page_requisites || opt.recursive))
1111 Cannot specify both -k and -O if multiple URLs are given, or in combination\n\
1112 with -p or -r. See the manual for details.\n\n"), stderr);
1116 if (opt.page_requisites
1119 logprintf (LOG_NOTQUIET, "%s", _("\
1120 WARNING: combining -O with -r or -p will mean that all downloaded content\n\
1121 will be placed in the single file you specified.\n\n"));
1123 if (opt.timestamping)
1125 logprintf (LOG_NOTQUIET, "%s", _("\
1126 WARNING: timestamping does nothing in combination with -O. See the manual\n\
1127 for details.\n\n"));
1128 opt.timestamping = false;
1130 if (opt.noclobber && file_exists_p(opt.output_document))
1132 /* Check if output file exists; if it does, exit. */
1133 logprintf (LOG_VERBOSE,
1134 _("File `%s' already there; not retrieving.\n"),
1135 opt.output_document);
1140 if (opt.ask_passwd && opt.passwd)
1143 _("Cannot specify both --ask-password and --password.\n"));
1148 if (!nurl && !opt.input_filename)
1150 /* No URL specified. */
1151 fprintf (stderr, _("%s: missing URL\n"), exec_name);
1154 /* #### Something nicer should be printed here -- similar to the
1155 pre-1.5 `--help' page. */
1156 fprintf (stderr, _("Try `%s --help' for more options.\n"), exec_name);
1163 if (opt.locale && !check_encoding_name (opt.locale))
1167 opt.locale = find_locale ();
1169 if (opt.encoding_remote && !check_encoding_name (opt.encoding_remote))
1170 opt.encoding_remote = NULL;
1173 if (opt.enable_iri || opt.locale || opt.encoding_remote)
1175 /* sXXXav : be more specific... */
1176 fprintf (stderr, _("This version does not have support for IRIs\n"));
1183 opt.passwd = prompt_for_password ();
1185 if (opt.passwd == NULL || opt.passwd[0] == '\0')
1195 fork_to_background ();
1198 /* Initialize progress. Have to do this after the options are
1199 processed so we know where the log file is. */
1201 set_progress_implementation (opt.progress_type);
1203 /* Fill in the arguments. */
1204 url = alloca_array (char *, nurl + 1);
1205 for (i = 0; i < nurl; i++, optind++)
1207 char *rewritten = rewrite_shorthand_url (argv[optind]);
1211 url[i] = xstrdup (argv[optind]);
1215 /* Initialize logging. */
1216 log_init (opt.lfilename, append_to_log);
1218 DEBUGP (("DEBUG output created by Wget %s on %s.\n\n",
1219 version_string, OS_TYPE));
1221 /* Open the output filename if necessary. */
1224 Note that having the output_stream ("-O") file opened here for an FTP
1225 URL rather than in getftp() (ftp.c) (and the http equivalent) rather
1226 limits the ability in VMS to open the file differently for ASCII
1227 versus binary FTP there. (Of course, doing it here allows an open
1228 failure to be detected immediately, without first connecting to the
1231 if (opt.output_document)
1233 if (HYPHENP (opt.output_document))
1237 result = freopen ("CONOUT$", "wb", stdout);
1240 logputs (LOG_NOTQUIET, _("\
1241 WARNING: Can't reopen standard output in binary mode;\n\
1242 downloaded file may contain inappropriate line endings.\n"));
1245 output_stream = stdout;
1252 /* Common fopen() optional arguments:
1253 sequential access only, access callback function.
1255 # define FOPEN_OPT_ARGS , "fop=sqo", "acc", acc_cb, &open_id
1257 #else /* def __VMS */
1258 # define FOPEN_OPT_ARGS
1259 #endif /* def __VMS [else] */
1261 output_stream = fopen (opt.output_document,
1262 opt.always_rest ? "ab" : "wb"
1264 if (output_stream == NULL)
1266 perror (opt.output_document);
1269 if (fstat (fileno (output_stream), &st) == 0 && S_ISREG (st.st_mode))
1270 output_stream_regular = true;
1272 if (!output_stream_regular && opt.convert_links)
1274 fprintf (stderr, _("-k can be used together with -O only if \
1275 outputting to a regular file.\n"));
1282 /* Set global ODS5 flag according to the specified destination (if
1283 any), otherwise according to the current default device.
1285 if (output_stream == NULL)
1286 set_ods5_dest( "SYS$DISK");
1287 else if (output_stream != stdout)
1288 set_ods5_dest( opt.output_document);
1289 #endif /* def __VMS */
1296 /* Set up the signal handler to redirect output when hangup is
1298 if (signal(SIGHUP, SIG_IGN) != SIG_IGN)
1299 signal(SIGHUP, redirect_output_signal);
1301 /* ...and do the same for SIGUSR1. */
1303 signal (SIGUSR1, redirect_output_signal);
1306 /* Writing to a closed socket normally signals SIGPIPE, and the
1307 process exits. What we want is to ignore SIGPIPE and just check
1308 for the return value of write(). */
1309 signal (SIGPIPE, SIG_IGN);
1312 signal (SIGWINCH, progress_handle_sigwinch);
1315 /* Retrieve the URLs from argument list. */
1316 for (t = url; *t; t++)
1318 char *filename = NULL, *redirected_URL = NULL;
1320 /* Need to do a new struct iri every time, because
1321 * retrieve_url may modify it in some circumstances,
1323 struct iri *iri = iri_new ();
1324 struct url *url_parsed;
1326 set_uri_encoding (iri, opt.locale, true);
1327 url_parsed = url_parse (*t, &url_err, iri, true);
1331 char *error = url_error (*t, url_err);
1332 logprintf (LOG_NOTQUIET, "%s: %s.\n",*t, error);
1337 if ((opt.recursive || opt.page_requisites)
1338 && (url_scheme (*t) != SCHEME_FTP || url_uses_proxy (url_parsed)))
1340 int old_follow_ftp = opt.follow_ftp;
1342 /* Turn opt.follow_ftp on in case of recursive FTP retrieval */
1343 if (url_scheme (*t) == SCHEME_FTP)
1346 retrieve_tree (url_parsed, NULL);
1348 opt.follow_ftp = old_follow_ftp;
1352 retrieve_url (url_parsed, *t, &filename, &redirected_URL, NULL,
1353 &dt, opt.recursive, iri, true);
1356 if (opt.delete_after && file_exists_p(filename))
1358 DEBUGP (("Removing file due to --delete-after in main():\n"));
1359 logprintf (LOG_VERBOSE, _("Removing %s.\n"), filename);
1360 if (unlink (filename))
1361 logprintf (LOG_NOTQUIET, "unlink: %s\n", strerror (errno));
1363 xfree_null (redirected_URL);
1364 xfree_null (filename);
1365 url_free (url_parsed);
1370 /* And then from the input file, if any. */
1371 if (opt.input_filename)
1374 retrieve_from_file (opt.input_filename, opt.force_html, &count);
1376 logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"),
1377 opt.input_filename);
1380 /* Print broken links. */
1381 if (opt.recursive && opt.spider)
1382 print_broken_links ();
1384 /* Print the downloaded sum. */
1385 if ((opt.recursive || opt.page_requisites
1387 || (opt.input_filename && total_downloaded_bytes != 0))
1389 total_downloaded_bytes != 0)
1391 double end_time = ptimer_measure (timer);
1392 ptimer_destroy (timer);
1394 char *wall_time = xstrdup (secs_to_human_time (end_time - start_time));
1395 char *download_time = xstrdup (secs_to_human_time (total_download_time));
1396 logprintf (LOG_NOTQUIET,
1397 _("FINISHED --%s--\nTotal wall clock time: %s\n"
1398 "Downloaded: %d files, %s in %s (%s)\n"),
1399 datetime_str (time (NULL)),
1402 human_readable (total_downloaded_bytes),
1404 retr_rate (total_downloaded_bytes, total_download_time));
1406 xfree (download_time);
1408 /* Print quota warning, if exceeded. */
1409 if (opt.quota && total_downloaded_bytes > opt.quota)
1410 logprintf (LOG_NOTQUIET,
1411 _("Download quota of %s EXCEEDED!\n"),
1412 human_readable (opt.quota));
1415 if (opt.cookies_output)
1418 if (opt.convert_links && !opt.delete_after)
1419 convert_all_links ();
1422 for (i = 0; i < nurl; i++)
1426 return get_exit_status ();
1428 #endif /* TESTING */
1430 #if defined(SIGHUP) || defined(SIGUSR1)
1432 /* So the signal_name check doesn't blow up when only one is available. */
1440 /* Hangup signal handler. When wget receives SIGHUP or SIGUSR1, it
1441 will continue operating as usual, trying to write its output into a log
1442 file. If that is impossible, the output will be turned off. */
1445 redirect_output_signal (int sig)
1447 const char *signal_name = (sig == SIGHUP ? "SIGHUP" :
1448 (sig == SIGUSR1 ? "SIGUSR1" :
1450 log_request_redirect_output (signal_name);
1451 progress_schedule_redirect ();
1452 signal (sig, redirect_output_signal);