1 /* Command line parsing.
2 Copyright (C) 1995, 1996, 1997, 1998 Free Software Foundation, Inc.
4 This file is part of Wget.
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
27 #endif /* HAVE_UNISTD_H */
28 #include <sys/types.h>
33 #endif /* HAVE_STRING_H */
40 #endif /* HAVE_LOCALE_H */
43 #define OPTIONS_DEFINED_HERE /* for options.h */
53 #ifndef PATH_SEPARATOR
54 # define PATH_SEPARATOR '/'
57 extern char *version_string; /* printed by main() in the GNU Wget %s banner */
66 void log_init PARAMS ((const char *, int)); /* main() calls this with opt.lfilename and append_to_log */
67 void log_close PARAMS ((void));
68 void redirect_output PARAMS ((const char *)); /* called by redirect_output_signal() */
70 static RETSIGTYPE redirect_output_signal PARAMS ((int)); /* handler main() installs for SIGHUP and SIGUSR1 */
72 const char *exec_name; /* program name shown in messages; main() derives it from argv[0] */
74 /* Initialize I18N for Wget's messages. The initialization amounts to
75 invoking setlocale(), bindtextdomain() and textdomain().
76 Does nothing if NLS is disabled or missing. */
78 i18n_initialize (void)
80 /* If HAVE_NLS is defined, assume the existence of the three
81 functions invoked here. */
83 /* Set the current locale from the environment (empty locale name). */
84 /* Only LC_MESSAGES is set, rather than LC_ALL, for two reasons.
85 First, message catalogs are the only I18N feature Wget uses.
86 Second, setting LC_ALL risks changing the behavior of unrelated
87 library calls. For example, when in a foreign locale, Solaris
88 strptime() fails to handle international dates correctly, which
89 makes http_atotm() malfunction. */
90 setlocale (LC_MESSAGES, "");
91 /* Point the wget message domain at the catalogs under LOCALEDIR. */
92 bindtextdomain ("wget", LOCALEDIR);
97 /* Print a one-line usage synopsis, with exec_name as the program name. */
101 printf (_("Usage: %s [OPTION]... [URL]...\n"), exec_name);
104 /* Print the help message, describing all the available options. If
105 you add an option to long_options[] in main(), update this list too. */
109 printf (_("GNU Wget %s, a non-interactive network retriever.\n"),
112 /* The text is split into several separately translated strings because
113 the Ultrix compiler and cpp complain otherwise; it also eases translation. */
114 printf ("%s%s%s%s%s%s%s%s%s%s", _("\
116 Mandatory arguments to long options are mandatory for short options too.\n\
119 -V, --version display the version of Wget and exit.\n\
120 -h, --help print this help.\n\
121 -b, --background go to background after startup.\n\
122 -e, --execute=COMMAND execute a `.wgetrc\' command.\n\
124 Logging and input file:\n\
125 -o, --output-file=FILE log messages to FILE.\n\
126 -a, --append-output=FILE append messages to FILE.\n\
127 -d, --debug print debug output.\n\
128 -q, --quiet quiet (no output).\n\
129 -v, --verbose be verbose (this is the default).\n\
130 -nv, --non-verbose turn off verboseness, without being quiet.\n\
131 -i, --input-file=FILE read URL-s from file.\n\
132 -F, --force-html treat input file as HTML.\n\
135 -t, --tries=NUMBER set number of retries to NUMBER (0 unlimits).\n\
136 -O --output-document=FILE write documents to FILE.\n\
137 -nc, --no-clobber don\'t clobber existing files.\n\
138 -c, --continue restart getting an existing file.\n\
139 --dot-style=STYLE set retrieval display style.\n\
140 -N, --timestamping don\'t retrieve files if older than local.\n\
141 -S, --server-response print server response.\n\
142 --spider don\'t download anything.\n\
143 -T, --timeout=SECONDS set the read timeout to SECONDS.\n\
144 -w, --wait=SECONDS wait SECONDS between retrievals.\n\
145 --waitretry=SECONDS wait 0..max SECONDS between retries of a retrieval.\n\
146 -Y, --proxy=on/off turn proxy on or off.\n\
147 -Q, --quota=NUMBER set retrieval quota to NUMBER.\n\
150 -nd --no-directories don\'t create directories.\n\
151 -x, --force-directories force creation of directories.\n\
152 -nH, --no-host-directories don\'t create host directories.\n\
153 -P, --directory-prefix=PREFIX save files to PREFIX/...\n\
154 --cut-dirs=NUMBER ignore NUMBER remote directory components.\n\
157 --http-user=USER set http user to USER.\n\
158 --http-passwd=PASS set http password to PASS.\n\
159 -C, --cache=on/off (dis)allow server-cached data (normally allowed).\n\
160 --ignore-length ignore `Content-Length\' header field.\n\
161 --header=STRING insert STRING among the headers.\n\
162 --proxy-user=USER set USER as proxy username.\n\
163 --proxy-passwd=PASS set PASS as proxy password.\n\
164 -s, --save-headers save the HTTP headers to file.\n\
165 -U, --user-agent=AGENT identify as AGENT instead of Wget/VERSION.\n\
168 --retr-symlinks retrieve FTP symbolic links.\n\
169 -g, --glob=on/off turn file name globbing on or off.\n\
170 --passive-ftp use the \"passive\" transfer mode.\n\
172 Recursive retrieval:\n\
173 -r, --recursive recursive web-suck -- use with care!.\n\
174 -l, --level=NUMBER maximum recursion depth (0 to unlimit).\n\
175 --delete-after delete downloaded files.\n\
176 -k, --convert-links convert non-relative links to relative.\n\
177 -K, --backup-converted before converting file X, back up as X.orig.\n\
178 -m, --mirror turn on options suitable for mirroring.\n\
179 -nr, --dont-remove-listing don\'t remove `.listing\' files.\n\
181 Recursive accept/reject:\n\
182 -A, --accept=LIST list of accepted extensions.\n\
183 -R, --reject=LIST list of rejected extensions.\n\
184 -D, --domains=LIST list of accepted domains.\n\
185 --exclude-domains=LIST comma-separated list of rejected domains.\n\
186 -L, --relative follow relative links only.\n\
187 --follow-ftp follow FTP links from HTML documents.\n\
188 -H, --span-hosts go to foreign hosts when recursive.\n\
189 -I, --include-directories=LIST list of allowed directories.\n\
190 -X, --exclude-directories=LIST list of excluded directories.\n\
191 -nh, --no-host-lookup don\'t DNS-lookup hosts.\n\
192 -np, --no-parent don\'t ascend to the parent directory.\n\
193 \n"), _("Mail bug reports and suggestions to <bug-wget@gnu.org>.\n"));
197 main (int argc, char *const *argv) /* Parse the command line, then retrieve each URL given. */
200 int i, c, nurl, status, append_to_log;
203 static struct option long_options[] = /* codes 1-24 and 129 are options with no letter in the getopt string */
205 { "background", no_argument, NULL, 'b' },
206 { "continue", no_argument, NULL, 'c' },
207 { "convert-links", no_argument, NULL, 'k' },
208 { "backup-converted", no_argument, NULL, 'K' },
209 { "debug", no_argument, NULL, 'd' },
210 { "dont-remove-listing", no_argument, NULL, 21 },
211 { "email-address", no_argument, NULL, 'E' }, /* undocumented (debug) */
212 { "follow-ftp", no_argument, NULL, 14 },
213 { "force-directories", no_argument, NULL, 'x' },
214 { "force-hier", no_argument, NULL, 'x' }, /* obsolete */
215 { "force-html", no_argument, NULL, 'F'},
216 { "help", no_argument, NULL, 'h' },
217 { "ignore-length", no_argument, NULL, 10 },
218 { "mirror", no_argument, NULL, 'm' },
219 { "no-clobber", no_argument, NULL, 13 },
220 { "no-directories", no_argument, NULL, 19 },
221 { "no-host-directories", no_argument, NULL, 20 },
222 { "no-host-lookup", no_argument, NULL, 22 },
223 { "no-parent", no_argument, NULL, 5 },
224 { "non-verbose", no_argument, NULL, 18 },
225 { "passive-ftp", no_argument, NULL, 11 },
226 { "quiet", no_argument, NULL, 'q' },
227 { "recursive", no_argument, NULL, 'r' },
228 { "relative", no_argument, NULL, 'L' },
229 { "retr-symlinks", no_argument, NULL, 9 },
230 { "save-headers", no_argument, NULL, 's' },
231 { "server-response", no_argument, NULL, 'S' },
232 { "span-hosts", no_argument, NULL, 'H' },
233 { "spider", no_argument, NULL, 4 },
234 { "timestamping", no_argument, NULL, 'N' },
235 { "verbose", no_argument, NULL, 'v' },
236 { "version", no_argument, NULL, 'V' },
238 { "accept", required_argument, NULL, 'A' },
239 { "append-output", required_argument, NULL, 'a' },
240 { "backups", required_argument, NULL, 23 }, /* undocumented */
241 { "base", required_argument, NULL, 'B' },
242 { "cache", required_argument, NULL, 'C' },
243 { "cut-dirs", required_argument, NULL, 17 },
244 { "delete-after", no_argument, NULL, 8 },
245 { "directory-prefix", required_argument, NULL, 'P' },
246 { "domains", required_argument, NULL, 'D' },
247 { "dot-style", required_argument, NULL, 6 },
248 { "execute", required_argument, NULL, 'e' },
249 { "exclude-directories", required_argument, NULL, 'X' },
250 { "exclude-domains", required_argument, NULL, 12 },
251 { "glob", required_argument, NULL, 'g' },
252 { "header", required_argument, NULL, 3 },
253 { "htmlify", required_argument, NULL, 7 },
254 { "http-passwd", required_argument, NULL, 2 },
255 { "http-user", required_argument, NULL, 1 },
256 { "include-directories", required_argument, NULL, 'I' },
257 { "input-file", required_argument, NULL, 'i' },
258 { "level", required_argument, NULL, 'l' },
259 { "no", required_argument, NULL, 'n' },
260 { "output-document", required_argument, NULL, 'O' },
261 { "output-file", required_argument, NULL, 'o' },
262 { "proxy", required_argument, NULL, 'Y' },
263 { "proxy-passwd", required_argument, NULL, 16 },
264 { "proxy-user", required_argument, NULL, 15 },
265 { "quota", required_argument, NULL, 'Q' },
266 { "reject", required_argument, NULL, 'R' },
267 { "timeout", required_argument, NULL, 'T' },
268 { "tries", required_argument, NULL, 't' },
269 { "user-agent", required_argument, NULL, 'U' },
270 { "referer", required_argument, NULL, 129 },
271 { "use-proxy", required_argument, NULL, 'Y' },
272 { "wait", required_argument, NULL, 'w' },
273 { "waitretry", required_argument, NULL, 24 },
281 /* Construct the name of the executable, without the directory part. */
282 exec_name = strrchr (argv[0], PATH_SEPARATOR);
289 windows_main_junk (&argc, (char **) argv, (char **) &exec_name);
294 while ((c = getopt_long (argc, argv, "\
295 hVqvdkKsxmNWrHSLcFbEY:g:T:U:O:l:n:i:o:a:t:D:A:R:P:B:e:Q:X:I:w:",
296 long_options, (int *)0)) != EOF) /* NOTE(review): the option string lacks C: though --cache maps to the letter C; confirm -C works. */
300 /* Options without arguments: */
302 setval ("spider", "on");
305 setval ("noparent", "on");
308 setval ("deleteafter", "on");
311 setval ("retrsymlinks", "on");
314 setval ("ignorelength", "on");
317 setval ("passiveftp", "on");
320 setval ("noclobber", "on");
323 setval ("followftp", "on");
326 setval ("cutdirs", optarg);
329 setval ("verbose", "off");
332 setval ("dirstruct", "off");
335 setval ("addhostdir", "off");
338 setval ("removelisting", "off");
341 setval ("simplehostcheck", "on");
344 setval ("background", "on");
347 setval ("continue", "on");
351 setval ("debug", "on");
352 #else /* not DEBUG */
353 fprintf (stderr, _("%s: debug support not compiled in.\n"),
355 #endif /* not DEBUG */
358 /* For debugging purposes. */
359 printf ("%s\n", ftp_getaddress ());
363 setval ("forcehtml", "on");
366 setval ("spanhosts", "on");
376 setval ("convertlinks", "on");
379 setval ("backupconverted", "on");
382 setval ("relativeonly", "on");
385 setval ("mirror", "on");
388 setval ("timestamping", "on");
391 setval ("serverresponse", "on");
394 setval ("saveheaders", "on");
397 setval ("quiet", "on");
400 setval ("recursive", "on");
403 printf ("GNU Wget %s\n\n", version_string);
405 Copyright (C) 1995, 1996, 1997, 1998 Free Software Foundation, Inc.\n\
406 This program is distributed in the hope that it will be useful,\n\
407 but WITHOUT ANY WARRANTY; without even the implied warranty of\n\
408 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\n\
409 GNU General Public License for more details.\n"));
410 printf (_("\nWritten by Hrvoje Niksic <hniksic@srce.hr>.\n"));
414 setval ("verbose", "on");
417 setval ("dirstruct", "on");
420 /* Options accepting an argument: */
422 setval ("httpuser", optarg);
425 setval ("httppasswd", optarg);
428 setval ("header", optarg);
431 setval ("dotstyle", optarg);
434 setval ("htmlify", optarg);
437 setval ("excludedomains", optarg);
440 setval ("proxyuser", optarg);
443 setval ("proxypasswd", optarg);
446 setval ("backups", optarg);
449 setval ("accept", optarg);
452 setval ("logfile", optarg);
456 setval ("base", optarg);
459 setval ("cache", optarg);
462 setval ("domains", optarg);
467 if (parse_line (optarg, &com, &val))
469 if (!setval (com, val))
474 fprintf (stderr, _("%s: %s: invalid command\n"), exec_name,
483 setval ("glob", optarg);
486 setval ("includedirectories", optarg);
489 setval ("input", optarg);
492 setval ("reclevel", optarg);
496 /* #### The -n? options are a hack: each letter after -n is handled in the loop below. */
499 for (p = optarg; *p; p++)
503 setval ("verbose", "off");
506 setval ("simplehostcheck", "on");
509 setval ("addhostdir", "off");
512 setval ("dirstruct", "off");
515 setval ("noclobber", "on");
518 setval ("removelisting", "off");
521 setval ("noparent", "on");
524 printf (_("%s: illegal option -- `-n%c'\n"), exec_name, *p);
527 printf (_("Try `%s --help\' for more options.\n"), exec_name);
533 setval ("outputdocument", optarg);
536 setval ("logfile", optarg);
539 setval ("dirprefix", optarg);
542 setval ("quota", optarg);
545 setval ("reject", optarg);
548 setval ("timeout", optarg);
551 setval ("tries", optarg);
554 setval ("useragent", optarg);
557 setval ("referer", optarg);
560 setval ("wait", optarg);
563 setval ("waitretry", optarg);
567 setval ("excludedirectories", optarg);
570 setval ("useproxy", optarg);
576 printf (_("Try `%s --help' for more options.\n"), exec_name);
581 if (opt.verbose == -1)
582 opt.verbose = !opt.quiet;
584 /* Retain compatibility with older scripts: if wait has been set but
585 waitretry has not, waitretry inherits the wait value. Comparing the two
586 values is not enough, since wait may be n>0 with waitretry explicitly 0.
587 NOTE(review): opt.wait is passed as-is, while nearly all other setval() calls here pass string literals or optarg; confirm its type. */
589 setval ("waitretry", opt.wait);
592 if (opt.verbose && opt.quiet)
594 printf (_("Can't be verbose and quiet at the same time.\n"));
598 if (opt.timestamping && opt.noclobber)
601 Can't timestamp and not clobber old files at the same time.\n"));
605 nurl = argc - optind;
606 if (!nurl && !opt.input_filename)
608 /* No URL specified. */
609 printf (_("%s: missing URL\n"), exec_name);
612 /* #### Something nicer should be printed here -- similar to the
613 pre-1.5 `--help' page. */
614 printf (_("Try `%s --help' for more options.\n"), exec_name);
619 fork_to_background ();
621 /* Allocate the URL array with one extra slot; the retrieval loop below stops at a null entry. */
622 url = ALLOCA_ARRAY (char *, nurl + 1);
623 /* Fill it with the non-option arguments, starting at optind. */
624 for (i = 0; i < nurl; i++, optind++)
626 char *irix4_cc_needs_this;
627 STRDUP_ALLOCA (irix4_cc_needs_this, argv[optind]);
628 url[i] = irix4_cc_needs_this;
632 /* Change the title of console window on Windows. #### I think this
633 statement should belong to retrieve_url(). --hniksic. */
635 ws_changetitle (*url, nurl);
638 /* Initialize logging. */
639 log_init (opt.lfilename, append_to_log);
641 DEBUGP (("DEBUG output created by Wget %s on %s.\n\n", version_string,
643 /* Open the output filename if necessary. */
644 if (opt.output_document)
646 if (HYPHENP (opt.output_document))
650 opt.dfp = fopen (opt.output_document, "wb");
653 perror (opt.output_document);
663 /* Setup the signal handler to redirect output when hangup is
666 if (signal(SIGHUP, SIG_IGN) != SIG_IGN)
667 signal(SIGHUP, redirect_output_signal);
668 /* ...and do the same for SIGUSR1. */
669 signal (SIGUSR1, redirect_output_signal);
670 /* Writing to a closed socket normally signals SIGPIPE, and the
671 process exits. What we want is to ignore SIGPIPE and just check
672 for the return value of write(). */
673 signal (SIGPIPE, SIG_IGN);
674 #endif /* HAVE_SIGNAL */
676 status = RETROK; /* initialize it, just-in-case */
678 /* Retrieve the URLs from argument list. */
679 for (t = url; *t; t++)
681 char *filename, *new_file;
684 status = retrieve_url (*t, &filename, &new_file, NULL, &dt);
685 if (opt.recursive && status == RETROK && (dt & TEXTHTML))
686 status = recursive_retrieve (filename, new_file ? new_file : *t);
687 FREE_MAYBE (new_file);
688 FREE_MAYBE (filename);
691 /* And then from the input file, if any. */
692 if (opt.input_filename)
695 status = retrieve_from_file (opt.input_filename, opt.force_html, &count);
697 logprintf (LOG_NOTQUIET, _("No URLs found in %s.\n"),
700 /* Print the downloaded sum. */
703 || (opt.input_filename && opt.downloaded != 0))
705 logprintf (LOG_NOTQUIET,
706 _("\nFINISHED --%s--\nDownloaded: %s bytes in %d files\n"),
707 time_str (NULL), legible (opt.downloaded), opt.numurls);
708 /* Print quota warning, if exceeded. */
709 if (opt.quota && opt.downloaded > opt.quota)
710 logprintf (LOG_NOTQUIET,
711 _("Download quota (%s bytes) EXCEEDED!\n"),
712 legible (opt.quota));
714 if (opt.convert_links)
716 convert_all_links ();
720 if (status == RETROK)
726 /* Hangup signal handler. When Wget receives SIGHUP or SIGUSR1, it
727 carries on operating as usual, trying to write into a log file.
728 If that is impossible, the output will be turned off. */
732 redirect_output_signal (int sig)
735 signal (sig, redirect_output_signal); /* re-install this handler for the same signal */
736 /* Please note that the double `%' in `%%s' is intentional, because
737 redirect_output passes tmp through printf. NOTE(review): sprintf is unbounded and tmp is declared outside this view; confirm it can hold the translated text. */
738 sprintf (tmp, _("%s received, redirecting output to `%%s'.\n"),
739 (sig == SIGHUP ? "SIGHUP" :
740 (sig == SIGUSR1 ? "SIGUSR1" :
742 redirect_output (tmp);
744 #endif /* HAVE_SIGNAL */