sjero.net Git - wget/blobdiff - src/ChangeLog
[svn] New option --no-http-keep-alive.
[wget] / src / ChangeLog
index 9e0706cd29dcba065d0baccb10c55cbef8f46b22..71401675a3fc499ee8f69b00daacba7d115078d2 100644 (file)
@@ -1,3 +1,234 @@
+2000-11-20  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * http.c (gethttp): Don't use the return value of sprintf().
+       (gethttp): Inhibit keep-alive if opt.http_keep_alive is 0.
+
+2000-11-20  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * recur.c (recursive_retrieve): Print the "so we don't load"
+       debugging message only if we really don't load.
+
+       * http.c (gethttp): Inhibit keep-alive if proxy is being used.
+       (gethttp): Don't request keep-alive if keep-alive is inhibited.
+
+2000-11-19  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * http.c (gethttp): Make the HTTP persistent connections more
+       robust.
+
+2000-11-19  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * retr.c (get_contents): If use_expected, make sure that the
+       appropriate amount of data is being read.
+
+       * http.c (gethttp): Check for both `Keep-Alive: ...' and
+       `Connection: Keep-Alive'.
+
+       * wget.h (DEBUGP): Call debug_logprintf only if opt.debug is
+       turned on.
+
+2000-11-19  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * http.c (connection_available_p): Use it.
+
+       * connect.c (test_socket_open): New function.
+
+       * http.c (gethttp): Support persistent connections.  Based on the
+       ideas, and partly on code, by Sam Horrocks <sam@daemoninc.com>.
+       (register_persistent): New function.
+       (connection_available_p): Ditto.
+       (invalidate_connection): Ditto.
+
+2000-11-19  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (convert_links): Handle UREL2ABS case.
+
+       * recur.c (recursive_retrieve): Instead of the list
+       urls_downloaded, use hash tables dl_file_url_map and
+       dl_url_file_map.
+       (convert_all_links): Use them to retrieve data.
+
+       * host.c (clean_hosts): Free the hash tables.
+
+       * main.c (private_initialize): Call host_init().
+
+       * host.c (store_hostaddress): Use a saner, hash table-based data
+       model.
+       (realhost): Ditto.
+       (host_init): Initialize the hash tables.
+
+2000-11-18  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * utils.c (slist_append): Eviscerate NOSORT.  Hash tables are now
+       used for what the sorted slists used to be used for.
+       (slist_contains): Don't rely on the list being sorted.
+       (slist_append): Simplify the code.
+
+       * recur.c (recursive_cleanup): Use string_set_free.
+
+       * utils.c (string_set_add, string_set_exists, string_set_free):
+       New functions for easier freeing of hash tables whose keys are
+       strdup'ed strings.
+
+       * recur.c (recursive_retrieve): Use the hash table functions for
+       storing undesirable URLs.
+
+       * hash.c: New file.
+
+2000-11-17  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * main.c (private_initialize): Call url_init.
+       (main): Call private_initialize.
+
+       * url.c (unsafe_char_table): New table.
+       (UNSAFE_CHAR): Use it.
+       (init_unsafe_char_table): New function.
+       (url_init): New function; call init_unsafe_char_table.
+
+2000-11-15  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * html-url.c (handle_link): Handle HTML fragment identifiers.
+
+       * recur.c (recursive_retrieve): If norobot info is respected and
+       the file is specified not to be followed by robots, respect that.
+
+       * html-url.c (collect_tags_mapper): Handle <meta name=robots
+       content=X>.  For us the important cases are where X is NONE or
+       where X contains NOFOLLOW.
+       (get_urls_html): Propagate that information to the caller.
+
+2000-11-13  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (convert_links): Unlink the file we might be reading from
+       before writing to it.
+       (convert_links): Use alloca instead of malloc for
+       filename_plus_orig_suffix.
+
+2000-11-10  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (get_urls_file): Ditto.
+       (convert_links): Ditto.
+
+       * html-url.c (get_urls_html): Use read_file() instead of
+       load_file().
+
+       * utils.c (read_file): New function, instead of the old
+       load_file().
+       (read_file_free): Ditto.
+
+       * url.c (findurl): Search only for the supported protocols.
+       (convert_links): Use fwrite() when writing out a region of
+       characters.
+
+2000-11-10  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * ftp-ls.c: Move html_quote_string and ftp_index here.
+
+       * url.c: Remove get_urls_html, since that's now in html-url.c.
+
+       * html-url.c: New file.
+
+       * html-parse.c: New file.
+
+2000-11-16  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * mswindows.h: Define snprintf and vsnprintf to _snprintf and
+       _vsnprintf respectively.
+
+2000-11-15  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * config.h.in: Do the _XOPEN_SOURCE and _SVID_SOURCE things only
+       on Linux.
+
+2000-11-12  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * host.c (realhost): Add HOST to the list with quality==0 only if
+       it wasn't already there.
+       Based on analysis by Lu Guohan <feng@public.bjnet.edu.cn>.
+
+2000-11-10  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * init.c (run_wgetrc): Don't bother killing off '\r' since
+       parse_line() skips whitespace at end of line anyway.
+       (parse_line): Oops, it didn't.  Now it does.
+
+       * recur.c (parse_robots): Ditto here.
+
+       * ftp-ls.c (ftp_parse_unix_ls): Kill off the newline character
+       manually because read_whole_line no longer does.
+
+       * utils.c (read_whole_line): Rewrite to: a) use less memory
+       (reallocates to needed size after work), b) work faster -->
+       fgets() instead of getc, c) be more correct --> doesn't kill the
+       newline character at the end of line.
+
+2000-11-10  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * init.c (comind): Initialize MAX to array size - 1.
+
+2000-11-08  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (construct): Changed last_slash[-1] to *(last_slash - 1).
+       Suggested by Edward J. Sabol.
+
+2000-11-08  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (construct): Handle the case where host name is not
+       followed by a slash.
+
+2000-11-06  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * init.c: commands[] need to be sorted!  ("base" wasn't.)
+
+2000-11-05  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * wget.h (DO_REALLOC_FROM_ALLOCA): Use braces to disambiguate
+       `if'.
+
+2000-11-05  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (construct): Insert unneeded initialization for the
+       compiler to shut up.
+
+       * config.h.in: Define _XOPEN_SOURCE to 500 to get the prototype
+       for strptime() (*duh*).  Define _SVID_SOURCE to get S_IFLNK which
+       otherwise gets lost when you define _XOPEN_SOURCE.
+
+       * utils.c (touch): Include the file name in the error message.
+       From Debian.
+
+2000-11-05  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * log.c (logvprintf): Use vsnprintf() in all cases.  If necessary,
+       resize the buffer to fit the formatted message.  That way, messages
+       of arbitrary size may be printed.
+       (logvprintf): Use saved_append() to optionally log the last
+       several lines of output.
+       (logputs): Ditto.
+       (log_close): Adapt to new data structures.
+       (log_dump): Ditto.
+       (redirect_output): Print messages to stderr, not to stdout.
+
+       * log.c (saved_append_1): New function.  Replaces the old logging
+       system ("log all output until 10M characters") with a new, much
+       more reasonable one ("log last screenful of text").
+       (saved_append): New function; call saved_append_1.
+       (free_log_line): New function.
+
+2000-11-05  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * url.c (construct): Fix comment.
+       (find_last_char): Document.
+
+2000-11-04  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * snprintf.c: New file.
+
+2000-11-03  Hrvoje Niksic  <hniksic@arsdigita.com>
+
+       * wget.h: If HAVE_STDARG_H is not defined, don't declare argument
+       types to logprintf() and debug_logprintf().
+
 2000-11-02  Hrvoje Niksic  <hniksic@arsdigita.com>
 
        * ftp.c (ftp_loop_internal): Hide the password from the URL when