X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Fretr.c;h=f1b8f955a36f3f2361f7142b1366fd78aaba72c5;hp=8752dce71510d3ef3819bdbbb4ba7a0906aa1c4a;hb=b014f8fae9291e7504c0cca2dd8b9a0035466c03;hpb=a9da78c6d8f9e2699107fcde81efeb607dde1cca diff --git a/src/retr.c b/src/retr.c index 8752dce7..f1b8f955 100644 --- a/src/retr.c +++ b/src/retr.c @@ -39,6 +39,7 @@ as that of the covered work. */ #include #include +#include "exits.h" #include "utils.h" #include "retr.h" #include "progress.h" @@ -168,7 +169,18 @@ write_data (FILE *out, const char *buf, int bufsize, wgint *skip, performance: fast downloads will arrive in large 16K chunks (which stdio would write out immediately anyway), and slow downloads wouldn't be limited by disk speed. */ + + /* 2005-04-20 SMS. + Perhaps it shouldn't hinder performance, but it sure does, at least + on VMS (more than 2X). Rather than speculate on what it should or + shouldn't do, it might make more sense to test it. Even better, it + might be nice to explain what possible benefit it could offer, as + it appears to be a clear invitation to poor performance with no + actual justification. (Also, why 16K? Anyone test other values?) + */ +#ifndef __VMS fflush (out); +#endif /* ndef __VMS */ return !ferror (out); } @@ -600,11 +612,12 @@ static char *getproxy (struct url *); uerr_t retrieve_url (struct url * orig_parsed, const char *origurl, char **file, char **newloc, const char *refurl, int *dt, bool recursive, - struct iri *iri) + struct iri *iri, bool register_status) { uerr_t result; char *url; bool location_changed; + bool iri_fallbacked = 0; int dummy; char *mynewloc, *proxy; struct url *u = orig_parsed, *proxy_url; @@ -628,15 +641,11 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, if (file) *file = NULL; - second_try: - DEBUGP (("[IRI Retrieving %s with %s (UTF-8=%d)\n", quote_n (0, url), - iri->uri_encoding ? quote_n (1, iri->uri_encoding) : "None", - iri->utf8_encode)); - if (!refurl) refurl = opt.referer; redirected: + /* (also for IRI fallbacking) */ result = NOCONERROR; mynewloc = NULL; @@ -660,7 +669,8 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, xfree (url); xfree (error); RESTORE_POST_DATA; - return PROXERR; + result = PROXERR; + goto bail; } if (proxy_url->scheme != SCHEME_HTTP && proxy_url->scheme != u->scheme) { @@ -668,7 +678,8 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, url_free (proxy_url); xfree (url); RESTORE_POST_DATA; - return PROXERR; + result = PROXERR; + goto bail; } } @@ -749,7 +760,7 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, xfree (mynewloc); xfree (error); RESTORE_POST_DATA; - return result; + goto bail; } /* Now mynewloc will become newloc_parsed->url, because if the @@ -771,7 +782,8 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, xfree (url); xfree (mynewloc); RESTORE_POST_DATA; - return WRONGCODE; + result = WRONGCODE; + goto bail; } xfree (url); @@ -805,7 +817,9 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, if (u) { DEBUGP (("[IRI fallbacking to non-utf8 for %s\n", quote (url))); - goto second_try; + url = xstrdup (u->url); + iri_fallbacked = 1; + goto redirected; } else DEBUGP (("[Couldn't fallback to non-utf8 for %s\n", quote (url))); @@ -840,7 +854,7 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, url_free (u); } - if (redirection_count) + if (redirection_count || iri_fallbacked) { if (newloc) *newloc = url; @@ -856,6 +870,9 @@ retrieve_url (struct url * orig_parsed, const char *origurl, char **file, RESTORE_POST_DATA; +bail: + if (register_status) + inform_exit_status (result); return result; } @@ -900,7 +917,7 @@ retrieve_from_file (const char *file, bool html, int *count) opt.base_href = xstrdup (url); status = retrieve_url (url_parsed, url, &input_file, NULL, NULL, &dt, - false, iri); + false, iri, true); if (status != RETROK) return status; @@ -960,7 +977,8 @@ retrieve_from_file (const char *file, bool html, int *count) else status = retrieve_url (parsed_url ? parsed_url : cur_url->url, cur_url->url->url, &filename, - &new_file, NULL, &dt, opt.recursive, tmpiri); + &new_file, NULL, &dt, opt.recursive, tmpiri, + true); if (parsed_url) url_free (parsed_url);