X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Fhtml-url.c;h=59d873b394e6443cbaacad970399fbf6b67596f3;hp=89b93539d65f926c26997b76bec953fb26faecce;hb=3f84a5e00e255ab46e69d8ff5e565b238fce4126;hpb=1b2dce0493a5695ec1bff8ea9e11a7adc79cff1a diff --git a/src/html-url.c b/src/html-url.c index 89b93539..59d873b3 100644 --- a/src/html-url.c +++ b/src/html-url.c @@ -612,9 +612,12 @@ get_urls_html (const char *file, const char *url, int *meta_disallow_follow) init_interesting (); /* Specify MHT_TRIM_VALUES because of buggy HTML generators that - generate <a href=" foo"> instead of <a href="foo"> (Netscape - ignores spaces as well.) If you really mean space, use &32; or - %20. */ + generate <a href=" foo"> instead of <a href="foo"> (browsers + ignore spaces as well.) If you really mean space, use &32; or + %20. MHT_TRIM_VALUES also causes squashing of embedded newlines, + e.g. in <img src="foo.[newline]html">. Such newlines are also + ignored by IE and Mozilla and are presumably introduced by + writing HTML with editors that force word wrap. */ flags = MHT_TRIM_VALUES; if (opt.strict_comments) flags |= MHT_STRICT_COMMENTS;