X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Firi.c;h=dcab3ea1533fc2ea9e9d3429a134a9b9471060ee;hp=067291c7cf5c33dedacccf32e33147047016070e;hb=HEAD;hpb=260b9593dc03da095df30efc3eed251a231d09a9 diff --git a/src/iri.c b/src/iri.c index 067291c7..dcab3ea1 100644 --- a/src/iri.c +++ b/src/iri.c @@ -1,5 +1,5 @@ /* IRI related functions. - Copyright (C) 2008, 2009, 2010 Free Software Foundation, Inc. + Copyright (C) 2008, 2009, 2010, 2011 Free Software Foundation, Inc. This file is part of GNU Wget. @@ -256,15 +256,30 @@ idn_decode (char *host) /* Try to transcode string str from remote encoding to UTF-8. On success, *new contains the transcoded string. *new content is unspecified otherwise. */ bool -remote_to_utf8 (struct iri *i, const char *str, const char **new) +remote_to_utf8 (struct iri *iri, const char *str, const char **new) { iconv_t cd; bool ret = false; - if (!i->uri_encoding) + if (!iri->uri_encoding) return false; - cd = iconv_open ("UTF-8", i->uri_encoding); + /* When `i->uri_encoding' == "UTF-8" there is nothing to convert. But we must + test for non-ASCII symbols for correct hostname processing in `idn_encode' + function. */ + if (!strcmp (iri->uri_encoding, "UTF-8")) + { + const char *p = str; + for (p = str; *p; p++) + if (*p < 0) + { + *new = strdup (str); + return true; + } + return false; + } + + cd = iconv_open ("UTF-8", iri->uri_encoding); if (cd == (iconv_t)(-1)) return false;