X-Git-Url: http://sjero.net/git/?a=blobdiff_plain;f=src%2Firi.c;h=ea4046afca4504e12257c009f1e473cc741d5702;hb=84395897ad2d1c107be470946daba744b2e7ebe8;hp=3ee99871273ad76c4d115c015bcb751653e93ec3;hpb=b967d49f79b6e0ce73559bd30d231bddc2e4b232;p=wget diff --git a/src/iri.c b/src/iri.c index 3ee99871..ea4046af 100644 --- a/src/iri.c +++ b/src/iri.c @@ -39,16 +39,12 @@ as that of the covered work. */ #include #include "utils.h" -#include "iri.h" /* RFC3987 section 3.1 mandates STD3 ASCII RULES */ #define IDNA_FLAGS IDNA_USE_STD3_ASCII_RULES /* Note: locale encoding is kept in options struct (opt.locale) */ -static iconv_t locale2utf8; - -static bool open_locale_to_utf8 (void); static bool do_conversion (iconv_t cd, char *in, size_t inlen, char **out); @@ -119,27 +115,7 @@ check_encoding_name (char *encoding) static bool open_locale_to_utf8 (void) { - if (locale2utf8) - return true; - - /* sXXXav : That shouldn't happen, just in case */ - if (!opt.locale) - { - logprintf (LOG_VERBOSE, "open_locale_to_utf8: locale is unset\n"); - opt.locale = find_locale (); - } - - if (!opt.locale) - return false; - - locale2utf8 = iconv_open ("UTF-8", opt.locale); - if (locale2utf8 != (iconv_t)(-1)) - return true; - logprintf (LOG_VERBOSE, "Conversion from %s to %s isn't supported\n", - quote (opt.locale), quote ("UTF-8")); - locale2utf8 = NULL; - return false; } /* Try converting string str from locale to UTF-8. 
Return a new string @@ -147,22 +123,35 @@ open_locale_to_utf8 (void) const char * locale_to_utf8 (const char *str) { + iconv_t l2u; char *new; - if (!strcasecmp (opt.locale, "utf-8")) - return str; + /* That shouldn't happen, just in case */ + if (!opt.locale) + { + logprintf (LOG_VERBOSE, "open_locale_to_utf8: locale is unset\n"); + opt.locale = find_locale (); + } - if (!open_locale_to_utf8 ()) + if (!opt.locale || !strcasecmp (opt.locale, "utf-8")) return str; - if (do_conversion (locale2utf8, (char *) str, strlen ((char *) str), &new)) + l2u = iconv_open ("UTF-8", opt.locale); + if (l2u == (iconv_t)(-1)) /* iconv_open reports failure as (iconv_t)(-1) */ + { + logprintf (LOG_VERBOSE, "Conversion from %s to %s isn't supported\n", + quote (opt.locale), quote ("UTF-8")); + return str; + } + + if (do_conversion (l2u, (char *) str, strlen ((char *) str), &new)) return (const char *) new; return str; } /* Do the conversion according to the passed conversion descriptor cd. *out - will containes the transcoded string on success. *out content is + will contain the transcoded string on success. *out content is unspecified otherwise. 
*/ static bool do_conversion (iconv_t cd, char *in, size_t inlen, char **out) @@ -236,11 +225,7 @@ idn_encode (struct iri *i, char *host) if (!i->utf8_encode) { if (!remote_to_utf8 (i, (const char *) host, (const char **) &new)) - { - /* Nothing to encode or an error occured */ - return NULL; - } - + return NULL; /* Nothing to encode or an error occurred */ host = new; } @@ -281,18 +266,13 @@ idn_decode (char *host) bool remote_to_utf8 (struct iri *i, const char *str, const char **new) { - char *r; iconv_t cd; bool ret = false; - if (opt.encoding_remote) - r = opt.encoding_remote; - else if (i->uri_encoding) - r = i->uri_encoding; - else + if (!i->uri_encoding) return false; - cd = iconv_open ("UTF-8", r); + cd = iconv_open ("UTF-8", i->uri_encoding); if (cd == (iconv_t)(-1)) return false; @@ -311,6 +291,7 @@ remote_to_utf8 (struct iri *i, const char *str, const char **new) return ret; } +/* Allocate a new iri structure and return a pointer to it. */ struct iri * iri_new (void) { @@ -318,8 +299,10 @@ iri_new (void) i->uri_encoding = opt.encoding_remote ? xstrdup (opt.encoding_remote) : NULL; i->content_encoding = NULL; i->utf8_encode = opt.enable_iri; + return i; } +/* Completely free an iri structure. */ void iri_free (struct iri *i) { @@ -328,15 +311,17 @@ iri_free (struct iri *i) xfree (i); } +/* Set uri_encoding of struct iri i. If a remote encoding was specified, use + it unless force is true. */ void set_uri_encoding (struct iri *i, char *charset, bool force) { - DEBUGP (("[IRI uri = `%s'\n", quote (charset))); + DEBUGP (("URI encoding = `%s'\n", charset ? quote (charset) : "None")); if (!force && opt.encoding_remote) return; if (i->uri_encoding) { - if (!strcasecmp (i->uri_encoding, charset)) + if (charset && !strcasecmp (i->uri_encoding, charset)) return; xfree (i->uri_encoding); } @@ -344,15 +329,16 @@ set_uri_encoding (struct iri *i, char *charset, bool force) i->uri_encoding = charset ? xstrdup (charset) : NULL; } +/* Set content_encoding of struct iri i. 
*/ void set_content_encoding (struct iri *i, char *charset) { - DEBUGP (("[IRI content = %s\n", quote (charset))); + DEBUGP (("URI content encoding = %s\n", charset ? quote (charset) : "None")); if (opt.encoding_remote) return; if (i->content_encoding) { - if (!strcasecmp (i->content_encoding, charset)) + if (charset && !strcasecmp (i->content_encoding, charset)) return; xfree (i->content_encoding); }