X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Fcmpt.c;h=4bd582c85dff8342106f552e2af008d0c4d8949d;hp=84cdbc24b16ca376b1329e6a6e7c2b92ee9ff046;hb=4d7c5e087b2bc82c9f503dff003916d1047903ce;hpb=6af41f62f0e1d8f1d7c67b472e95c17c282e2900 diff --git a/src/cmpt.c b/src/cmpt.c index 84cdbc24..4bd582c8 100644 --- a/src/cmpt.c +++ b/src/cmpt.c @@ -1,11 +1,11 @@ /* Replacements for routines missing on some systems. - Copyright (C) 1995-2005 Free Software Foundation, Inc. + Copyright (C) 1996-2006 Free Software Foundation, Inc. This file is part of GNU Wget. GNU Wget is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by -the Free Software Foundation; either version 2 of the License, or +the Free Software Foundation; either version 3 of the License, or (at your option) any later version. GNU Wget is distributed in the hope that it will be useful, @@ -14,8 +14,7 @@ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License -along with Wget; if not, write to the Free Software -Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. +along with Wget. If not, see . In addition, as a special exception, the Free Software Foundation gives permission to link the code of its release of Wget with the @@ -32,6 +31,7 @@ so, delete this exception statement from your version. */ #include #include #include +#include #ifdef HAVE_UNISTD_H # include @@ -42,18 +42,18 @@ so, delete this exception statement from your version. */ #include "wget.h" /* Some systems lack certain functions normally taken for granted. - For example, Windows doesn't have strptime, and some systems lack - strcasecmp and strncasecmp. This file should contain fallback - implementations of the missing functions. It should *not* define - new Wget-specific functions -- those should placed in utils.c or - elsewhere. */ + For example, Windows doesn't have strptime, and some systems don't + have a usable fnmatch. This file should contain fallback + implementations of such missing functions. It should *not* define + new Wget-specific interfaces -- those should be placed in utils.c + or elsewhere. */ /* strcasecmp and strncasecmp apparently originated with BSD 4.4. SUSv3 seems to be the only standard out there (that I can find) - that requires their existence, so there are systems that lack them - still in use. Note that these don't get defined under Windows - because mswindows.h defines them to the equivalent Windows - functions stricmp and strnicmp. */ + that requires their existence, so in theory there might be systems + still in use that lack them. Note that these don't get defined + under Windows because mswindows.h defines them to the equivalent + Windows functions stricmp and strnicmp. */ #ifndef HAVE_STRCASECMP /* From GNU libc. */ @@ -110,310 +110,28 @@ strncasecmp (const char *s1, const char *s2, size_t n) return c1 - c2; } #endif /* not HAVE_STRNCASECMP */ - -/* strpbrk is a BSD 4.3 function mandated by POSIX and C99 and present - on Windows. It might be missing from older Unixes of non-BSD - ancestry or possibly from non-Unix systems Wget gets ported to, so - we add it here. */ - -#ifndef HAVE_STRPBRK -/* Find the first ocurrence in S of any character in ACCEPT. */ -char * -strpbrk (const char *s, const char *accept) -{ - while (*s != '\0') - { - const char *a = accept; - while (*a != '\0') - if (*a++ == *s) - return (char *) s; - ++s; - } - - return 0; -} -#endif /* HAVE_STRPBRK */ - -/* mktime is a BSD 4.3 function also required by POSIX and C99. I - don't know if there is a widely used system that lacks it, so it - might be a candidate for removal. */ - -#ifndef HAVE_MKTIME -/* From GNU libc 2.0. */ - -/* Copyright (C) 1993, 1994, 1995, 1996, 1997 Free Software Foundation, Inc. - This file is part of the GNU C Library. - Contributed by Paul Eggert (eggert@twinsun.com). */ - -#ifdef _LIBC -# define HAVE_LIMITS_H 1 -# define HAVE_LOCALTIME_R 1 -# define STDC_HEADERS 1 -#endif - -/* Assume that leap seconds are possible, unless told otherwise. - If the host has a `zic' command with a `-L leapsecondfilename' option, - then it supports leap seconds; otherwise it probably doesn't. */ -#ifndef LEAP_SECONDS_POSSIBLE -# define LEAP_SECONDS_POSSIBLE 1 -#endif - -#ifndef __P -# define __P(args) args -#endif /* Not __P. */ - -#ifndef CHAR_BIT -# define CHAR_BIT 8 -#endif - -#ifndef INT_MIN -# define INT_MIN (~0 << (sizeof (int) * CHAR_BIT - 1)) -#endif -#ifndef INT_MAX -# define INT_MAX (~0 - INT_MIN) -#endif - -#ifndef TIME_T_MIN -/* The outer cast to time_t works around a bug in Cray C 5.0.3.0. */ -# define TIME_T_MIN ((time_t) \ - (0 < (time_t) -1 ? (time_t) 0 \ - : ~ (time_t) 0 << (sizeof (time_t) * CHAR_BIT - 1))) -#endif -#ifndef TIME_T_MAX -# define TIME_T_MAX (~ (time_t) 0 - TIME_T_MIN) -#endif - -#define TM_YEAR_BASE 1900 -#define EPOCH_YEAR 1970 - -#ifndef __isleap -/* Nonzero if YEAR is a leap year (every 4 years, - except every 100th isn't, and every 400th is). */ -# define __isleap(year) \ - ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) -#endif - -/* How many days come before each month (0-12). */ -/* __mon_yday[][] is common to mktime and strptime implementations. - --abbotti */ -const unsigned short int __mon_yday[2][13]; -#ifndef NEED_MON_YDAY -# define NEED_MON_YDAY -#endif -static time_t ydhms_tm_diff __P ((int, int, int, int, int, const struct tm *)); -time_t __mktime_internal __P ((struct tm *, - struct tm *(*) (const time_t *, struct tm *), - time_t *)); +#ifndef HAVE_MEMRCHR +/* memrchr is a GNU extension. It is like the memchr function, except + that it searches backwards from the end of the n bytes pointed to + by s instead of forwards from the front. */ - -#ifdef _LIBC -# define localtime_r __localtime_r -#else -# if ! HAVE_LOCALTIME_R && ! defined localtime_r -/* Approximate localtime_r as best we can in its absence. */ -# define localtime_r my_mktime_localtime_r -static struct tm *localtime_r __P ((const time_t *, struct tm *)); -static struct tm * -localtime_r (t, tp) - const time_t *t; - struct tm *tp; -{ - struct tm *l = localtime (t); - if (! l) - return 0; - *tp = *l; - return tp; -} -# endif /* ! HAVE_LOCALTIME_R && ! defined (localtime_r) */ -#endif /* ! _LIBC */ - - -/* Yield the difference between (YEAR-YDAY HOUR:MIN:SEC) and (*TP), - measured in seconds, ignoring leap seconds. - YEAR uses the same numbering as TM->tm_year. - All values are in range, except possibly YEAR. - If overflow occurs, yield the low order bits of the correct answer. */ -static time_t -ydhms_tm_diff (year, yday, hour, min, sec, tp) - int year, yday, hour, min, sec; - const struct tm *tp; -{ - /* Compute intervening leap days correctly even if year is negative. - Take care to avoid int overflow. time_t overflow is OK, since - only the low order bits of the correct time_t answer are needed. - Don't convert to time_t until after all divisions are done, since - time_t might be unsigned. */ - int a4 = (year >> 2) + (TM_YEAR_BASE >> 2) - ! (year & 3); - int b4 = (tp->tm_year >> 2) + (TM_YEAR_BASE >> 2) - ! (tp->tm_year & 3); - int a100 = a4 / 25 - (a4 % 25 < 0); - int b100 = b4 / 25 - (b4 % 25 < 0); - int a400 = a100 >> 2; - int b400 = b100 >> 2; - int intervening_leap_days = (a4 - b4) - (a100 - b100) + (a400 - b400); - time_t years = year - (time_t) tp->tm_year; - time_t days = (365 * years + intervening_leap_days - + (yday - tp->tm_yday)); - return (60 * (60 * (24 * days + (hour - tp->tm_hour)) - + (min - tp->tm_min)) - + (sec - tp->tm_sec)); -} - - -static time_t localtime_offset; - -/* Convert *TP to a time_t value. */ -time_t -mktime (tp) - struct tm *tp; +void * +memrchr (const void *s, int c, size_t n) { -#ifdef _LIBC - /* POSIX.1 8.1.1 requires that whenever mktime() is called, the - time zone names contained in the external variable `tzname' shall - be set as if the tzset() function had been called. */ - __tzset (); -#endif - - return __mktime_internal (tp, localtime_r, &localtime_offset); + const char *b = s; + const char *e = b + n; + while (e > b) + if (*--e == c) + return (void *) e; + return NULL; } - -/* Convert *TP to a time_t value, inverting - the monotonic and mostly-unit-linear conversion function CONVERT. - Use *OFFSET to keep track of a guess at the offset of the result, - compared to what the result would be for UTC without leap seconds. - If *OFFSET's guess is correct, only one CONVERT call is needed. */ -time_t -__mktime_internal (tp, convert, offset) - struct tm *tp; - struct tm *(*convert) __P ((const time_t *, struct tm *)); - time_t *offset; -{ - time_t t, dt, t0; - struct tm tm; - - /* The maximum number of probes (calls to CONVERT) should be enough - to handle any combinations of time zone rule changes, solar time, - and leap seconds. Posix.1 prohibits leap seconds, but some hosts - have them anyway. */ - int remaining_probes = 4; - - /* Time requested. Copy it in case CONVERT modifies *TP; this can - occur if TP is localtime's returned value and CONVERT is localtime. */ - int sec = tp->tm_sec; - int min = tp->tm_min; - int hour = tp->tm_hour; - int mday = tp->tm_mday; - int mon = tp->tm_mon; - int year_requested = tp->tm_year; - int isdst = tp->tm_isdst; - - /* Ensure that mon is in range, and set year accordingly. */ - int mon_remainder = mon % 12; - int negative_mon_remainder = mon_remainder < 0; - int mon_years = mon / 12 - negative_mon_remainder; - int year = year_requested + mon_years; - - /* The other values need not be in range: - the remaining code handles minor overflows correctly, - assuming int and time_t arithmetic wraps around. - Major overflows are caught at the end. */ - - /* Calculate day of year from year, month, and day of month. - The result need not be in range. */ - int yday = ((__mon_yday[__isleap (year + TM_YEAR_BASE)] - [mon_remainder + 12 * negative_mon_remainder]) - + mday - 1); - - int sec_requested = sec; -#if LEAP_SECONDS_POSSIBLE - /* Handle out-of-range seconds specially, - since ydhms_tm_diff assumes every minute has 60 seconds. */ - if (sec < 0) - sec = 0; - if (59 < sec) - sec = 59; #endif - - /* Invert CONVERT by probing. First assume the same offset as last time. - Then repeatedly use the error to improve the guess. */ - - tm.tm_year = EPOCH_YEAR - TM_YEAR_BASE; - tm.tm_yday = tm.tm_hour = tm.tm_min = tm.tm_sec = 0; - t0 = ydhms_tm_diff (year, yday, hour, min, sec, &tm); - - for (t = t0 + *offset; - (dt = ydhms_tm_diff (year, yday, hour, min, sec, (*convert) (&t, &tm))); - t += dt) - if (--remaining_probes == 0) - return -1; - - /* Check whether tm.tm_isdst has the requested value, if any. */ - if (0 <= isdst && 0 <= tm.tm_isdst) - { - int dst_diff = (isdst != 0) - (tm.tm_isdst != 0); - if (dst_diff) - { - /* Move two hours in the direction indicated by the disagreement, - probe some more, and switch to a new time if found. - The largest known fallback due to daylight savings is two hours: - once, in Newfoundland, 1988-10-30 02:00 -> 00:00. */ - time_t ot = t - 2 * 60 * 60 * dst_diff; - while (--remaining_probes != 0) - { - struct tm otm; - if (! (dt = ydhms_tm_diff (year, yday, hour, min, sec, - (*convert) (&ot, &otm)))) - { - t = ot; - tm = otm; - break; - } - if ((ot += dt) == t) - break; /* Avoid a redundant probe. */ - } - } - } - - *offset = t - t0; - -#if LEAP_SECONDS_POSSIBLE - if (sec_requested != tm.tm_sec) - { - /* Adjust time to reflect the tm_sec requested, not the normalized value. - Also, repair any damage from a false match due to a leap second. */ - t += sec_requested - sec + (sec == 0 && tm.tm_sec == 60); - (*convert) (&t, &tm); - } -#endif - - if (TIME_T_MAX / INT_MAX / 366 / 24 / 60 / 60 < 3) - { - /* time_t isn't large enough to rule out overflows in ydhms_tm_diff, - so check for major overflows. A gross check suffices, - since if t has overflowed, it is off by a multiple of - TIME_T_MAX - TIME_T_MIN + 1. So ignore any component of - the difference that is bounded by a small value. */ - - double dyear = (double) year_requested + mon_years - tm.tm_year; - double dday = 366 * dyear + mday; - double dsec = 60 * (60 * (24 * dday + hour) + min) + sec_requested; - - if (TIME_T_MAX / 3 - TIME_T_MIN / 3 < (dsec < 0 ? - dsec : dsec)) - return -1; - } - - *tp = tm; - return t; -} - -#ifdef weak_alias -weak_alias (mktime, timelocal) -#endif -#endif /* not HAVE_MKTIME */ /* strptime is required by POSIX, but it is missing from Windows, which means we must keep a fallback implementation. It is - reportedly missing or broken on many older systems as well. */ + reportedly missing or broken on many older Unix systems as well, so + it's good to have around. */ #ifndef HAVE_STRPTIME /* From GNU libc 2.1.3. */ @@ -633,8 +351,6 @@ static char const ab_month_name[][4] = # define HERE_T_FMT_AMPM "%I:%M:%S %p" # define HERE_T_FMT "%H:%M:%S" -/* __mon_yday[][] is common to mktime and strptime implementations. - --abbotti */ const unsigned short int __mon_yday[2][13]; # ifndef NEED_MON_YDAY # define NEED_MON_YDAY @@ -962,10 +678,12 @@ strptime_internal (rp, fmt, tm, decided) } #endif if (!match_string (HERE_AM_STR, rp)) - if (match_string (HERE_PM_STR, rp)) - is_pm = 1; - else - return NULL; + { + if (match_string (HERE_PM_STR, rp)) + is_pm = 1; + else + return NULL; + } break; case 'r': #ifdef _NL_CURRENT @@ -1327,8 +1045,6 @@ strptime (buf, format, tm) #endif /* not HAVE_STRPTIME */ #ifdef NEED_MON_YDAY -/* __mon_yday[][] is common to mktime and strptime implementations. - --abbotti */ const unsigned short int __mon_yday[2][13] = { /* Normal years. */ @@ -1347,11 +1063,10 @@ const unsigned short int __mon_yday[2][13] = and given a prefix, but many systems out there are still (as of this writing in 2005) broken and we must cater to them. - Additionally, according to anecdotal evidence and conventional - wisdom I lack courage to challenge, many implementations of fnmatch - are notoriously buggy and unreliable. So we use our version by - default, except when compiling under systems where fnmatch is known - to work (currently on GNU libc-based systems and Solaris.) */ + Additionally, according to some conventional wisdom, many + historical implementations of fnmatch are buggy and unreliable. If + yours is such, undefine SYSTEM_FNMATCH in sysdep.h and tell us + about it. */ #ifndef SYSTEM_FNMATCH @@ -1436,7 +1151,8 @@ fnmatch (const char *pattern, const char *string, int flags) { register const char *np; - for (np = p; np && *np && *np != ']'; np++); + for (np = p; np && *np && *np != ']'; np++) + ; if (np && !*np) { @@ -1523,3 +1239,190 @@ fnmatch (const char *pattern, const char *string, int flags) } #endif /* not SYSTEM_FNMATCH */ + +#ifndef HAVE_TIMEGM +/* timegm is a GNU extension, but lately also available on *BSD + systems and possibly elsewhere. */ + +/* True if YEAR is a leap year. */ +#define ISLEAP(year) \ + ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) + +/* Number of leap years in the range [y1, y2). */ +#define LEAPYEARS(y1, y2) \ + ((y2-1)/4 - (y1-1)/4) - ((y2-1)/100 - (y1-1)/100) + ((y2-1)/400 - (y1-1)/400) + +/* Inverse of gmtime: converts struct tm to time_t, assuming the data + in tm is UTC rather than local timezone. This implementation + returns the number of seconds elapsed since midnight 1970-01-01, + converted to time_t. */ + +time_t +timegm (struct tm *t) +{ + static const unsigned short int month_to_days[][13] = { + { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334 }, /* normal */ + { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335 } /* leap */ + }; + const int year = 1900 + t->tm_year; + unsigned long secs; /* until 2106-02-07 for 32-bit unsigned long */ + int days; + + if (year < 1970) + return (time_t) -1; + + days = 365 * (year - 1970); + /* Take into account leap years between 1970 and YEAR, not counting + YEAR itself. */ + days += LEAPYEARS (1970, year); + if (t->tm_mon < 0 || t->tm_mon >= 12) + return (time_t) -1; + days += month_to_days[ISLEAP (year)][t->tm_mon]; + days += t->tm_mday - 1; + + secs = days * 86400 + t->tm_hour * 3600 + t->tm_min * 60 + t->tm_sec; + return (time_t) secs; +} +#endif /* HAVE_TIMEGM */ + +#ifdef NEED_STRTOLL +/* strtoll is required by C99 and used by Wget only on systems with + LFS. Unfortunately, some systems have LFS, but no strtoll or + equivalent. These include HPUX 11.0 and Windows. + + We use #ifdef NEED_STRTOLL instead of #ifndef HAVE_STRTOLL because + of the systems which have a suitable replacement (e.g. _strtoi64 on + Windows), on which Wget's str_to_wgint is instructed to use that + instead. */ + +static inline int +char_value (char c, int base) +{ + int value; + if (c < '0') + return -1; + if ('0' <= c && c <= '9') + value = c - '0'; + else if ('a' <= c && c <= 'z') + value = c - 'a' + 10; + else if ('A' <= c && c <= 'Z') + value = c - 'A' + 10; + else + return -1; + if (value >= base) + return -1; + return value; +} + +#define STRTOLL_MAX TYPE_MAXIMUM (strtoll_type) +/* This definition assumes two's complement arithmetic */ +#define STRTOLL_MIN (-STRTOLL_MAX - 1) + +/* Like a%b, but always returns a positive number when A is negative. + (C doesn't guarantee the sign of the result.) */ +#define MOD(a, b) ((strtoll_type) -1 % 2 == 1 ? (a) % (b) : - ((a) % (b))) + +/* A strtoll-like replacement for systems that have an integral type + larger than long but don't supply strtoll. This implementation + makes no assumptions about the size of strtoll_type. */ + +strtoll_type +strtoll (const char *nptr, char **endptr, int base) +{ + strtoll_type result = 0; + bool negative; + + if (base != 0 && (base < 2 || base > 36)) + { + errno = EINVAL; + return 0; + } + + while (*nptr == ' ' || *nptr == '\t') + ++nptr; + if (*nptr == '-') + { + negative = true; + ++nptr; + } + else if (*nptr == '+') + { + negative = false; + ++nptr; + } + else + negative = false; + + /* If BASE is 0, determine the real base based on the beginning on + the number; octal numbers begin with "0", hexadecimal with "0x", + and the others are considered octal. */ + if (*nptr == '0') + { + if ((base == 0 || base == 16) + && + (*(nptr + 1) == 'x' || *(nptr + 1) == 'X')) + { + base = 16; + nptr += 2; + /* "0x" must be followed by at least one hex char. If not, + return 0 and place ENDPTR on 'x'. */ + if (!ISXDIGIT (*nptr)) + { + --nptr; + goto out; + } + } + else if (base == 0) + base = 8; + } + else if (base == 0) + base = 10; + + if (!negative) + { + /* Parse positive number, checking for overflow. */ + int digit; + /* Overflow watermark. If RESULT exceeds it, overflow occurs on + this digit. If result==WATERMARK, current digit may not + exceed the last digit of maximum value. */ + const strtoll_type WATERMARK = STRTOLL_MAX / base; + for (; (digit = char_value (*nptr, base)) != -1; ++nptr) + { + if (result > WATERMARK + || (result == WATERMARK && digit > STRTOLL_MAX % base)) + { + result = STRTOLL_MAX; + errno = ERANGE; + break; + } + result = base * result + digit; + } + } + else + { + /* Parse negative number, checking for underflow. */ + int digit; + const strtoll_type WATERMARK = STRTOLL_MIN / base; + for (; (digit = char_value (*nptr, base)) != -1; ++nptr) + { + if (result < WATERMARK + || (result == WATERMARK && digit > MOD (STRTOLL_MIN, base))) + { + result = STRTOLL_MIN; + errno = ERANGE; + break; + } + result = base * result - digit; + } + } + out: + if (endptr) + *endptr = (char *) nptr; + return result; +} + +#undef STRTOLL_MAX +#undef STRTOLL_MIN +#undef ABS + +#endif /* NEED_STRTOLL */