X-Git-Url: http://sjero.net/git/?p=wget;a=blobdiff_plain;f=src%2Fcmpt.c;h=4bd582c85dff8342106f552e2af008d0c4d8949d;hp=4b4d68cb4b34e9bc3b76689f9f3ec258b2e113fa;hb=4d7c5e087b2bc82c9f503dff003916d1047903ce;hpb=0b056d17201d2bae32857dbec4c8f7a95578cdf9 diff --git a/src/cmpt.c b/src/cmpt.c index 4b4d68cb..4bd582c8 100644 --- a/src/cmpt.c +++ b/src/cmpt.c @@ -1,11 +1,11 @@ /* Replacements for routines missing on some systems. - Copyright (C) 1995, 1996, 1997 Free Software Foundation, Inc. + Copyright (C) 1996-2006 Free Software Foundation, Inc. This file is part of GNU Wget. GNU Wget is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by -the Free Software Foundation; either version 2 of the License, or +the Free Software Foundation; either version 3 of the License, or (at your option) any later version. GNU Wget is distributed in the hope that it will be useful, @@ -14,40 +14,46 @@ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License -along with Wget; if not, write to the Free Software -Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ +along with Wget. If not, see . + +In addition, as a special exception, the Free Software Foundation +gives permission to link the code of its release of Wget with the +OpenSSL project's "OpenSSL" library (or with modified versions of it +that use the same license as the "OpenSSL" library), and distribute +the linked executables. You must obey the GNU General Public License +in all respects for all of the code used other than "OpenSSL". If you +modify this file, you may extend this exception to your version of the +file, but you are not obligated to do so. If you do not wish to do +so, delete this exception statement from your version. */ #include #include #include -#ifdef HAVE_STRING_H -# include -#else -# include -#endif /* HAVE_STRING_H */ +#include +#include -#include #ifdef HAVE_UNISTD_H # include #endif -#include -#include "wget.h" +#include -#ifndef HAVE_STRERROR -/* A strerror() clone, for systems that don't have it. */ -char * -strerror (int err) -{ - /* This loses on a system without `sys_errlist'. */ - extern char *sys_errlist[]; - return sys_errlist[err]; -} -#endif /* not HAVE_STRERROR */ +#include "wget.h" -/* Some systems don't have some str* functions in libc. Here we - define them. The same goes for strptime. */ +/* Some systems lack certain functions normally taken for granted. + For example, Windows doesn't have strptime, and some systems don't + have a usable fnmatch. This file should contain fallback + implementations of such missing functions. It should *not* define + new Wget-specific interfaces -- those should be placed in utils.c + or elsewhere. */ + +/* strcasecmp and strncasecmp apparently originated with BSD 4.4. + SUSv3 seems to be the only standard out there (that I can find) + that requires their existence, so in theory there might be systems + still in use that lack them. Note that these don't get defined + under Windows because mswindows.h defines them to the equivalent + Windows functions stricmp and strnicmp. */ #ifndef HAVE_STRCASECMP /* From GNU libc. */ @@ -105,387 +111,34 @@ strncasecmp (const char *s1, const char *s2, size_t n) } #endif /* not HAVE_STRNCASECMP */ -#ifndef HAVE_STRSTR -/* From GNU libc 2.0.6. */ -/* Return the first ocurrence of NEEDLE in HAYSTACK. */ -/* - * My personal strstr() implementation that beats most other algorithms. - * Until someone tells me otherwise, I assume that this is the - * fastest implementation of strstr() in C. - * I deliberately chose not to comment it. You should have at least - * as much fun trying to understand it, as I had to write it :-). - * - * Stephen R. van den Berg, berg@pool.informatik.rwth-aachen.de */ -typedef unsigned chartype; - -char * -strstr (phaystack, pneedle) - const char *phaystack; - const char *pneedle; -{ - register const unsigned char *haystack, *needle; - register chartype b, c; - - haystack = (const unsigned char *) phaystack; - needle = (const unsigned char *) pneedle; - - b = *needle; - if (b != '\0') - { - haystack--; /* possible ANSI violation */ - do - { - c = *++haystack; - if (c == '\0') - goto ret0; - } - while (c != b); - - c = *++needle; - if (c == '\0') - goto foundneedle; - ++needle; - goto jin; - - for (;;) - { - register chartype a; - register const unsigned char *rhaystack, *rneedle; - - do - { - a = *++haystack; - if (a == '\0') - goto ret0; - if (a == b) - break; - a = *++haystack; - if (a == '\0') - goto ret0; -shloop: } - while (a != b); - -jin: a = *++haystack; - if (a == '\0') - goto ret0; - - if (a != c) - goto shloop; - - rhaystack = haystack-- + 1; - rneedle = needle; - a = *rneedle; - - if (*rhaystack == a) - do - { - if (a == '\0') - goto foundneedle; - ++rhaystack; - a = *++needle; - if (*rhaystack != a) - break; - if (a == '\0') - goto foundneedle; - ++rhaystack; - a = *++needle; - } - while (*rhaystack == a); - - needle = rneedle; /* took the register-poor approach */ - - if (a == '\0') - break; - } - } -foundneedle: - return (char*) haystack; -ret0: - return 0; -} -#endif /* not HAVE_STRSTR */ - -#ifndef HAVE_MKTIME -/* From GNU libc 2.0. */ - -/* Copyright (C) 1993, 1994, 1995, 1996, 1997 Free Software Foundation, Inc. - This file is part of the GNU C Library. - Contributed by Paul Eggert (eggert@twinsun.com). */ - -#ifdef _LIBC -# define HAVE_LIMITS_H 1 -# define HAVE_LOCALTIME_R 1 -# define STDC_HEADERS 1 -#endif - -/* Assume that leap seconds are possible, unless told otherwise. - If the host has a `zic' command with a `-L leapsecondfilename' option, - then it supports leap seconds; otherwise it probably doesn't. */ -#ifndef LEAP_SECONDS_POSSIBLE -# define LEAP_SECONDS_POSSIBLE 1 -#endif - -#ifndef __P -# define __P(args) PARAMS (args) -#endif /* Not __P. */ - -#ifndef CHAR_BIT -# define CHAR_BIT 8 -#endif - -#ifndef INT_MIN -# define INT_MIN (~0 << (sizeof (int) * CHAR_BIT - 1)) -#endif -#ifndef INT_MAX -# define INT_MAX (~0 - INT_MIN) -#endif - -#ifndef TIME_T_MIN -/* The outer cast to time_t works around a bug in Cray C 5.0.3.0. */ -# define TIME_T_MIN ((time_t) \ - (0 < (time_t) -1 ? (time_t) 0 \ - : ~ (time_t) 0 << (sizeof (time_t) * CHAR_BIT - 1))) -#endif -#ifndef TIME_T_MAX -# define TIME_T_MAX (~ (time_t) 0 - TIME_T_MIN) -#endif - -#define TM_YEAR_BASE 1900 -#define EPOCH_YEAR 1970 - -#ifndef __isleap -/* Nonzero if YEAR is a leap year (every 4 years, - except every 100th isn't, and every 400th is). */ -# define __isleap(year) \ - ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) -#endif - -/* How many days come before each month (0-12). */ -const unsigned short int __mon_yday[2][13] = - { - /* Normal years. */ - { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334, 365 }, - /* Leap years. */ - { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335, 366 } - }; - -static time_t ydhms_tm_diff __P ((int, int, int, int, int, const struct tm *)); -time_t __mktime_internal __P ((struct tm *, - struct tm *(*) (const time_t *, struct tm *), - time_t *)); - - -#ifdef _LIBC -# define localtime_r __localtime_r -#else -# if ! HAVE_LOCALTIME_R && ! defined localtime_r -/* Approximate localtime_r as best we can in its absence. */ -# define localtime_r my_mktime_localtime_r -static struct tm *localtime_r __P ((const time_t *, struct tm *)); -static struct tm * -localtime_r (t, tp) - const time_t *t; - struct tm *tp; -{ - struct tm *l = localtime (t); - if (! l) - return 0; - *tp = *l; - return tp; -} -# endif /* ! HAVE_LOCALTIME_R && ! defined (localtime_r) */ -#endif /* ! _LIBC */ - - -/* Yield the difference between (YEAR-YDAY HOUR:MIN:SEC) and (*TP), - measured in seconds, ignoring leap seconds. - YEAR uses the same numbering as TM->tm_year. - All values are in range, except possibly YEAR. - If overflow occurs, yield the low order bits of the correct answer. */ -static time_t -ydhms_tm_diff (year, yday, hour, min, sec, tp) - int year, yday, hour, min, sec; - const struct tm *tp; -{ - /* Compute intervening leap days correctly even if year is negative. - Take care to avoid int overflow. time_t overflow is OK, since - only the low order bits of the correct time_t answer are needed. - Don't convert to time_t until after all divisions are done, since - time_t might be unsigned. */ - int a4 = (year >> 2) + (TM_YEAR_BASE >> 2) - ! (year & 3); - int b4 = (tp->tm_year >> 2) + (TM_YEAR_BASE >> 2) - ! (tp->tm_year & 3); - int a100 = a4 / 25 - (a4 % 25 < 0); - int b100 = b4 / 25 - (b4 % 25 < 0); - int a400 = a100 >> 2; - int b400 = b100 >> 2; - int intervening_leap_days = (a4 - b4) - (a100 - b100) + (a400 - b400); - time_t years = year - (time_t) tp->tm_year; - time_t days = (365 * years + intervening_leap_days - + (yday - tp->tm_yday)); - return (60 * (60 * (24 * days + (hour - tp->tm_hour)) - + (min - tp->tm_min)) - + (sec - tp->tm_sec)); -} - +#ifndef HAVE_MEMRCHR +/* memrchr is a GNU extension. It is like the memchr function, except + that it searches backwards from the end of the n bytes pointed to + by s instead of forwards from the front. */ -static time_t localtime_offset; - -/* Convert *TP to a time_t value. */ -time_t -mktime (tp) - struct tm *tp; +void * +memrchr (const void *s, int c, size_t n) { -#ifdef _LIBC - /* POSIX.1 8.1.1 requires that whenever mktime() is called, the - time zone names contained in the external variable `tzname' shall - be set as if the tzset() function had been called. */ - __tzset (); -#endif - - return __mktime_internal (tp, localtime_r, &localtime_offset); -} - -/* Convert *TP to a time_t value, inverting - the monotonic and mostly-unit-linear conversion function CONVERT. - Use *OFFSET to keep track of a guess at the offset of the result, - compared to what the result would be for UTC without leap seconds. - If *OFFSET's guess is correct, only one CONVERT call is needed. */ -time_t -__mktime_internal (tp, convert, offset) - struct tm *tp; - struct tm *(*convert) __P ((const time_t *, struct tm *)); - time_t *offset; -{ - time_t t, dt, t0; - struct tm tm; - - /* The maximum number of probes (calls to CONVERT) should be enough - to handle any combinations of time zone rule changes, solar time, - and leap seconds. Posix.1 prohibits leap seconds, but some hosts - have them anyway. */ - int remaining_probes = 4; - - /* Time requested. Copy it in case CONVERT modifies *TP; this can - occur if TP is localtime's returned value and CONVERT is localtime. */ - int sec = tp->tm_sec; - int min = tp->tm_min; - int hour = tp->tm_hour; - int mday = tp->tm_mday; - int mon = tp->tm_mon; - int year_requested = tp->tm_year; - int isdst = tp->tm_isdst; - - /* Ensure that mon is in range, and set year accordingly. */ - int mon_remainder = mon % 12; - int negative_mon_remainder = mon_remainder < 0; - int mon_years = mon / 12 - negative_mon_remainder; - int year = year_requested + mon_years; - - /* The other values need not be in range: - the remaining code handles minor overflows correctly, - assuming int and time_t arithmetic wraps around. - Major overflows are caught at the end. */ - - /* Calculate day of year from year, month, and day of month. - The result need not be in range. */ - int yday = ((__mon_yday[__isleap (year + TM_YEAR_BASE)] - [mon_remainder + 12 * negative_mon_remainder]) - + mday - 1); - - int sec_requested = sec; -#if LEAP_SECONDS_POSSIBLE - /* Handle out-of-range seconds specially, - since ydhms_tm_diff assumes every minute has 60 seconds. */ - if (sec < 0) - sec = 0; - if (59 < sec) - sec = 59; -#endif - - /* Invert CONVERT by probing. First assume the same offset as last time. - Then repeatedly use the error to improve the guess. */ - - tm.tm_year = EPOCH_YEAR - TM_YEAR_BASE; - tm.tm_yday = tm.tm_hour = tm.tm_min = tm.tm_sec = 0; - t0 = ydhms_tm_diff (year, yday, hour, min, sec, &tm); - - for (t = t0 + *offset; - (dt = ydhms_tm_diff (year, yday, hour, min, sec, (*convert) (&t, &tm))); - t += dt) - if (--remaining_probes == 0) - return -1; - - /* Check whether tm.tm_isdst has the requested value, if any. */ - if (0 <= isdst && 0 <= tm.tm_isdst) - { - int dst_diff = (isdst != 0) - (tm.tm_isdst != 0); - if (dst_diff) - { - /* Move two hours in the direction indicated by the disagreement, - probe some more, and switch to a new time if found. - The largest known fallback due to daylight savings is two hours: - once, in Newfoundland, 1988-10-30 02:00 -> 00:00. */ - time_t ot = t - 2 * 60 * 60 * dst_diff; - while (--remaining_probes != 0) - { - struct tm otm; - if (! (dt = ydhms_tm_diff (year, yday, hour, min, sec, - (*convert) (&ot, &otm)))) - { - t = ot; - tm = otm; - break; - } - if ((ot += dt) == t) - break; /* Avoid a redundant probe. */ - } - } - } - - *offset = t - t0; - -#if LEAP_SECONDS_POSSIBLE - if (sec_requested != tm.tm_sec) - { - /* Adjust time to reflect the tm_sec requested, not the normalized value. - Also, repair any damage from a false match due to a leap second. */ - t += sec_requested - sec + (sec == 0 && tm.tm_sec == 60); - (*convert) (&t, &tm); - } -#endif - - if (TIME_T_MAX / INT_MAX / 366 / 24 / 60 / 60 < 3) - { - /* time_t isn't large enough to rule out overflows in ydhms_tm_diff, - so check for major overflows. A gross check suffices, - since if t has overflowed, it is off by a multiple of - TIME_T_MAX - TIME_T_MIN + 1. So ignore any component of - the difference that is bounded by a small value. */ - - double dyear = (double) year_requested + mon_years - tm.tm_year; - double dday = 366 * dyear + mday; - double dsec = 60 * (60 * (24 * dday + hour) + min) + sec_requested; - - if (TIME_T_MAX / 3 - TIME_T_MIN / 3 < (dsec < 0 ? - dsec : dsec)) - return -1; - } - - *tp = tm; - return t; + const char *b = s; + const char *e = b + n; + while (e > b) + if (*--e == c) + return (void *) e; + return NULL; } - -#ifdef weak_alias -weak_alias (mktime, timelocal) #endif -#endif /* not HAVE_MKTIME */ - + +/* strptime is required by POSIX, but it is missing from Windows, + which means we must keep a fallback implementation. It is + reportedly missing or broken on many older Unix systems as well, so + it's good to have around. */ #ifndef HAVE_STRPTIME -/* From GNU libc 2.0.6. */ +/* From GNU libc 2.1.3. */ /* Ulrich, thanks for helping me out with this! --hniksic */ /* strptime - Convert a string representation of time to a time value. - Copyright (C) 1996, 1997 Free Software Foundation, Inc. + Copyright (C) 1996, 1997, 1998, 1999, 2000 Free Software Foundation, Inc. This file is part of the GNU C Library. Contributed by Ulrich Drepper , 1996. */ @@ -495,15 +148,15 @@ weak_alias (mktime, timelocal) this is enough information for determining the date. */ #ifndef __P -# define __P(args) PARAMS (args) +# define __P(args) args #endif /* not __P */ -#if ! HAVE_LOCALTIME_R && ! defined (localtime_r) -#ifdef _LIBC -#define localtime_r __localtime_r -#else +#if ! HAVE_LOCALTIME_R && ! defined localtime_r +# ifdef _LIBC +# define localtime_r __localtime_r +# else /* Approximate localtime_r as best we can in its absence. */ -#define localtime_r my_localtime_r +# define localtime_r my_localtime_r static struct tm *localtime_r __P ((const time_t *, struct tm *)); static struct tm * localtime_r (t, tp) @@ -516,7 +169,7 @@ localtime_r (t, tp) *tp = *l; return tp; } -#endif /* ! _LIBC */ +# endif /* ! _LIBC */ #endif /* ! HAVE_LOCALTIME_R && ! defined (localtime_r) */ @@ -534,50 +187,118 @@ localtime_r (t, tp) #endif /* We intentionally do not use isdigit() for testing because this will lead to problems with the wide character version. */ -#define get_number(from, to) \ +#define get_number(from, to, n) \ do { \ + int __n = n; \ val = 0; \ + while (*rp == ' ') \ + ++rp; \ if (*rp < '0' || *rp > '9') \ return NULL; \ do { \ val *= 10; \ val += *rp++ - '0'; \ - } while (val * 10 <= to && *rp >= '0' && *rp <= '9'); \ + } while (--__n > 0 && val * 10 <= to && *rp >= '0' && *rp <= '9'); \ if (val < from || val > to) \ return NULL; \ } while (0) #ifdef _NL_CURRENT -# define get_alt_number(from, to) \ - do { \ +/* Added check for __GNUC__ extensions here for Wget. --abbotti */ +# if defined __GNUC__ && __GNUC__ >= 2 +# define get_alt_number(from, to, n) \ + ({ \ + __label__ do_normal; \ if (*decided != raw) \ { \ const char *alts = _NL_CURRENT (LC_TIME, ALT_DIGITS); \ + int __n = n; \ + int any = 0; \ + while (*rp == ' ') \ + ++rp; \ val = 0; \ - while (*alts != '\0') \ - { \ - size_t len = strlen (alts); \ - if (strncasecmp (alts, rp, len) == 0) \ + do { \ + val *= 10; \ + while (*alts != '\0') \ + { \ + size_t len = strlen (alts); \ + if (strncasecmp (alts, rp, len) == 0) \ + break; \ + alts += len + 1; \ + ++val; \ + } \ + if (*alts == '\0') \ + { \ + if (*decided == not && ! any) \ + goto do_normal; \ + /* If we haven't read anything it's an error. */ \ + if (! any) \ + return NULL; \ + /* Correct the premature multiplication. */ \ + val /= 10; \ break; \ - alts = strchr (alts, '\0') + 1; \ - ++val; \ - } \ - if (*alts == '\0') \ - { \ - if (*decided == loc && val != 0) \ - return NULL; \ - } \ - else \ - { \ + } \ + else \ *decided = loc; \ - break; \ - } \ + } while (--__n > 0 && val * 10 <= to); \ + if (val < from || val > to) \ + return NULL; \ + } \ + else \ + { \ + do_normal: \ + get_number (from, to, n); \ + } \ + 0; \ + }) +# else +# define get_alt_number(from, to, n) \ + do { + if (*decided != raw) \ + { \ + const char *alts = _NL_CURRENT (LC_TIME, ALT_DIGITS); \ + int __n = n; \ + int any = 0; \ + while (*rp == ' ') \ + ++rp; \ + val = 0; \ + do { \ + val *= 10; \ + while (*alts != '\0') \ + { \ + size_t len = strlen (alts); \ + if (strncasecmp (alts, rp, len) == 0) \ + break; \ + alts += len + 1; \ + ++val; \ + } \ + if (*alts == '\0') \ + { \ + if (*decided == not && ! any) \ + goto do_normal; \ + /* If we haven't read anything it's an error. */ \ + if (! any) \ + return NULL; \ + /* Correct the premature multiplication. */ \ + val /= 10; \ + break; \ + } \ + else \ + *decided = loc; \ + } while (--__n > 0 && val * 10 <= to); \ + if (val < from || val > to) \ + return NULL; \ + } \ + else \ + { \ + do_normal: \ + get_number (from, to, n); \ } \ - get_number (from, to); \ } while (0) +# endif /* defined __GNUC__ && __GNUC__ >= 2 */ #else -# define get_alt_number(from, to) \ +# define get_alt_number(from, to, n) \ /* We don't have the alternate representation. */ \ - get_number(from, to) + get_number(from, to, n) #endif #define recursive(new_fmt) \ (*(new_fmt) != '\0' \ @@ -587,6 +308,7 @@ localtime_r (t, tp) #ifdef _LIBC /* This is defined in locale/C-time.c in the GNU libc. */ extern const struct locale_data _nl_C_LC_TIME; +extern const unsigned short int __mon_yday[2][13]; # define weekday_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (DAY_1)].string) # define ab_weekday_name \ @@ -594,12 +316,14 @@ extern const struct locale_data _nl_C_LC_TIME; # define month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (MON_1)].string) # define ab_month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (ABMON_1)].string) # define HERE_D_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_T_FMT)].string) -# define HERE_D_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_T_FMT)].string) +# define HERE_D_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_FMT)].string) # define HERE_AM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (AM_STR)].string) # define HERE_PM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (PM_STR)].string) # define HERE_T_FMT_AMPM \ (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT_AMPM)].string) # define HERE_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT)].string) + +# define strncasecmp(s1, s2, n) __strncasecmp (s1, s2, n) #else static char const weekday_name[][10] = { @@ -626,31 +350,82 @@ static char const ab_month_name[][4] = # define HERE_PM_STR "PM" # define HERE_T_FMT_AMPM "%I:%M:%S %p" # define HERE_T_FMT "%H:%M:%S" + +const unsigned short int __mon_yday[2][13]; +# ifndef NEED_MON_YDAY +# define NEED_MON_YDAY +# endif #endif /* Status of lookup: do we use the locale data or the raw data? */ enum locale_status { not, loc, raw }; + +#ifndef __isleap +/* Nonzero if YEAR is a leap year (every 4 years, + except every 100th isn't, and every 400th is). */ +# define __isleap(year) \ + ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) +#endif + +/* Compute the day of the week. */ +static void +day_of_the_week (struct tm *tm) +{ + /* We know that January 1st 1970 was a Thursday (= 4). Compute the + the difference between this data in the one on TM and so determine + the weekday. */ + int corr_year = 1900 + tm->tm_year - (tm->tm_mon < 2); + int wday = (-473 + + (365 * (tm->tm_year - 70)) + + (corr_year / 4) + - ((corr_year / 4) / 25) + ((corr_year / 4) % 25 < 0) + + (((corr_year / 4) / 25) / 4) + + __mon_yday[0][tm->tm_mon] + + tm->tm_mday - 1); + tm->tm_wday = ((wday % 7) + 7) % 7; +} + +/* Compute the day of the year. */ +static void +day_of_the_year (struct tm *tm) +{ + tm->tm_yday = (__mon_yday[__isleap (1900 + tm->tm_year)][tm->tm_mon] + + (tm->tm_mday - 1)); +} + static char * +#ifdef _LIBC +internal_function +#endif strptime_internal __P ((const char *buf, const char *format, struct tm *tm, enum locale_status *decided)); static char * -strptime_internal (buf, format, tm, decided) - const char *buf; - const char *format; +#ifdef _LIBC +internal_function +#endif +strptime_internal (rp, fmt, tm, decided) + const char *rp; + const char *fmt; struct tm *tm; enum locale_status *decided; { - const char *rp; - const char *fmt; +#ifdef _NL_CURRENT + const char *rp_backup; +#endif int cnt; size_t val; int have_I, is_pm; + int century, want_century; + int have_wday, want_xday; + int have_yday; + int have_mon, have_mday; - rp = buf; - fmt = format; have_I = is_pm = 0; + century = -1; + want_century = 0; + have_wday = want_xday = have_yday = have_mon = have_mday = 0; while (*fmt != '\0') { @@ -677,6 +452,12 @@ strptime_internal (buf, format, tm, decided) /* We need this for handling the `E' modifier. */ start_over: #endif + +#ifdef _NL_CURRENT + /* Make back up of current processing pointer. */ + rp_backup = rp; +#endif + switch (*fmt++) { case '%': @@ -721,6 +502,7 @@ strptime_internal (buf, format, tm, decided) /* Does not match a weekday name. */ return NULL; tm->tm_wday = cnt; + have_wday = 1; break; case 'b': case 'B': @@ -760,6 +542,7 @@ strptime_internal (buf, format, tm, decided) /* Does not match a month name. */ return NULL; tm->tm_mon = cnt; + want_xday = 1; break; case 'c': /* Match locale's date and time format. */ @@ -770,12 +553,15 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { if (*decided == not && strcmp (_NL_CURRENT (LC_TIME, D_T_FMT), HERE_D_T_FMT)) *decided = loc; + want_xday = 1; break; } *decided = raw; @@ -783,17 +569,26 @@ strptime_internal (buf, format, tm, decided) #endif if (!recursive (HERE_D_T_FMT)) return NULL; + want_xday = 1; break; case 'C': /* Match century number. */ - get_number (0, 99); - /* We don't need the number. */ + get_number (0, 99, 2); + century = val; + want_xday = 1; break; case 'd': case 'e': /* Match day of month. */ - get_number (1, 31); + get_number (1, 31, 2); tm->tm_mday = val; + have_mday = 1; + want_xday = 1; + break; + case 'F': + if (!recursive ("%Y-%m-%d")) + return NULL; + want_xday = 1; break; case 'x': #ifdef _NL_CURRENT @@ -803,12 +598,15 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { - if (decided == not + if (*decided == not && strcmp (_NL_CURRENT (LC_TIME, D_FMT), HERE_D_FMT)) *decided = loc; + want_xday = 1; break; } *decided = raw; @@ -819,32 +617,37 @@ strptime_internal (buf, format, tm, decided) /* Match standard day format. */ if (!recursive (HERE_D_FMT)) return NULL; + want_xday = 1; break; + case 'k': case 'H': /* Match hour in 24-hour clock. */ - get_number (0, 23); + get_number (0, 23, 2); tm->tm_hour = val; have_I = 0; break; case 'I': /* Match hour in 12-hour clock. */ - get_number (1, 12); + get_number (1, 12, 2); tm->tm_hour = val % 12; have_I = 1; break; case 'j': /* Match day number of year. */ - get_number (1, 366); + get_number (1, 366, 3); tm->tm_yday = val - 1; + have_yday = 1; break; case 'm': /* Match number of month. */ - get_number (1, 12); + get_number (1, 12, 2); tm->tm_mon = val - 1; + have_mon = 1; + want_xday = 1; break; case 'M': /* Match minute. */ - get_number (0, 59); + get_number (0, 59, 2); tm->tm_min = val; break; case 'n': @@ -875,10 +678,12 @@ strptime_internal (buf, format, tm, decided) } #endif if (!match_string (HERE_AM_STR, rp)) - if (match_string (HERE_PM_STR, rp)) - is_pm = 1; - else - return NULL; + { + if (match_string (HERE_PM_STR, rp)) + is_pm = 1; + else + return NULL; + } break; case 'r': #ifdef _NL_CURRENT @@ -888,6 +693,8 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { @@ -913,7 +720,7 @@ strptime_internal (buf, format, tm, decided) the `get_number' macro. Instead read the number character for character and construct the result while doing this. */ - time_t secs; + time_t secs = 0; if (*rp < '0' || *rp > '9') /* We need at least one digit. */ return NULL; @@ -931,7 +738,7 @@ strptime_internal (buf, format, tm, decided) } break; case 'S': - get_number (0, 61); + get_number (0, 61, 2); tm->tm_sec = val; break; case 'X': @@ -942,6 +749,8 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { @@ -958,11 +767,12 @@ strptime_internal (buf, format, tm, decided) return NULL; break; case 'u': - get_number (1, 7); + get_number (1, 7, 1); tm->tm_wday = val % 7; + have_wday = 1; break; case 'g': - get_number (0, 99); + get_number (0, 99, 2); /* XXX This cannot determine any field in TM. */ break; case 'G': @@ -977,27 +787,32 @@ strptime_internal (buf, format, tm, decided) case 'U': case 'V': case 'W': - get_number (0, 53); + get_number (0, 53, 2); /* XXX This cannot determine any field in TM without some information. */ break; case 'w': /* Match number of weekday. */ - get_number (0, 6); + get_number (0, 6, 1); tm->tm_wday = val; + have_wday = 1; break; case 'y': /* Match year within century. */ - get_number (0, 99); - tm->tm_year = val >= 50 ? val : val + 100; + get_number (0, 99, 2); + /* The "Year 2000: The Millennium Rollover" paper suggests that + values in the range 69-99 refer to the twentieth century. */ + tm->tm_year = val >= 69 ? val : val + 100; + /* Indicate that we want to use the century, if specified. */ + want_century = 1; + want_xday = 1; break; case 'Y': /* Match year including century number. */ - if (sizeof (time_t) > 4) - get_number (0, 9999); - else - get_number (0, 2036); + get_number (0, 9999, 4); tm->tm_year = val - 1900; + want_century = 0; + want_xday = 1; break; case 'Z': /* XXX How to handle this? */ @@ -1019,11 +834,14 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { if (strcmp (fmt, HERE_D_T_FMT)) *decided = loc; + want_xday = 1; break; } *decided = raw; @@ -1032,6 +850,7 @@ strptime_internal (buf, format, tm, decided) normal representation. */ if (!recursive (HERE_D_T_FMT)) return NULL; + want_xday = 1; break; case 'C': case 'y': @@ -1053,6 +872,8 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { @@ -1077,6 +898,8 @@ strptime_internal (buf, format, tm, decided) { if (*decided == loc) return NULL; + else + rp = rp_backup; } else { @@ -1109,53 +932,60 @@ strptime_internal (buf, format, tm, decided) case 'd': case 'e': /* Match day of month using alternate numeric symbols. */ - get_alt_number (1, 31); + get_alt_number (1, 31, 2); tm->tm_mday = val; + have_mday = 1; + want_xday = 1; break; case 'H': /* Match hour in 24-hour clock using alternate numeric symbols. */ - get_alt_number (0, 23); + get_alt_number (0, 23, 2); tm->tm_hour = val; have_I = 0; break; case 'I': /* Match hour in 12-hour clock using alternate numeric symbols. */ - get_alt_number (1, 12); + get_alt_number (1, 12, 2); tm->tm_hour = val - 1; have_I = 1; break; case 'm': /* Match month using alternate numeric symbols. */ - get_alt_number (1, 12); + get_alt_number (1, 12, 2); tm->tm_mon = val - 1; + have_mon = 1; + want_xday = 1; break; case 'M': /* Match minutes using alternate numeric symbols. */ - get_alt_number (0, 59); + get_alt_number (0, 59, 2); tm->tm_min = val; break; case 'S': /* Match seconds using alternate numeric symbols. */ - get_alt_number (0, 61); + get_alt_number (0, 61, 2); tm->tm_sec = val; break; case 'U': case 'V': case 'W': - get_alt_number (0, 53); + get_alt_number (0, 53, 2); /* XXX This cannot determine any field in TM without further information. */ break; case 'w': /* Match number of weekday using alternate numeric symbols. */ - get_alt_number (0, 6); + get_alt_number (0, 6, 1); tm->tm_wday = val; + have_wday = 1; break; case 'y': /* Match year within century using alternate numeric symbols. */ - get_alt_number (0, 99); + get_alt_number (0, 99, 2); + tm->tm_year = val >= 69 ? val : val + 100; + want_xday = 1; break; default: return NULL; @@ -1169,6 +999,31 @@ strptime_internal (buf, format, tm, decided) if (have_I && is_pm) tm->tm_hour += 12; + if (century != -1) + { + if (want_century) + tm->tm_year = tm->tm_year % 100 + (century - 19) * 100; + else + /* Only the century, but not the year. Strange, but so be it. */ + tm->tm_year = (century - 19) * 100; + } + + if (want_xday && !have_wday) { + if ( !(have_mon && have_mday) && have_yday) { + /* we don't have tm_mon and/or tm_mday, compute them */ + int t_mon = 0; + while (__mon_yday[__isleap(1900 + tm->tm_year)][t_mon] <= tm->tm_yday) + t_mon++; + if (!have_mon) + tm->tm_mon = t_mon - 1; + if (!have_mday) + tm->tm_mday = tm->tm_yday - __mon_yday[__isleap(1900 + tm->tm_year)][t_mon - 1] + 1; + } + day_of_the_week (tm); + } + if (want_xday && !have_yday) + day_of_the_year (tm); + return (char *) rp; } @@ -1188,3 +1043,386 @@ strptime (buf, format, tm) return strptime_internal (buf, format, tm, &decided); } #endif /* not HAVE_STRPTIME */ + +#ifdef NEED_MON_YDAY +const unsigned short int __mon_yday[2][13] = + { + /* Normal years. */ + { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334, 365 }, + /* Leap years. */ + { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335, 366 } + }; +#endif + +/* fnmatch is required by POSIX, but we include an implementation for + the sake of systems that don't have it, most notably Windows. Some + systems do have fnmatch, but Apache's installation process installs + its own fnmatch.h (incompatible with the system one!) in a system + include directory, effectively rendering fnmatch unusable. This + has been fixed with Apache 2, where fnmatch has been moved to apr + and given a prefix, but many systems out there are still (as of + this writing in 2005) broken and we must cater to them. + + Additionally, according to some conventional wisdom, many + historical implementations of fnmatch are buggy and unreliable. If + yours is such, undefine SYSTEM_FNMATCH in sysdep.h and tell us + about it. */ + +#ifndef SYSTEM_FNMATCH + +#define __FNM_FLAGS (FNM_PATHNAME | FNM_NOESCAPE | FNM_PERIOD) + +/* Match STRING against the filename pattern PATTERN, returning zero + if it matches, FNM_NOMATCH if not. This implementation comes from + an earlier version of GNU Bash. (It doesn't make sense to update + it with a newer version because those versions add a lot of + features Wget doesn't use or care about.) */ + +int +fnmatch (const char *pattern, const char *string, int flags) +{ + register const char *p = pattern, *n = string; + register char c; + + if ((flags & ~__FNM_FLAGS) != 0) + { + errno = EINVAL; + return (-1); + } + + while ((c = *p++) != '\0') + { + switch (c) + { + case '?': + if (*n == '\0') + return (FNM_NOMATCH); + else if ((flags & FNM_PATHNAME) && *n == '/') + return (FNM_NOMATCH); + else if ((flags & FNM_PERIOD) && *n == '.' && + (n == string || ((flags & FNM_PATHNAME) && n[-1] == '/'))) + return (FNM_NOMATCH); + break; + + case '\\': + if (!(flags & FNM_NOESCAPE)) + c = *p++; + if (*n != c) + return (FNM_NOMATCH); + break; + + case '*': + if ((flags & FNM_PERIOD) && *n == '.' && + (n == string || ((flags & FNM_PATHNAME) && n[-1] == '/'))) + return (FNM_NOMATCH); + + for (c = *p++; c == '?' || c == '*'; c = *p++, ++n) + if (((flags & FNM_PATHNAME) && *n == '/') || + (c == '?' && *n == '\0')) + return (FNM_NOMATCH); + + if (c == '\0') + return (0); + + { + char c1 = (!(flags & FNM_NOESCAPE) && c == '\\') ? *p : c; + for (--p; *n != '\0'; ++n) + if ((c == '[' || *n == c1) && + fnmatch (p, n, flags & ~FNM_PERIOD) == 0) + return (0); + return (FNM_NOMATCH); + } + + case '[': + { + /* Nonzero if the sense of the character class is + inverted. */ + register int not; + + if (*n == '\0') + return (FNM_NOMATCH); + + if ((flags & FNM_PERIOD) && *n == '.' && + (n == string || ((flags & FNM_PATHNAME) && n[-1] == '/'))) + return (FNM_NOMATCH); + + /* Make sure there is a closing `]'. If there isn't, + the `[' is just a character to be matched. */ + { + register const char *np; + + for (np = p; np && *np && *np != ']'; np++) + ; + + if (np && !*np) + { + if (*n != '[') + return (FNM_NOMATCH); + goto next_char; + } + } + + not = (*p == '!' || *p == '^'); + if (not) + ++p; + + c = *p++; + while (1) + { + register char cstart = c, cend = c; + + if (!(flags & FNM_NOESCAPE) && c == '\\') + cstart = cend = *p++; + + if (c == '\0') + /* [ (unterminated) loses. */ + return (FNM_NOMATCH); + + c = *p++; + + if ((flags & FNM_PATHNAME) && c == '/') + /* [/] can never match. */ + return (FNM_NOMATCH); + + if (c == '-' && *p != ']') + { + cend = *p++; + if (!(flags & FNM_NOESCAPE) && cend == '\\') + cend = *p++; + if (cend == '\0') + return (FNM_NOMATCH); + c = *p++; + } + + if (*n >= cstart && *n <= cend) + goto matched; + + if (c == ']') + break; + } + if (!not) + return (FNM_NOMATCH); + + next_char: + break; + + matched: + /* Skip the rest of the [...] that already matched. */ + while (c != ']') + { + if (c == '\0') + /* [... (unterminated) loses. */ + return (FNM_NOMATCH); + + c = *p++; + if (!(flags & FNM_NOESCAPE) && c == '\\') + /* 1003.2d11 is unclear if this is right. %%% */ + ++p; + } + if (not) + return (FNM_NOMATCH); + } + break; + + default: + if (c != *n) + return (FNM_NOMATCH); + } + + ++n; + } + + if (*n == '\0') + return (0); + + return (FNM_NOMATCH); +} + +#endif /* not SYSTEM_FNMATCH */ + +#ifndef HAVE_TIMEGM +/* timegm is a GNU extension, but lately also available on *BSD + systems and possibly elsewhere. */ + +/* True if YEAR is a leap year. */ +#define ISLEAP(year) \ + ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) + +/* Number of leap years in the range [y1, y2). */ +#define LEAPYEARS(y1, y2) \ + ((y2-1)/4 - (y1-1)/4) - ((y2-1)/100 - (y1-1)/100) + ((y2-1)/400 - (y1-1)/400) + +/* Inverse of gmtime: converts struct tm to time_t, assuming the data + in tm is UTC rather than local timezone. This implementation + returns the number of seconds elapsed since midnight 1970-01-01, + converted to time_t. */ + +time_t +timegm (struct tm *t) +{ + static const unsigned short int month_to_days[][13] = { + { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334 }, /* normal */ + { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335 } /* leap */ + }; + const int year = 1900 + t->tm_year; + unsigned long secs; /* until 2106-02-07 for 32-bit unsigned long */ + int days; + + if (year < 1970) + return (time_t) -1; + + days = 365 * (year - 1970); + /* Take into account leap years between 1970 and YEAR, not counting + YEAR itself. */ + days += LEAPYEARS (1970, year); + if (t->tm_mon < 0 || t->tm_mon >= 12) + return (time_t) -1; + days += month_to_days[ISLEAP (year)][t->tm_mon]; + days += t->tm_mday - 1; + + secs = days * 86400 + t->tm_hour * 3600 + t->tm_min * 60 + t->tm_sec; + return (time_t) secs; +} +#endif /* HAVE_TIMEGM */ + +#ifdef NEED_STRTOLL +/* strtoll is required by C99 and used by Wget only on systems with + LFS. Unfortunately, some systems have LFS, but no strtoll or + equivalent. These include HPUX 11.0 and Windows. + + We use #ifdef NEED_STRTOLL instead of #ifndef HAVE_STRTOLL because + of the systems which have a suitable replacement (e.g. _strtoi64 on + Windows), on which Wget's str_to_wgint is instructed to use that + instead. */ + +static inline int +char_value (char c, int base) +{ + int value; + if (c < '0') + return -1; + if ('0' <= c && c <= '9') + value = c - '0'; + else if ('a' <= c && c <= 'z') + value = c - 'a' + 10; + else if ('A' <= c && c <= 'Z') + value = c - 'A' + 10; + else + return -1; + if (value >= base) + return -1; + return value; +} + +#define STRTOLL_MAX TYPE_MAXIMUM (strtoll_type) +/* This definition assumes two's complement arithmetic */ +#define STRTOLL_MIN (-STRTOLL_MAX - 1) + +/* Like a%b, but always returns a positive number when A is negative. + (C doesn't guarantee the sign of the result.) */ +#define MOD(a, b) ((strtoll_type) -1 % 2 == 1 ? (a) % (b) : - ((a) % (b))) + +/* A strtoll-like replacement for systems that have an integral type + larger than long but don't supply strtoll. This implementation + makes no assumptions about the size of strtoll_type. */ + +strtoll_type +strtoll (const char *nptr, char **endptr, int base) +{ + strtoll_type result = 0; + bool negative; + + if (base != 0 && (base < 2 || base > 36)) + { + errno = EINVAL; + return 0; + } + + while (*nptr == ' ' || *nptr == '\t') + ++nptr; + if (*nptr == '-') + { + negative = true; + ++nptr; + } + else if (*nptr == '+') + { + negative = false; + ++nptr; + } + else + negative = false; + + /* If BASE is 0, determine the real base based on the beginning on + the number; octal numbers begin with "0", hexadecimal with "0x", + and the others are considered octal. */ + if (*nptr == '0') + { + if ((base == 0 || base == 16) + && + (*(nptr + 1) == 'x' || *(nptr + 1) == 'X')) + { + base = 16; + nptr += 2; + /* "0x" must be followed by at least one hex char. If not, + return 0 and place ENDPTR on 'x'. */ + if (!ISXDIGIT (*nptr)) + { + --nptr; + goto out; + } + } + else if (base == 0) + base = 8; + } + else if (base == 0) + base = 10; + + if (!negative) + { + /* Parse positive number, checking for overflow. */ + int digit; + /* Overflow watermark. If RESULT exceeds it, overflow occurs on + this digit. If result==WATERMARK, current digit may not + exceed the last digit of maximum value. */ + const strtoll_type WATERMARK = STRTOLL_MAX / base; + for (; (digit = char_value (*nptr, base)) != -1; ++nptr) + { + if (result > WATERMARK + || (result == WATERMARK && digit > STRTOLL_MAX % base)) + { + result = STRTOLL_MAX; + errno = ERANGE; + break; + } + result = base * result + digit; + } + } + else + { + /* Parse negative number, checking for underflow. */ + int digit; + const strtoll_type WATERMARK = STRTOLL_MIN / base; + for (; (digit = char_value (*nptr, base)) != -1; ++nptr) + { + if (result < WATERMARK + || (result == WATERMARK && digit > MOD (STRTOLL_MIN, base))) + { + result = STRTOLL_MIN; + errno = ERANGE; + break; + } + result = base * result - digit; + } + } + out: + if (endptr) + *endptr = (char *) nptr; + return result; +} + +#undef STRTOLL_MAX +#undef STRTOLL_MIN +#undef ABS + +#endif /* NEED_STRTOLL */