diff options
Diffstat (limited to 'time/strptime.c')
-rw-r--r-- | time/strptime.c | 471 |
1 files changed, 409 insertions, 62 deletions
diff --git a/time/strptime.c b/time/strptime.c index bd38f9681f..f220313475 100644 --- a/time/strptime.c +++ b/time/strptime.c @@ -1,5 +1,5 @@ -/* strptime - Convert a string representation of time to a time value. - Copyright (C) 1996 Free Software Foundation, Inc. +/* Convert a string representation of time to a time value. + Copyright (C) 1996, 1997 Free Software Foundation, Inc. This file is part of the GNU C Library. Contributed by Ulrich Drepper <drepper@cygnus.com>, 1996. @@ -18,24 +18,71 @@ write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */ +/* XXX This version of the implementation is not really complete. + Some of the fields cannot add information alone. But if seeing + some of them in the same format (such as year, week and weekday) + this is enough information for determining the date. */ + +#ifdef HAVE_CONFIG_H +# include <config.h> +#endif + #include <ctype.h> #include <langinfo.h> #include <limits.h> #include <string.h> #include <time.h> -#include "../locale/localeinfo.h" +#ifdef _LIBC +# include "../locale/localeinfo.h" +#endif + + +#ifndef __P +# if defined (__GNUC__) || (defined (__STDC__) && __STDC__) +# define __P(args) args +# else +# define __P(args) () +# endif /* GCC. */ +#endif /* Not __P. */ + +#if ! HAVE_LOCALTIME_R && ! defined (localtime_r) +#ifdef _LIBC +#define localtime_r __localtime_r +#else +/* Approximate localtime_r as best we can in its absence. */ +#define localtime_r my_localtime_r +static struct tm *localtime_r __P ((const time_t *, struct tm *)); +static struct tm * +localtime_r (t, tp) + const time_t *t; + struct tm *tp; +{ + struct tm *l = localtime (t); + if (! l) + return 0; + *tp = *l; + return tp; +} +#endif /* ! _LIBC */ +#endif /* ! HAVE_LOCALTIME_R && ! defined (localtime_r) */ #define match_char(ch1, ch2) if (ch1 != ch2) return NULL -#define match_string(cs1, s2) \ +#if defined __GNUC__ && __GNUC__ >= 2 +# define match_string(cs1, s2) \ ({ size_t len = strlen (cs1); \ - int result = strncasecmp (cs1, s2, len) == 0; \ - if (result) s2 += len; \ + int result = strncasecmp ((cs1), (s2), len) == 0; \ + if (result) (s2) += len; \ result; }) +#else +/* Oh come on. Get a reasonable compiler. */ +# define match_string(cs1, s2) \ + (strncasecmp ((cs1), (s2), strlen (cs1)) ? 0 : ((s2) += strlen (cs1), 1)) +#endif /* We intentionally do not use isdigit() for testing because this will lead to problems with the wide character version. */ -#define get_number(from, to) \ +#define get_number(from, to) \ do { \ val = 0; \ if (*rp < '0' || *rp > '9') \ @@ -47,33 +94,98 @@ if (val < from || val > to) \ return NULL; \ } while (0) -#define get_alt_number(from, to) \ +#ifdef _NL_CURRENT +# define get_alt_number(from, to) \ do { \ - const char *alts = _NL_CURRENT (LC_TIME, ALT_DIGITS); \ - val = 0; \ - while (*alts != '\0') \ + if (*decided != raw) \ { \ - size_t len = strlen (alts); \ - if (strncasecmp (alts, rp, len) == 0) \ - break; \ - alts = strchr (alts, '\0') + 1; \ - ++val; \ + const char *alts = _NL_CURRENT (LC_TIME, ALT_DIGITS); \ + val = 0; \ + while (*alts != '\0') \ + { \ + size_t len = strlen (alts); \ + if (strncasecmp (alts, rp, len) == 0) \ + break; \ + alts = strchr (alts, '\0') + 1; \ + ++val; \ + } \ + if (*alts == '\0') \ + { \ + if (*decided == loc && val != 0) \ + return NULL; \ + } \ + else \ + { \ + *decided = loc; \ + break; \ + } \ } \ - if (*alts == '\0') \ - return NULL; \ - } while (0) -#define recursive(new_fmt) \ - do { \ - if (*new_fmt == '\0') \ - return NULL; \ - rp = strptime (rp, new_fmt, tm); \ - if (rp == NULL) \ - return NULL; \ + get_number (from, to); \ } while (0) +#else +# define get_alt_number(from, to) \ + /* We don't have the alternate representation. */ \ + get_number(from, to) +#endif +#define recursive(new_fmt) \ + (*(new_fmt) != '\0' \ + || strptime_internal (rp, (new_fmt), tm, decided) != NULL) -char * -strptime (const char *buf, const char *format, struct tm *tm) +#ifdef _LIBC +/* This is defined in locale/C-time.c in the GNU libc. */ +extern const struct locale_data _nl_C_LC_TIME; + +# define weekday_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (DAY_1)].string) +# define ab_weekday_name \ + (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (ABDAY_1)].string) +# define month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (MON_1)].string) +# define ab_month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (ABMON_1)].string) +# define HERE_D_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_T_FMT)].string) +# define HERE_D_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_T_FMT)].string) +# define HERE_AM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (AM_STR)].string) +# define HERE_PM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (PM_STR)].string) +# define HERE_T_FMT_AMPM \ + (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT_AMPM)].string) +# define HERE_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT)].string) +#else +static char const weekday_name[][10] = + { + "Sunday", "Monday", "Tuesday", "Wednesday", + "Thursday", "Friday", "Saturday" + }; +static char const ab_weekday_name[][4] = + { + "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" + }; +static char const month_name[][10] = + { + "January", "February", "March", "April", "May", "June", + "July", "August", "September", "October", "November", "December" + }; +static char const ab_month_name[][4] = + { + "Jan", "Feb", "Mar", "Apr", "May", "Jun", + "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" + }; +# define HERE_D_T_FMT "%a %b %e %H:%M:%S %Y" +# define HERE_D_FMT "%m/%d/%y" +# define HERE_AM_STR "AM" +# define HERE_PM_STR "PM" +# define HERE_T_FMT_AMPM "%I:%M:%S %p" +# define HERE_T_FMT "%H:%M:%S" +#endif + +/* Status of lookup: do we use the locale data or the raw data? */ +enum locale_status { not, loc, raw }; + + +static char * +strptime_internal (buf, format, tm, decided) + const char *buf; + const char *format; + struct tm *tm; + enum locale_status *decided; { const char *rp; const char *fmt; @@ -106,6 +218,10 @@ strptime (const char *buf, const char *format, struct tm *tm) } ++fmt; +#ifndef _NL_CURRENT + /* We need this for handling the `E' modifier. */ + start_over: +#endif switch (*fmt++) { case '%': @@ -117,10 +233,34 @@ strptime (const char *buf, const char *format, struct tm *tm) /* Match day of week. */ for (cnt = 0; cnt < 7; ++cnt) { - if (match_string (_NL_CURRENT (LC_TIME, ABDAY_1 + cnt), rp)) - break; - if (match_string (_NL_CURRENT (LC_TIME, DAY_1 + cnt), rp)) - break; +#ifdef _NL_CURRENT + if (*decided !=raw) + { + if (match_string (_NL_CURRENT (LC_TIME, ABDAY_1 + cnt), rp)) + { + if (*decided == not + && strcmp (_NL_CURRENT (LC_TIME, ABDAY_1 + cnt), + ab_weekday_name[cnt])) + *decided = loc; + break; + } + if (match_string (_NL_CURRENT (LC_TIME, DAY_1 + cnt), rp)) + { + if (*decided == not + && strcmp (_NL_CURRENT (LC_TIME, DAY_1 + cnt), + weekday_name[cnt])) + *decided = loc; + break; + } + } +#endif + if (*decided != loc + && (match_string (ab_weekday_name[cnt], rp) + || match_string (weekday_name[cnt], rp))) + { + *decided = raw; + break; + } } if (cnt == 7) /* Does not match a weekday name. */ @@ -133,10 +273,33 @@ strptime (const char *buf, const char *format, struct tm *tm) /* Match month name. */ for (cnt = 0; cnt < 12; ++cnt) { - if (match_string (_NL_CURRENT (LC_TIME, ABMON_1 + cnt), rp)) - break; - if (match_string (_NL_CURRENT (LC_TIME, MON_1 + cnt), rp)) - break; +#ifdef _NL_CURRENT + if (*decided !=raw) + { + if (match_string (_NL_CURRENT (LC_TIME, ABMON_1 + cnt), rp)) + { + if (*decided == not + && strcmp (_NL_CURRENT (LC_TIME, ABMON_1 + cnt), + ab_month_name[cnt])) + *decided = loc; + break; + } + if (match_string (_NL_CURRENT (LC_TIME, MON_1 + cnt), rp)) + { + if (*decided == not + && strcmp (_NL_CURRENT (LC_TIME, MON_1 + cnt), + month_name[cnt])) + *decided = loc; + break; + } + } +#endif + if (match_string (ab_month_name[cnt], rp) + || match_string (month_name[cnt], rp)) + { + *decided = raw; + break; + } } if (cnt == 12) /* Does not match a month name. */ @@ -145,7 +308,26 @@ strptime (const char *buf, const char *format, struct tm *tm) break; case 'c': /* Match locale's date and time format. */ - recursive (_NL_CURRENT (LC_TIME, D_T_FMT)); +#ifdef _NL_CURRENT + if (*decided != raw) + { + if (!recursive (_NL_CURRENT (LC_TIME, D_T_FMT))) + { + if (*decided == loc) + return NULL; + } + else + { + if (*decided == not && + strcmp (_NL_CURRENT (LC_TIME, D_T_FMT), HERE_D_T_FMT)) + *decided = loc; + break; + } + *decided = raw; + } +#endif + if (!recursive (HERE_D_T_FMT)) + return NULL; break; case 'C': /* Match century number. */ @@ -158,9 +340,30 @@ strptime (const char *buf, const char *format, struct tm *tm) get_number (1, 31); tm->tm_mday = val; break; + case 'x': +#ifdef _NL_CURRENT + if (*decided != raw) + { + if (!recursive (_NL_CURRENT (LC_TIME, D_FMT))) + { + if (*decided == loc) + return NULL; + } + else + { + if (decided == not + && strcmp (_NL_CURRENT (LC_TIME, D_FMT), HERE_D_FMT)) + *decided = loc; + break; + } + *decided = raw; + } +#endif + /* Fall through. */ case 'D': /* Match standard day format. */ - recursive ("%m/%d/%y"); + if (!recursive (HERE_D_FMT)) + return NULL; break; case 'H': /* Match hour in 24-hour clock. */ @@ -197,19 +400,57 @@ strptime (const char *buf, const char *format, struct tm *tm) break; case 'p': /* Match locale's equivalent of AM/PM. */ - if (match_string (_NL_CURRENT (LC_TIME, AM_STR), rp)) - break; - if (match_string (_NL_CURRENT (LC_TIME, PM_STR), rp)) +#ifdef _NL_CURRENT + if (*decided != raw) { - is_pm = 1; - break; + if (match_string (_NL_CURRENT (LC_TIME, AM_STR), rp)) + { + if (strcmp (_NL_CURRENT (LC_TIME, AM_STR), HERE_AM_STR)) + *decided = loc; + break; + } + if (match_string (_NL_CURRENT (LC_TIME, PM_STR), rp)) + { + if (strcmp (_NL_CURRENT (LC_TIME, PM_STR), HERE_PM_STR)) + *decided = loc; + is_pm = 1; + break; + } + *decided = raw; } - return NULL; +#endif + if (!match_string (HERE_AM_STR, rp)) + if (match_string (HERE_PM_STR, rp)) + is_pm = 1; + else + return NULL; + break; case 'r': - recursive (_NL_CURRENT (LC_TIME, T_FMT_AMPM)); +#ifdef _NL_CURRENT + if (*decided != raw) + { + if (!recursive (_NL_CURRENT (LC_TIME, T_FMT_AMPM))) + { + if (*decided == loc) + return NULL; + } + else + { + if (*decided == not && + strcmp (_NL_CURRENT (LC_TIME, T_FMT_AMPM), + HERE_T_FMT_AMPM)) + *decided = loc; + break; + } + *decided = raw; + } +#endif + if (!recursive (HERE_T_FMT_AMPM)) + return NULL; break; case 'R': - recursive ("%H:%M"); + if (!recursive ("%H:%M")) + return NULL; break; case 's': { @@ -229,7 +470,7 @@ strptime (const char *buf, const char *format, struct tm *tm) } while (*rp >= '0' && *rp <= '9'); - if (__localtime_r (&secs, tm) == NULL) + if (localtime_r (&secs, tm) == NULL) /* Error in function. */ return NULL; } @@ -238,8 +479,28 @@ strptime (const char *buf, const char *format, struct tm *tm) get_number (0, 61); tm->tm_sec = val; break; + case 'X': +#ifdef _NL_CURRENT + if (*decided != raw) + { + if (!recursive (_NL_CURRENT (LC_TIME, T_FMT))) + { + if (*decided == loc) + return NULL; + } + else + { + if (strcmp (_NL_CURRENT (LC_TIME, T_FMT), HERE_T_FMT)) + *decided = loc; + break; + } + *decided = raw; + } +#endif + /* Fall through. */ case 'T': - recursive ("%H:%M:%S"); + if (!recursive (HERE_T_FMT)) + return NULL; break; case 'u': get_number (1, 7); @@ -262,19 +523,14 @@ strptime (const char *buf, const char *format, struct tm *tm) case 'V': case 'W': get_number (0, 53); - /* XXX This cannot determine any field in TM. */ + /* XXX This cannot determine any field in TM without some + information. */ break; case 'w': /* Match number of weekday. */ get_number (0, 6); tm->tm_wday = val; break; - case 'x': - recursive (_NL_CURRENT (LC_TIME, D_FMT)); - break; - case 'X': - recursive (_NL_CURRENT (LC_TIME, T_FMT)); - break; case 'y': /* Match year within century. */ get_number (0, 99); @@ -289,11 +545,35 @@ strptime (const char *buf, const char *format, struct tm *tm) /* XXX How to handle this? */ break; case 'E': +#ifdef _NL_CURRENT switch (*fmt++) { case 'c': /* Match locale's alternate date and time format. */ - recursive (_NL_CURRENT (LC_TIME, ERA_D_T_FMT)); + if (*decided != raw) + { + const char *fmt = _NL_CURRENT (LC_TIME, ERA_D_T_FMT); + + if (*fmt == '\0') + fmt = _NL_CURRENT (LC_TIME, D_T_FMT); + + if (!recursive (fmt)) + { + if (*decided == loc) + return NULL; + } + else + { + if (strcmp (fmt, HERE_D_T_FMT)) + *decided = loc; + break; + } + *decided = raw; + } + /* The C locale has no era information, so use the + normal representation. */ + if (!recursive (HERE_D_T_FMT)) + return NULL; break; case 'C': case 'y': @@ -301,20 +581,70 @@ strptime (const char *buf, const char *format, struct tm *tm) /* Match name of base year in locale's alternate representation. */ /* XXX This is currently not implemented. It should - use the value _NL_CURRENT (LC_TIME, ERA) but POSIX - leaves this implementation defined and we haven't - figured out how to do it yet. */ + use the value _NL_CURRENT (LC_TIME, ERA). */ break; case 'x': - recursive (_NL_CURRENT (LC_TIME, ERA_D_FMT)); + if (*decided != raw) + { + const char *fmt = _NL_CURRENT (LC_TIME, ERA_D_FMT); + + if (*fmt == '\0') + fmt = _NL_CURRENT (LC_TIME, D_FMT); + + if (!recursive (fmt)) + { + if (*decided == loc) + return NULL; + } + else + { + if (strcmp (fmt, HERE_D_FMT)) + *decided = loc; + break; + } + *decided = raw; + } + if (!recursive (HERE_D_FMT)) + return NULL; break; case 'X': - recursive (_NL_CURRENT (LC_TIME, ERA_T_FMT)); + if (*decided != raw) + { + const char *fmt = _NL_CURRENT (LC_TIME, ERA_T_FMT); + + if (*fmt == '\0') + fmt = _NL_CURRENT (LC_TIME, T_FMT); + + if (!recursive (fmt)) + { + if (*decided == loc) + return NULL; + } + else + { + if (strcmp (fmt, HERE_T_FMT)) + *decided = loc; + break; + } + *decided = raw; + } + if (!recursive (HERE_T_FMT)) + return NULL; break; default: return NULL; } break; +#else + /* We have no information about the era format. Just use + the normal format. */ + if (*fmt != 'c' && *fmt != 'C' && *fmt != 'y' && *fmt != 'Y' + && *fmt != 'x' && *fmt != 'X') + /* This is an illegal format. */ + return NULL; + + goto start_over; +#endif case 'O': switch (*fmt++) { @@ -357,7 +687,8 @@ strptime (const char *buf, const char *format, struct tm *tm) case 'V': case 'W': get_alt_number (0, 53); - /* XXX This cannot determine any field in TM. */ + /* XXX This cannot determine any field in TM without + further information. */ break; case 'w': /* Match number of weekday using alternate numeric symbols. */ @@ -382,3 +713,19 @@ strptime (const char *buf, const char *format, struct tm *tm) return (char *) rp; } + + +char * +strptime (buf, format, tm) + const char *buf; + const char *format; + struct tm *tm; +{ + enum locale_status decided; +#ifdef _NL_CURRENT + decided = not; +#else + decided = raw; +#endif + return strptime_internal (buf, format, tm, &decided); +} |