1 /* Copyright (C) 2002, 2004, 2005, 2007 Free Software Foundation, Inc.
2 This file is part of the GNU C Library.
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2, or (at your option)
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License along
15 with this program; if not, write to the Free Software Foundation,
16 Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
20 # include "strptime.h"
26 # include <langinfo.h>
34 # include "../locale/localeinfo.h"
/* Status value passed around through the `decided' pointer.  The parser
   compares *decided against all three enumerators.  NOTE(review): `not'
   presumably means "not yet decided", `loc' the current locale's
   representation and `raw' the built-in one -- the assignments are not
   visible in this excerpt, so confirm against the full file.  */
39 enum ptime_locale_status { not, loc, raw };
/* Require CH1 and CH2 to be equal: on a mismatch the enclosing function
   returns NULL.  Expands to an unbraced `if' statement, so it must be
   used as a complete statement of its own.  */
44 #define match_char(ch1, ch2) if (ch1 != ch2) return NULL
45 #if defined _LIBC && defined __GNUC__ && __GNUC__ >= 2
46 # define match_string(cs1, s2) \
47 ({ size_t len = strlen (cs1); \
48 int result = __strncasecmp_l ((cs1), (s2), len, locale) == 0; \
49 if (result) (s2) += len; \
52 /* Oh come on. Get a reasonable compiler. */
/* Plain-expression variant of match_string.  Compares the first
   strlen (CS1) characters of S2 with CS1, ignoring case.  On a match it
   advances S2 past the matched text and yields 1; otherwise it yields 0
   and leaves S2 unchanged.  Both arguments are expanded more than once,
   so they must not have side effects.  */
53 # define match_string(cs1, s2) \
54 (strncasecmp ((cs1), (s2), strlen (cs1)) ? 0 : ((s2) += strlen (cs1), 1))
56 /* We intentionally do not use isdigit() for testing because this will
57 lead to problems with the wide character version. */
58 #define get_number(from, to, n) \
64 if (*rp < '0' || *rp > '9') \
69 } while (--__n > 0 && val * 10 <= to && *rp >= '0' && *rp <= '9'); \
70 if (val < from || val > to) \
74 # define get_alt_number(from, to, n) \
76 __label__ do_normal; \
78 if (*decided != raw) \
80 val = _nl_parse_alt_digit (&rp HELPER_LOCALE_ARG); \
81 if (val == -1 && *decided != loc) \
86 if (val < from || val > to) \
92 get_number (from, to, n); \
/* Variant of get_alt_number for builds without alternate-digit support:
   it forwards FROM, TO and N unchanged to get_number.  */
97 # define get_alt_number(from, to, n) \
98 /* We don't have the alternate representation. */ \
99 get_number(from, to, n)
/* Continue parsing at RP with the sub-format NEW_FMT by calling
   __strptime_internal with the caller's TM, DECIDED and ERA_CNT.  The
   call's result is stored back into RP.  The expression is nonzero only
   when NEW_FMT is non-empty and the nested call returned non-NULL; for
   an empty NEW_FMT it is zero and RP is left untouched.  Relies on the
   names rp, tm, decided and era_cnt being in scope at the point of
   use.  */
101 #define recursive(new_fmt) \
102 (*(new_fmt) != '\0' \
103 && (rp = __strptime_internal (rp, (new_fmt), tm, \
104 decided, era_cnt LOCALE_ARG)) != NULL)
108 /* This is defined in locale/C-time.c in the GNU libc. */
109 extern const struct locale_data _nl_C_LC_TIME attribute_hidden;
/* Built-in names and formats expressed in terms of the C locale's
   LC_TIME data (_nl_C_LC_TIME).  The four *_name macros take the address
   of the first item's `string' member so that they can be subscripted
   (e.g. weekday_name[cnt]); the HERE_* macros yield the string value
   itself.  */
111 # define weekday_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (DAY_1)].string)
112 # define ab_weekday_name \
113 (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (ABDAY_1)].string)
114 # define month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (MON_1)].string)
115 # define ab_month_name (&_nl_C_LC_TIME.values[_NL_ITEM_INDEX (ABMON_1)].string)
116 # define HERE_D_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_T_FMT)].string)
117 # define HERE_D_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (D_FMT)].string)
118 # define HERE_AM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (AM_STR)].string)
119 # define HERE_PM_STR (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (PM_STR)].string)
120 # define HERE_T_FMT_AMPM \
121 (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT_AMPM)].string)
122 # define HERE_T_FMT (_nl_C_LC_TIME.values[_NL_ITEM_INDEX (T_FMT)].string)
124 # define strncasecmp(s1, s2, n) __strncasecmp (s1, s2, n)
126 static char const weekday_name[][10] =
128 "Sunday", "Monday", "Tuesday", "Wednesday",
129 "Thursday", "Friday", "Saturday"
131 static char const ab_weekday_name[][4] =
133 "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat"
135 static char const month_name[][10] =
137 "January", "February", "March", "April", "May", "June",
138 "July", "August", "September", "October", "November", "December"
140 static char const ab_month_name[][4] =
142 "Jan", "Feb", "Mar", "Apr", "May", "Jun",
143 "Jul", "Aug", "Sep", "Oct", "Nov", "Dec"
/* String-literal definitions of the HERE_* formats and AM/PM markers.
   The same names are also defined earlier in this file in terms of
   _nl_C_LC_TIME; the preprocessor conditional that selects between the
   two sets is not visible in this excerpt.  */
145 # define HERE_D_T_FMT "%a %b %e %H:%M:%S %Y"
146 # define HERE_D_FMT "%m/%d/%y"
147 # define HERE_AM_STR "AM"
148 # define HERE_PM_STR "PM"
149 # define HERE_T_FMT_AMPM "%I:%M:%S %p"
150 # define HERE_T_FMT "%H:%M:%S"
152 static const unsigned short int __mon_yday[2][13] =
155 { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334, 365 },
157 { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335, 366 }
162 /* We use this code also for the extended locale handling where the
163 function gets as an additional argument the locale which has to be
164 used. To access the values we have to redefine the _NL_CURRENT
166 # define strptime __strptime_l
168 # define _NL_CURRENT(category, item) \
169 (current->values[_NL_ITEM_INDEX (item)].string)
170 # undef _NL_CURRENT_WORD
171 # define _NL_CURRENT_WORD(category, item) \
172 (current->values[_NL_ITEM_INDEX (item)].word)
173 # define LOCALE_PARAM , locale
174 # define LOCALE_ARG , locale
175 # define LOCALE_PARAM_PROTO , __locale_t locale
176 # define LOCALE_PARAM_DECL __locale_t locale;
177 # define HELPER_LOCALE_ARG , current
178 # define ISSPACE(Ch) __isspace_l (Ch, locale)
180 # define LOCALE_PARAM
182 # define LOCALE_PARAM_DECL
183 # define LOCALE_PARAM_PROTO
184 # define HELPER_LOCALE_ARG
185 # define ISSPACE(Ch) isspace (Ch)
192 /* Nonzero if YEAR is a leap year (every 4 years,
193 except every 100th isn't, and every 400th is). */
/* YEAR appears three times in the expansion, so pass an expression
   without side effects.  */
194 # define __isleap(year) \
195 ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0))
198 /* Compute the day of the week. */
200 day_of_the_week (struct tm *tm)
202 /* We know that January 1st 1970 was a Thursday (= 4). Compute the
203 difference between this date and the one in TM and so determine
205 int corr_year = 1900 + tm->tm_year - (tm->tm_mon < 2);
207 + (365 * (tm->tm_year - 70))
209 - ((corr_year / 4) / 25) + ((corr_year / 4) % 25 < 0)
210 + (((corr_year / 4) / 25) / 4)
211 + __mon_yday[0][tm->tm_mon]
213 tm->tm_wday = ((wday % 7) + 7) % 7;
216 /* Compute the day of the year. */
218 day_of_the_year (struct tm *tm)
220 tm->tm_yday = (__mon_yday[__isleap (1900 + tm->tm_year)][tm->tm_mon]
221 + (tm->tm_mday - 1));
231 __strptime_internal (rp, fmt, tm, decided, era_cnt LOCALE_PARAM)
235 enum ptime_locale_status *decided;
240 struct locale_data *const current = locale->__locales[LC_TIME];
243 const char *rp_backup;
247 int century, want_century;
249 int have_wday, want_xday;
251 int have_mon, have_mday;
252 int have_uweek, have_wweek;
255 struct era_entry *era;
264 have_wday = want_xday = have_yday = have_mon = have_mday = have_uweek = 0;
269 /* A white space in the format string matches 0 or more white
270 space characters in the input string. */
273 while (ISSPACE (*rp))
279 /* Any character but `%' must be matched by the same character
280 in the input string. */
283 match_char (*fmt++, *rp++);
289 /* We need this for handling the `E' modifier. */
293 /* Make a backup of the current processing pointer. */
299 /* Match the `%' character itself. */
300 match_char ('%', *rp++);
304 /* Match day of week. */
305 for (cnt = 0; cnt < 7; ++cnt)
310 if (match_string (_NL_CURRENT (LC_TIME, DAY_1 + cnt), rp))
313 && strcmp (_NL_CURRENT (LC_TIME, DAY_1 + cnt),
318 if (match_string (_NL_CURRENT (LC_TIME, ABDAY_1 + cnt), rp))
321 && strcmp (_NL_CURRENT (LC_TIME, ABDAY_1 + cnt),
322 ab_weekday_name[cnt]))
329 && (match_string (weekday_name[cnt], rp)
330 || match_string (ab_weekday_name[cnt], rp)))
337 /* Does not match a weekday name. */
345 /* Match month name. */
346 for (cnt = 0; cnt < 12; ++cnt)
351 if (match_string (_NL_CURRENT (LC_TIME, MON_1 + cnt), rp))
354 && strcmp (_NL_CURRENT (LC_TIME, MON_1 + cnt),
359 if (match_string (_NL_CURRENT (LC_TIME, ABMON_1 + cnt), rp))
362 && strcmp (_NL_CURRENT (LC_TIME, ABMON_1 + cnt),
369 if (match_string (month_name[cnt], rp)
370 || match_string (ab_month_name[cnt], rp))
377 /* Does not match a month name. */
383 /* Match locale's date and time format. */
387 if (!recursive (_NL_CURRENT (LC_TIME, D_T_FMT)))
396 if (*decided == not &&
397 strcmp (_NL_CURRENT (LC_TIME, D_T_FMT), HERE_D_T_FMT))
405 if (!recursive (HERE_D_T_FMT))
410 /* Match century number. */
412 get_number (0, 99, 2);
418 /* Match day of month. */
419 get_number (1, 31, 2);
425 if (!recursive ("%Y-%m-%d"))
433 if (!recursive (_NL_CURRENT (LC_TIME, D_FMT)))
443 && strcmp (_NL_CURRENT (LC_TIME, D_FMT), HERE_D_FMT))
453 /* Match standard day format. */
454 if (!recursive (HERE_D_FMT))
460 /* Match hour in 24-hour clock. */
461 get_number (0, 23, 2);
466 /* Match hour in 12-hour clock. GNU extension. */
468 /* Match hour in 12-hour clock. */
469 get_number (1, 12, 2);
470 tm->tm_hour = val % 12;
474 /* Match day number of year. */
475 get_number (1, 366, 3);
476 tm->tm_yday = val - 1;
480 /* Match number of month. */
481 get_number (1, 12, 2);
482 tm->tm_mon = val - 1;
488 get_number (0, 59, 2);
493 /* Match any white space. */
494 while (ISSPACE (*rp))
498 /* Match locale's equivalent of AM/PM. */
502 if (match_string (_NL_CURRENT (LC_TIME, AM_STR), rp))
504 if (strcmp (_NL_CURRENT (LC_TIME, AM_STR), HERE_AM_STR))
508 if (match_string (_NL_CURRENT (LC_TIME, PM_STR), rp))
510 if (strcmp (_NL_CURRENT (LC_TIME, PM_STR), HERE_PM_STR))
518 if (!match_string (HERE_AM_STR, rp))
520 if (match_string (HERE_PM_STR, rp))
530 if (!recursive (_NL_CURRENT (LC_TIME, T_FMT_AMPM)))
539 if (*decided == not &&
540 strcmp (_NL_CURRENT (LC_TIME, T_FMT_AMPM),
548 if (!recursive (HERE_T_FMT_AMPM))
552 if (!recursive ("%H:%M"))
557 /* The number of seconds may be very high so we cannot use
558 the `get_number' macro. Instead read the number
559 character for character and construct the result while
562 if (*rp < '0' || *rp > '9')
563 /* We need at least one digit. */
571 while (*rp >= '0' && *rp <= '9');
573 if (localtime_r (&secs, tm) == NULL)
574 /* Error in function. */
579 get_number (0, 61, 2);
586 if (!recursive (_NL_CURRENT (LC_TIME, T_FMT)))
595 if (strcmp (_NL_CURRENT (LC_TIME, T_FMT), HERE_T_FMT))
604 if (!recursive (HERE_T_FMT))
608 get_number (1, 7, 1);
609 tm->tm_wday = val % 7;
613 get_number (0, 99, 2);
614 /* XXX This cannot determine any field in TM. */
617 if (*rp < '0' || *rp > '9')
619 /* XXX Ignore the number since we would need some more
620 information to compute a real date. */
623 while (*rp >= '0' && *rp <= '9');
626 get_number (0, 53, 2);
631 get_number (0, 53, 2);
636 get_number (0, 53, 2);
637 /* XXX This cannot determine any field in TM without some
641 /* Match number of weekday. */
642 get_number (0, 6, 1);
647 match_year_in_century:
648 /* Match year within century. */
649 get_number (0, 99, 2);
650 /* The "Year 2000: The Millennium Rollover" paper suggests that
651 values in the range 69-99 refer to the twentieth century. */
652 tm->tm_year = val >= 69 ? val : val + 100;
653 /* Indicate that we want to use the century, if specified. */
658 /* Match year including century number. */
659 get_number (0, 9999, 4);
660 tm->tm_year = val - 1900;
665 /* XXX How to handle this? */
668 /* We recognize two formats: if two digits are given, these
669 specify hours. If four digits are used, minutes are
675 if (*rp != '+' && *rp != '-')
677 bool neg = *rp++ == '-';
679 while (n < 4 && *rp >= '0' && *rp <= '9')
681 val = val * 10 + *rp++ - '0';
687 /* Only two or four digits recognized. */
691 /* We have to convert the minutes into decimal. */
694 val = (val / 100) * 100 + ((val % 100) * 50) / 30;
698 #if defined _LIBC || HAVE_TM_GMTOFF
699 tm->tm_gmtoff = (val * 3600) / 100;
701 tm->tm_gmtoff = -tm->tm_gmtoff;
710 /* Match locale's alternate date and time format. */
713 const char *fmt = _NL_CURRENT (LC_TIME, ERA_D_T_FMT);
716 fmt = _NL_CURRENT (LC_TIME, D_T_FMT);
718 if (!recursive (fmt))
727 if (strcmp (fmt, HERE_D_T_FMT))
734 /* The C locale has no era information, so use the
735 normal representation. */
736 if (!recursive (HERE_D_T_FMT))
745 era = _nl_select_era_entry (era_cnt HELPER_LOCALE_ARG);
746 if (era != NULL && match_string (era->era_name, rp))
755 num_eras = _NL_CURRENT_WORD (LC_TIME,
756 _NL_TIME_ERA_NUM_ENTRIES);
757 for (era_cnt = 0; era_cnt < (int) num_eras;
758 ++era_cnt, rp = rp_backup)
760 era = _nl_select_era_entry (era_cnt
762 if (era != NULL && match_string (era->era_name, rp))
768 if (era_cnt != (int) num_eras)
777 /* The C locale has no era information, so use the
778 normal representation. */
783 get_number(0, 9999, 4);
791 assert (*decided == loc);
793 era = _nl_select_era_entry (era_cnt HELPER_LOCALE_ARG);
797 int delta = ((tm->tm_year - era->offset)
798 * era->absolute_direction);
800 && delta < (((int64_t) era->stop_date[0]
801 - (int64_t) era->start_date[0])
802 * era->absolute_direction));
810 num_eras = _NL_CURRENT_WORD (LC_TIME,
811 _NL_TIME_ERA_NUM_ENTRIES);
812 for (era_cnt = 0; era_cnt < (int) num_eras; ++era_cnt)
814 era = _nl_select_era_entry (era_cnt
818 int delta = ((tm->tm_year - era->offset)
819 * era->absolute_direction);
821 && delta < (((int64_t) era->stop_date[0]
822 - (int64_t) era->start_date[0])
823 * era->absolute_direction))
830 if (era_cnt != (int) num_eras)
840 goto match_year_in_century;
844 num_eras = _NL_CURRENT_WORD (LC_TIME,
845 _NL_TIME_ERA_NUM_ENTRIES);
846 for (era_cnt = 0; era_cnt < (int) num_eras;
847 ++era_cnt, rp = rp_backup)
849 era = _nl_select_era_entry (era_cnt HELPER_LOCALE_ARG);
850 if (era != NULL && recursive (era->era_format))
853 if (era_cnt == (int) num_eras)
870 get_number (0, 9999, 4);
871 tm->tm_year = val - 1900;
878 const char *fmt = _NL_CURRENT (LC_TIME, ERA_D_FMT);
881 fmt = _NL_CURRENT (LC_TIME, D_FMT);
883 if (!recursive (fmt))
892 if (strcmp (fmt, HERE_D_FMT))
898 if (!recursive (HERE_D_FMT))
904 const char *fmt = _NL_CURRENT (LC_TIME, ERA_T_FMT);
907 fmt = _NL_CURRENT (LC_TIME, T_FMT);
909 if (!recursive (fmt))
918 if (strcmp (fmt, HERE_T_FMT))
924 if (!recursive (HERE_T_FMT))
932 /* We have no information about the era format. Just use
933 the normal format. */
934 if (*fmt != 'c' && *fmt != 'C' && *fmt != 'y' && *fmt != 'Y'
935 && *fmt != 'x' && *fmt != 'X')
936 /* This is an illegal format. */
946 /* Match day of month using alternate numeric symbols. */
947 get_alt_number (1, 31, 2);
953 /* Match hour in 24-hour clock using alternate numeric
955 get_alt_number (0, 23, 2);
960 /* Match hour in 12-hour clock using alternate numeric
962 get_alt_number (1, 12, 2);
963 tm->tm_hour = val % 12;
967 /* Match month using alternate numeric symbols. */
968 get_alt_number (1, 12, 2);
969 tm->tm_mon = val - 1;
974 /* Match minutes using alternate numeric symbols. */
975 get_alt_number (0, 59, 2);
979 /* Match seconds using alternate numeric symbols. */
980 get_alt_number (0, 61, 2);
984 get_alt_number (0, 53, 2);
989 get_alt_number (0, 53, 2);
994 get_alt_number (0, 53, 2);
995 /* XXX This cannot determine any field in TM without
996 further information. */
999 /* Match number of weekday using alternate numeric symbols. */
1000 get_alt_number (0, 6, 1);
1005 /* Match year within century using alternate numeric symbols. */
1006 get_alt_number (0, 99, 2);
1007 tm->tm_year = val >= 69 ? val : val + 100;
1019 if (have_I && is_pm)
1025 tm->tm_year = tm->tm_year % 100 + (century - 19) * 100;
1027 /* Only the century, but not the year. Strange, but so be it. */
1028 tm->tm_year = (century - 19) * 100;
1034 era = _nl_select_era_entry (era_cnt HELPER_LOCALE_ARG);
1038 tm->tm_year = (era->start_date[0]
1039 + ((tm->tm_year - era->offset)
1040 * era->absolute_direction));
1042 /* Era start year assumed. */
1043 tm->tm_year = era->start_date[0];
1049 /* No era found but we have seen an E modifier. Rectify some
1051 if (want_century && century == -1 && tm->tm_year < 69)
1055 if (want_xday && !have_wday)
1057 if ( !(have_mon && have_mday) && have_yday)
1059 /* We don't have tm_mon and/or tm_mday, compute them. */
1061 while (__mon_yday[__isleap(1900 + tm->tm_year)][t_mon] <= tm->tm_yday)
1064 tm->tm_mon = t_mon - 1;
1068 - __mon_yday[__isleap(1900 + tm->tm_year)][t_mon - 1] + 1);
1070 day_of_the_week (tm);
1073 if (want_xday && !have_yday)
1074 day_of_the_year (tm);
1076 if ((have_uweek || have_wweek) && have_wday)
1078 int save_wday = tm->tm_wday;
1079 int save_mday = tm->tm_mday;
1080 int save_mon = tm->tm_mon;
1081 int w_offset = have_uweek ? 0 : 1;
1085 day_of_the_week (tm);
1087 tm->tm_mday = save_mday;
1089 tm->tm_mon = save_mon;
1092 tm->tm_yday = ((7 - (tm->tm_wday - w_offset)) % 7
1094 + save_wday - w_offset);
1096 if (!have_mday || !have_mon)
1099 while (__mon_yday[__isleap(1900 + tm->tm_year)][t_mon]
1103 tm->tm_mon = t_mon - 1;
1107 - __mon_yday[__isleap(1900 + tm->tm_year)][t_mon - 1] + 1);
1110 tm->tm_wday = save_wday;
1118 strptime (buf, format, tm LOCALE_PARAM)
1119 const char *restrict buf;
1120 const char *restrict format;
1121 struct tm *restrict tm;
1124 enum ptime_locale_status decided;
1131 return __strptime_internal (buf, format, tm, &decided, -1 LOCALE_ARG);
1135 weak_alias (__strptime_l, strptime_l)