/* For inclusion by datetime.c. A modified version of code from the GNU C library with locale support removed and wchar support added. */ /* Convert a string representation of time to a time value. Copyright (C) 1996, 1997, 1998, 1999, 2000 Free Software Foundation, Inc. This file is part of the GNU C Library. Contributed by Ulrich Drepper , 1996. The GNU C Library is free software; you can redistribute it and/or modify it under the terms of the GNU Library General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. The GNU C Library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Library General Public License for more details. You should have received a copy of the GNU Library General Public License along with the GNU C Library; see the file COPYING.LIB. If not, a copy is available at https://www.R-project.org/Licenses/ */ /* XXX This version of the implementation is not really complete. Some of the fields cannot add information alone. But if seeing some of them in the same format (such as year, week and weekday) this is enough information for determining the date. */ /* #include #include #include */ /* This is C90 */ #ifndef HAVE_LOCALE_H # define HAVE_LOCALE_H 1 #endif static int locale_strings_set = 0; static int locale_w_strings_set = 0; static void get_locale_strings(void); static void get_locale_w_strings(void); #ifdef HAVE_STRINGS_H #include /* for strncasecmp */ #endif #include /* for isspace */ #define match_char(ch1, ch2) if (ch1 != ch2) return NULL /* we guarantee to have strncasecmp in R */ #if defined __GNUC__ && __GNUC__ >= 2 # define match_string(cs1, s2) \ (__extension__ ({ size_t len = strlen (cs1); \ int result = strncasecmp ((cs1), (s2), len) == 0; \ if (result) (s2) += len; \ result; })) #else /* Oh come on. Get a reasonable compiler. */ # define match_string(cs1, s2) \ (strncasecmp ((cs1), (s2), strlen (cs1)) ? 0 : ((s2) += strlen (cs1), 1)) #endif /* We intentionally do not use isdigit() for testing because this will lead to problems with the wide character version. */ #define get_number(from, to, n) \ do { \ int __n = n; \ val = 0; \ while (*rp == ' ') \ ++rp; \ if (*rp < '0' || *rp > '9') \ return NULL; \ do { \ val *= 10; \ val += *rp++ - '0'; \ /* } while (--__n > 0 && val * 10 <= to && *rp >= '0' && *rp <= '9');*/ \ } while (--__n > 0 && *rp >= '0' && *rp <= '9'); \ if (val < from || val > to) \ return NULL; \ } while (0) # define get_alt_number(from, to, n) \ /* We don't have the alternate representation. */ \ get_number(from, to, n) #define recursive(new_fmt) \ (*(new_fmt) != '\0' \ && (rp = strptime_internal (rp, (new_fmt), tm, psecs, poffset)) != NULL) /* This version: may overwrite these with versions for the locale, * hence the extra length of the fields. * The limits here are overestimates from known locales: rare locales * have no abbreviations. * glibc has 11-char am_pm, 10-char abday, 11-char abmon (Dhivehi). * Gaelic has 12-char month names. * Allow for UTF-8 expansion, so these are 4x the wchar limits. */ #define DT_BUFSIZE 100 static char weekday_name[][DT_BUFSIZE] = { "Sunday", "Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday" }; static char ab_weekday_name[][DT_BUFSIZE] = { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" }; static char month_name[][DT_BUFSIZE] = { "January", "February", "March", "April", "May", "June", "July", "August", "September", "October", "November", "December" }; static char ab_month_name[][DT_BUFSIZE] = { "Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" }; static char am_pm[][DT_BUFSIZE] = {"AM", "PM"}; # define HERE_D_T_FMT "%a %b %e %H:%M:%S %Y" # define HERE_D_FMT "%y/%m/%d" # define HERE_T_FMT_AMPM "%I:%M:%S %p" # define HERE_T_FMT "%H:%M:%S" static const unsigned short int __mon_yday[2][13] = { /* Normal years. */ { 0, 31, 59, 90, 120, 151, 181, 212, 243, 273, 304, 334, 365 }, /* Leap years. */ { 0, 31, 60, 91, 121, 152, 182, 213, 244, 274, 305, 335, 366 } }; # define __isleap(year) \ ((year) % 4 == 0 && ((year) % 100 != 0 || (year) % 400 == 0)) /* Compute the day of the week. */ static void day_of_the_week (stm *tm) { /* We know that January 1st 1970 was a Thursday (= 4). Compute the the difference between this data in the one on TM and so determine the weekday. */ int corr_year, wday; /* R bug fix: day_of_the_week needs year, month, mday set */ if(tm->tm_year == NA_INTEGER || tm->tm_mon == NA_INTEGER || tm->tm_mday == NA_INTEGER) return; corr_year = 1900 + tm->tm_year - (tm->tm_mon < 2); wday = (-473 + (365 * (tm->tm_year - 70)) + (corr_year / 4) - ((corr_year / 4) / 25) + ((corr_year / 4) % 25 < 0) + (((corr_year / 4) / 25) / 4) + __mon_yday[0][tm->tm_mon] // no check on month in range + tm->tm_mday - 1); tm->tm_wday = ((wday % 7) + 7) % 7; } /* Compute the day of the year. */ static void day_of_the_year (stm *tm) { /* R bug fix: day_of_the_year needs year, month, mday set */ if(tm->tm_year == NA_INTEGER || tm->tm_mon == NA_INTEGER || tm->tm_mday == NA_INTEGER) return; tm->tm_yday = (__mon_yday[__isleap (1900 + tm->tm_year)][tm->tm_mon] + (tm->tm_mday - 1)); } #include #include #include // to possibly override iswspace #define DT_WBUFSIZE 25 static wchar_t w_weekday_name[][DT_WBUFSIZE] = { L"Sunday", L"Monday", L"Tuesday", L"Wednesday", L"Thursday", L"Friday", L"Saturday" }; static wchar_t w_ab_weekday_name[][DT_WBUFSIZE] = { L"Sun", L"Mon", L"Tue", L"Wed", L"Thu", L"Fri", L"Sat" }; static wchar_t w_month_name[][DT_WBUFSIZE] = { L"January", L"February", L"March", L"April", L"May", L"June", L"July", L"August", L"September", L"October", L"November", L"December" }; static wchar_t w_ab_month_name[][DT_WBUFSIZE] = { L"Jan", L"Feb", L"Mar", L"Apr", L"May", L"Jun", L"Jul", L"Aug", L"Sep", L"Oct", L"Nov", L"Dec" }; static wchar_t w_am_pm[][DT_WBUFSIZE] = {L"AM", L"PM"}; /* Need case-insensitive version */ static int Rwcsncasecmp(const wchar_t *cs1, const wchar_t *s2) { size_t i, n = wcslen(cs1); const wchar_t *a = cs1, *b = s2; for(i = 0; i < n; i++, a++, b++) { if(*b == L'\0' || towlower(*a) != towlower(*b)) return 1; } return 0; } #define w_match_string(cs1, s2) \ (Rwcsncasecmp ((cs1), (s2)) ? 0 : ((s2) += wcslen (cs1), 1)) #define w_recursive(new_fmt) \ (*(new_fmt) != '\0' \ && (rp = w_strptime_internal (rp, (new_fmt), tm, psecs, poffset)) != NULL) static wchar_t * w_strptime_internal (wchar_t *rp, const wchar_t *fmt, stm *tm, double *psecs, int *poffset) { int cnt; int val; int have_I, is_pm; int century, want_century; int have_wday, want_xday; int have_yday; int have_mon, have_mday; int have_uweek, have_wweek; int week_no = 0; /* -Wall */ have_I = is_pm = 0; century = -1; want_century = 0; have_wday = want_xday = have_yday = have_mon = have_mday = 0; have_uweek = have_wweek = 0; while (*fmt != L'\0') { /* A white space in the format string matches 0 more or white space in the input string. */ if (iswspace (*fmt)) { while (iswspace (*rp)) ++rp; ++fmt; continue; } /* Any character but `%' must be matched by the same character in the input string. */ if (*fmt != L'%') { match_char (*fmt++, *rp++); continue; } ++fmt; /* We need this for handling the `E' modifier. */ start_over: switch (*fmt++) { case L'%': /* Match the `%' character itself. */ match_char (L'%', *rp++); break; case L'a': case L'A': /* Match day of week. */ #if defined(HAVE_WCSFTIME) if(!locale_w_strings_set) get_locale_w_strings(); #endif /* try full name first */ for (cnt = 0; cnt < 7; ++cnt) if (w_match_string (w_weekday_name[cnt], rp)) break; if (cnt == 7) { for (cnt = 0; cnt < 7; ++cnt) if (w_match_string (w_ab_weekday_name[cnt], rp)) break; } if (cnt == 7) /* Does not match a weekday name. */ return NULL; tm->tm_wday = cnt; have_wday = 1; break; case L'b': case L'B': case L'h': /* Match month name. */ #if defined(HAVE_WCSFTIME) if(!locale_w_strings_set) get_locale_w_strings(); #endif /* try full name first */ for (cnt = 0; cnt < 12; ++cnt) if (w_match_string (w_month_name[cnt], rp)) break; if (cnt == 12) { /* Try full names */ for (cnt = 0; cnt < 12; ++cnt) if (w_match_string (w_ab_month_name[cnt], rp)) break; } if (cnt == 12) /* Does not match a month name. */ return NULL; tm->tm_mon = cnt; want_xday = 1; break; case L'c': /* Match locale's date and time format. */ if (!w_recursive (L"%a %b %e %H:%M:%S %Y")) /* HERE_D_T_FMT */ return NULL; break; case L'C': /* Match century number. */ get_number (0, 99, 2); century = val; want_xday = 1; break; case L'd': case L'e': /* Match day of month. */ get_number (1, 31, 2); tm->tm_mday = val; have_mday = 1; want_xday = 1; break; case L'F': if (!w_recursive (L"%Y-%m-%d")) return NULL; want_xday = 1; break; case L'x': /* Fall through. */ case L'D': /* Match standard day format. */ if (!w_recursive (L"%y/%m/%d")) /* HERE_D_FMT */ return NULL; want_xday = 1; break; case L'k': case L'H': /* Match hour in 24-hour clock. */ get_number (0, 24, 2); /* allow 24:00:00 */ tm->tm_hour = val; have_I = 0; break; case L'l': /* Match hour in 12-hour clock. GNU extension. */ case L'I': /* Match hour in 12-hour clock. */ get_number (1, 12, 2); tm->tm_hour = val % 12; have_I = 1; break; case L'j': /* Match day number of year. */ get_number (1, 366, 3); // NB: 366 would be invalid in most years tm->tm_yday = val - 1; have_yday = 1; break; case L'm': /* Match number of month. */ get_number (1, 12, 2); tm->tm_mon = val - 1; have_mon = 1; want_xday = 1; break; case L'M': /* Match minute. */ get_number (0, 59, 2); tm->tm_min = val; break; case L'n': case L't': /* Match any white space. */ while (iswspace (*rp)) ++rp; break; case L'p': /* Match locale's equivalent of AM/PM. */ #if defined(HAVE_WCSFTIME) if(!locale_w_strings_set) get_locale_w_strings(); #endif if (!w_match_string (w_am_pm[0], rp)) { if (w_match_string (w_am_pm[1], rp)) is_pm = 1; else return NULL; } break; case L'r': if (!w_recursive (L"%I:%M:%S %p")) /* HERE_T_FMT_AMPM */ return NULL; break; case L'R': if (!w_recursive (L"%H:%M")) return NULL; break; case L's': { /* The number of seconds may be very high so we cannot use the `get_number' macro. Instead read the number character for character and construct the result while doing this. */ time_t secs = 0; if (*rp < L'0' || *rp > L'9') /* We need at least one digit. */ return NULL; do { secs *= 10; secs += *rp++ - L'0'; } while (*rp >= L'0' && *rp <= L'9'); #ifdef HAVE_LOCALTIME_R if ((tm = localtime_r (&secs, tm)) == NULL) return NULL; #else if ((tm = localtime (&secs)) == NULL) return NULL; #endif } break; case L'S': get_number (0, 61, 2); tm->tm_sec = val; break; case L'X': /* Fall through. */ case L'T': if (!w_recursive (L"%H:%M:%S")) /* HERE_T_FMT */ return NULL; break; case L'u': get_number (1, 7, 1); tm->tm_wday = val % 7; have_wday = 1; break; case L'g': get_number (0, 99, 2); /* XXX This cannot determine any field in TM. */ break; case L'G': if (*rp < L'0' || *rp > L'9') return NULL; /* XXX Ignore the number since we would need some more information to compute a real date. */ do ++rp; while (*rp >= L'0' && *rp <= L'9'); break; case L'U': get_number (0, 53, 2); week_no = val; have_uweek = 1; break; case L'W': get_number (0, 53, 2); week_no = val; have_wweek = 1; break; case L'V': get_number (0, 53, 2); /* XXX This cannot determine any field in TM without some information. */ break; case L'w': /* Match number of weekday. */ get_number (0, 6, 1); tm->tm_wday = val; have_wday = 1; break; case L'y': /* Match year within century. */ get_number (0, 99, 2); /* The "Year 2000: The Millennium Rollover" paper suggests that values in the range 69-99 refer to the twentieth century. */ int ival = val; tm->tm_year = ival >= 69 ? ival : ival + 100; /* Indicate that we want to use the century, if specified. */ want_century = 1; want_xday = 1; break; case L'Y': /* Match year including century number. */ get_number (0, 9999, 4); tm->tm_year = val - 1900; want_century = 0; want_xday = 1; break; case L'z': { int n = 0, neg, off = 0; val = 0; while (*rp == L' ') ++rp; if (*rp != L'+' && *rp != L'-') return NULL; neg = *rp++ == L'-'; while (n < 4 && *rp >= L'0' && *rp <= L'9') { val = val * 10 + *rp++ - L'0'; ++n; } if (n != 4) return NULL; else { /* We have to convert the minutes into decimal. */ if (val % 100 >= 60) return NULL; val = (val / 100) * 100 + ((val % 100) * 50) / 30; } /* https://en.wikipedia.org/wiki/List_of_UTC_time_offsets */ if (val > 1400) { warning("values for %%z outside +/-1400 are an error"); return NULL; } off = ((val * 3600) / 100); if (neg) off = -off; *poffset = off; } break; case L'Z': error(_("use of %s for input is not supported"), "%Z"); return NULL; break; case L'E': /* We have no information about the era format. Just use the normal format. */ if (*fmt != L'c' && *fmt != L'C' && *fmt != L'y' && *fmt != L'Y' && *fmt != L'x' && *fmt != L'X') /* This is an illegal format. */ return NULL; goto start_over; case L'O': switch (*fmt++) { case L'd': case L'e': /* Match day of month using alternate numeric symbols. */ get_alt_number (1, 31, 2); tm->tm_mday = val; have_mday = 1; want_xday = 1; break; case L'H': /* Match hour in 24-hour clock using alternate numeric symbols. */ get_alt_number (0, 23, 2); tm->tm_hour = val; have_I = 0; break; case L'I': /* Match hour in 12-hour clock using alternate numeric symbols. */ get_alt_number (1, 12, 2); tm->tm_hour = val % 12; have_I = 1; break; case L'm': /* Match month using alternate numeric symbols. */ get_alt_number (1, 12, 2); tm->tm_mon = val - 1; have_mon = 1; want_xday = 1; break; case L'M': /* Match minutes using alternate numeric symbols. */ get_alt_number (0, 59, 2); tm->tm_min = val; break; case L'S': /* Match seconds using alternate numeric symbols. get_alt_number (0, 61, 2); */ { double sval; wchar_t *end; sval = wcstod(rp, &end); if( sval >= 0.0 && sval <= 61.0) { tm->tm_sec = (int) sval; *psecs = sval; } rp = end; } break; case L'U': get_alt_number (0, 53, 2); week_no = val; have_uweek = 1; break; case L'W': get_alt_number (0, 53, 2); week_no = val; have_wweek = 1; break; case L'V': get_alt_number (0, 53, 2); /* XXX This cannot determine any field in TM without further information. */ break; case L'w': /* Match number of weekday using alternate numeric symbols. */ get_alt_number (0, 6, 1); tm->tm_wday = val; have_wday = 1; break; case L'y': /* Match year within century using alternate numeric symbols. */ get_alt_number (0, 99, 2); int ival = val; tm->tm_year = ival >= 69 ? ival : ival + 100; want_xday = 1; break; default: return NULL; } break; default: return NULL; } } if (have_I && is_pm) tm->tm_hour += 12; if (century != -1) { if (want_century) tm->tm_year = tm->tm_year % 100 + (century - 19) * 100; else /* Only the century, but not the year. Strange, but so be it. */ tm->tm_year = (century - 19) * 100; } if (want_xday && !have_wday) { if ( !(have_mon && have_mday) && have_yday) { /* have_yday, so this must have come from %j */ /* We don't have tm_mon and/or tm_mday, compute them. */ int t_mon = 0; int yr = 1900 + tm->tm_year; if(tm->tm_yday > (__isleap(yr) ? 365 : 364)) { warning("day-of-year %d in year %d is invalid\n", tm->tm_yday+1, yr); t_mon = 12; // this will give an invalid mday, so invalid tm } else { while (__mon_yday[__isleap(yr)][t_mon] <= tm->tm_yday) t_mon++; } if (!have_mon) tm->tm_mon = t_mon - 1; if (!have_mday) tm->tm_mday = (tm->tm_yday - __mon_yday[__isleap(yr)][t_mon - 1] + 1); } day_of_the_week (tm); } if (want_xday && !have_yday) day_of_the_year (tm); if ((have_uweek || have_wweek) && have_wday) { int save_wday = tm->tm_wday; int save_mday = tm->tm_mday; int save_mon = tm->tm_mon; int w_offset = have_uweek ? 0 : 1; tm->tm_mday = 1; tm->tm_mon = 0; day_of_the_week (tm); if (have_mday) tm->tm_mday = save_mday; if (have_mon) tm->tm_mon = save_mon; if (!have_yday) { // Get yday from week and day-of-the-week. // This does not validate yday against any upper limit tm->tm_yday = ((7 - (tm->tm_wday - w_offset)) % 7 + (week_no - 1) *7 + save_wday - w_offset); if(tm->tm_yday < 0) tm->tm_yday += 7; } if (!have_mday || !have_mon) { int t_mon = 0; int yr = 1900 + tm->tm_year; if(tm->tm_yday > (__isleap(yr) ? 365 : 364)) { warning("(0-based) yday %d in year %d is invalid\n", tm->tm_yday, yr); t_mon = 12; } else { while (__mon_yday[__isleap(yr)][t_mon] <= tm->tm_yday) t_mon++; } if (!have_mon) tm->tm_mon = t_mon - 1; if (!have_mday) tm->tm_mday = (tm->tm_yday - __mon_yday[__isleap(yr)][t_mon - 1] + 1); } tm->tm_wday = save_wday; } return rp; } static char * strptime_internal (const char *rp, const char *fmt, stm *tm, double *psecs, int *poffset) { int cnt; int val; int have_I, is_pm; int century, want_century; int have_wday, want_xday; int have_yday; int have_mon, have_mday; int have_uweek, have_wweek; int week_no = 0; /* -Wall */ have_I = is_pm = 0; century = -1; want_century = 0; have_wday = want_xday = have_yday = have_mon = have_mday = 0; have_uweek = have_wweek = 0; while (*fmt != '\0') { /* A white space in the format string matches 0 more or white space in the input string. */ if (isspace ((int)*fmt)) { while (isspace ((int)*rp)) ++rp; ++fmt; continue; } /* Any character but `%' must be matched by the same character in the input string. */ if (*fmt != '%') { match_char (*fmt++, *rp++); continue; } ++fmt; /* We need this for handling the `E' modifier. */ start_over: switch (*fmt++) { case '%': /* Match the `%' character itself. */ match_char ('%', *rp++); break; case 'a': case 'A': /* Match day of week. */ if(!locale_strings_set) get_locale_strings(); /* try full name first */ for (cnt = 0; cnt < 7; ++cnt) if (match_string (weekday_name[cnt], rp)) break; if (cnt == 7) { for (cnt = 0; cnt < 7; ++cnt) if (match_string (ab_weekday_name[cnt], rp)) break; } if (cnt == 7) /* Does not match a weekday name. */ return NULL; tm->tm_wday = cnt; have_wday = 1; break; case 'b': case 'B': case 'h': /* Match month name. */ if(!locale_strings_set) get_locale_strings(); /* try full name first */ for (cnt = 0; cnt < 12; ++cnt) if (match_string (month_name[cnt], rp)) break; if (cnt == 12) { /* Try full names */ for (cnt = 0; cnt < 12; ++cnt) if (match_string (ab_month_name[cnt], rp)) break; } if (cnt == 12) /* Does not match a month name. */ return NULL; tm->tm_mon = cnt; want_xday = 1; break; case 'c': /* Match locale's date and time format. */ if (!recursive (HERE_D_T_FMT)) return NULL; break; case 'C': /* Match century number. */ get_number (0, 99, 2); century = val; want_xday = 1; break; case 'd': case 'e': /* Match day of month. */ get_number (1, 31, 2); tm->tm_mday = val; have_mday = 1; want_xday = 1; break; case 'F': if (!recursive ("%Y-%m-%d")) return NULL; want_xday = 1; break; case 'x': /* Fall through. */ case 'D': /* Match standard day format. */ if (!recursive (HERE_D_FMT)) return NULL; want_xday = 1; break; case 'k': case 'H': /* Match hour in 24-hour clock. */ get_number (0, 24, 2); /* allow 24:00:00 */ tm->tm_hour = val; have_I = 0; break; case 'l': /* Match hour in 12-hour clock. GNU extension. */ case 'I': /* Match hour in 12-hour clock. */ get_number (1, 12, 2); tm->tm_hour = val % 12; have_I = 1; break; case 'j': /* Match day number of year. */ get_number (1, 366, 3); tm->tm_yday = val - 1; have_yday = 1; break; case 'm': /* Match number of month. */ get_number (1, 12, 2); tm->tm_mon = val - 1; have_mon = 1; want_xday = 1; break; case 'M': /* Match minute. */ get_number (0, 59, 2); tm->tm_min = val; break; case 'n': case 't': /* Match any white space. */ while (isspace ((int)*rp)) ++rp; break; case 'p': /* Match locale's equivalent of AM/PM. */ if(!locale_strings_set) get_locale_strings(); if (!match_string (am_pm[0], rp)) { if (match_string (am_pm[1], rp)) is_pm = 1; else return NULL; } break; case 'r': if (!recursive (HERE_T_FMT_AMPM)) return NULL; break; case 'R': if (!recursive ("%H:%M")) return NULL; break; case 's': { /* The number of seconds may be very high so we cannot use the `get_number' macro. Instead read the number character for character and construct the result while doing this. */ time_t secs = 0; if (*rp < '0' || *rp > '9') /* We need at least one digit. */ return NULL; do { secs *= 10; secs += *rp++ - '0'; } while (*rp >= '0' && *rp <= '9'); #ifdef HAVE_LOCALTIME_R if ((tm = localtime_r (&secs, tm)) == NULL) return NULL; #else if ((tm = localtime (&secs)) == NULL) return NULL; #endif } break; case 'S': get_number (0, 61, 2); tm->tm_sec = val; break; case 'X': /* Fall through. */ case 'T': if (!recursive (HERE_T_FMT)) return NULL; break; case 'u': get_number (1, 7, 1); tm->tm_wday = val % 7; have_wday = 1; break; case 'g': get_number (0, 99, 2); /* XXX This cannot determine any field in TM. */ break; case 'G': if (*rp < '0' || *rp > '9') return NULL; /* XXX Ignore the number since we would need some more information to compute a real date. */ do ++rp; while (*rp >= '0' && *rp <= '9'); break; case 'U': get_number (0, 53, 2); week_no = val; have_uweek = 1; break; case 'W': get_number (0, 53, 2); week_no = val; have_wweek = 1; break; case 'V': get_number (0, 53, 2); /* XXX This cannot determine any field in TM without some information. */ break; case 'w': /* Match number of weekday. */ get_number (0, 6, 1); tm->tm_wday = val; have_wday = 1; break; case 'y': /* Match year within century. */ get_number (0, 99, 2); /* The "Year 2000: The Millennium Rollover" paper suggests that values in the range 69-99 refer to the twentieth century. And this is mandated by the POSIX 2001 standard, with a caveat that it might change in future. */ int ival = val; tm->tm_year = ival >= 69 ? ival : ival + 100; /* Indicate that we want to use the century, if specified. */ want_century = 1; want_xday = 1; break; case 'Y': /* Match year including century number. */ get_number (0, 9999, 4); tm->tm_year = val - 1900; want_century = 0; want_xday = 1; break; case 'z': /* Only recognize RFC 822 form */ { int n = 0, neg, off = 0; val = 0; while (*rp == ' ') ++rp; if (*rp != '+' && *rp != '-') return NULL; neg = *rp++ == '-'; while (n < 4 && *rp >= '0' && *rp <= '9') { val = val * 10 + *rp++ - '0'; ++n; } if (n != 4) return NULL; else { /* We have to convert the minutes into decimal. */ if (val % 100 >= 60) return NULL; val = (val / 100) * 100 + ((val % 100) * 50) / 30; } if (val > 1400) { warning("values for %%z outside +/-1400 are an error"); return NULL; } off = (val * 3600) / 100; if (neg) off = -off; *poffset = off; } break; case 'Z': error(_("use of %s for input is not supported"), "%Z"); return NULL; break; case 'E': /* We have no information about the era format. Just use the normal format. */ if (*fmt != 'c' && *fmt != 'C' && *fmt != 'y' && *fmt != 'Y' && *fmt != 'x' && *fmt != 'X') /* This is an illegal format. */ return NULL; goto start_over; case 'O': switch (*fmt++) { case 'd': case 'e': /* Match day of month using alternate numeric symbols. */ get_alt_number (1, 31, 2); tm->tm_mday = val; have_mday = 1; want_xday = 1; break; case 'H': /* Match hour in 24-hour clock using alternate numeric symbols. */ get_alt_number (0, 23, 2); tm->tm_hour = val; have_I = 0; break; case 'I': /* Match hour in 12-hour clock using alternate numeric symbols. */ get_alt_number (1, 12, 2); tm->tm_hour = val % 12; have_I = 1; break; case 'm': /* Match month using alternate numeric symbols. */ get_alt_number (1, 12, 2); tm->tm_mon = val - 1; have_mon = 1; want_xday = 1; break; case 'M': /* Match minutes using alternate numeric symbols. */ get_alt_number (0, 59, 2); tm->tm_min = val; break; case 'S': /* Match seconds using alternate numeric symbols. get_alt_number (0, 61, 2); */ { double sval; char *end; sval = strtod(rp, &end); if( sval >= 0.0 && sval <= 61.0) { tm->tm_sec = (int) sval; *psecs = sval; } rp = end; } break; case 'U': get_alt_number (0, 53, 2); week_no = val; have_uweek = 1; break; case 'W': get_alt_number (0, 53, 2); week_no = val; have_wweek = 1; break; case 'V': get_alt_number (0, 53, 2); /* XXX This cannot determine any field in TM without further information. */ break; case 'w': /* Match number of weekday using alternate numeric symbols. */ get_alt_number (0, 6, 1); tm->tm_wday = val; have_wday = 1; break; case 'y': /* Match year within century using alternate numeric symbols. */ get_alt_number (0, 99, 2); int ival = val; tm->tm_year = ival >= 69 ? ival : ival + 100; want_xday = 1; break; default: return NULL; } break; default: return NULL; } } if (have_I && is_pm) tm->tm_hour += 12; if (century != -1) { if (want_century) tm->tm_year = tm->tm_year % 100 + (century - 19) * 100; else /* Only the century, but not the year. Strange, but so be it. */ tm->tm_year = (century - 19) * 100; } if (want_xday && !have_wday) { if ( !(have_mon && have_mday) && have_yday) { /* have_yday, so this must have come from %j */ /* We don't have tm_mon and/or tm_mday, compute them. */ int t_mon = 0; int yr = 1900 + tm->tm_year; if(tm->tm_yday > (__isleap(yr) ? 365 : 364)) { warning("day-of-year %d in year %d is invalid\n", tm->tm_yday+1, yr); t_mon = 12; } else { while (__mon_yday[__isleap(yr)][t_mon] <= tm->tm_yday) t_mon++; } if (!have_mon) tm->tm_mon = t_mon - 1; if (!have_mday) tm->tm_mday = (tm->tm_yday - __mon_yday[__isleap(yr)][t_mon - 1] + 1); } day_of_the_week (tm); } if (want_xday && !have_yday) day_of_the_year (tm); if ((have_uweek || have_wweek) && have_wday) { int save_wday = tm->tm_wday; int save_mday = tm->tm_mday; int save_mon = tm->tm_mon; int w_offset = have_uweek ? 0 : 1; tm->tm_mday = 1; tm->tm_mon = 0; day_of_the_week (tm); if (have_mday) tm->tm_mday = save_mday; if (have_mon) tm->tm_mon = save_mon; if (!have_yday) tm->tm_yday = ((7 - (tm->tm_wday - w_offset)) % 7 + (week_no - 1) *7 + save_wday - w_offset); if (!have_mday || !have_mon) { int t_mon = 0; int yr = 1900 + tm->tm_year; if(tm->tm_yday > (__isleap(yr) ? 365 : 364)) { warning("(0-based) yday %d in year %d is invalid\n", tm->tm_yday, yr); t_mon = 12; } else { while (__mon_yday[__isleap(yr)][t_mon] <= tm->tm_yday) t_mon++; } if (!have_mon) tm->tm_mon = t_mon - 1; if (!have_mday) tm->tm_mday = (tm->tm_yday - __mon_yday[__isleap(yr)][t_mon - 1] + 1); } tm->tm_wday = save_wday; } return (char *) rp; } /* We could use nl_langinfo() here: see src/extra/timezone/strftime.c But we would stil need to do it this way on Windows, and it is not clear if nl_langinfo() has wchar_t versions (some OSes do, some do not). */ attribute_hidden void dt_invalidate_locale(void) // used in platform.c { locale_strings_set = 0; locale_w_strings_set = 0; } /* use system stuct tm and strftime/wcsftime here */ static void get_locale_strings(void) { int i; struct tm tm; char buff[DT_BUFSIZE]; tm.tm_sec = tm.tm_min = tm.tm_hour = tm.tm_mday = tm.tm_mon = tm.tm_isdst = 0; tm.tm_year = 30; for(i = 0; i < 12; i++) { tm.tm_mon = i; // What happens if this does not fit is not well-defined, // so we null-terminate as a precaution. strftime(ab_month_name[i], DT_BUFSIZE, "%b", &tm); ab_month_name[i][DT_BUFSIZE-1] = '\0'; strftime(month_name[i], DT_BUFSIZE, "%B", &tm); month_name[i][DT_BUFSIZE-1] = '\0'; } tm.tm_mon = 0; for(i = 0; i < 7; i++) { tm.tm_mday = tm.tm_yday = i+1; /* 2000-01-02 was a Sunday */ tm.tm_wday = i; strftime(ab_weekday_name[i], DT_BUFSIZE, "%a", &tm); ab_weekday_name[i][DT_BUFSIZE-1] = '\0'; strftime(weekday_name[i], DT_BUFSIZE, "%A", &tm); weekday_name[i][DT_BUFSIZE-1] = '\0'; } tm.tm_hour = 1; /* in locales where these are unused, they may be empty: better not to reset them then */ strftime(buff, DT_BUFSIZE, "%p", &tm); buff[DT_BUFSIZE-1] = '\0'; if(strlen(buff)) strcpy(am_pm[0], buff); tm.tm_hour = 13; strftime(buff, DT_BUFSIZE, "%p", &tm); buff[DT_BUFSIZE-1] = '\0'; if(strlen(buff)) strcpy(am_pm[1], buff); locale_strings_set = 1; } #if defined(HAVE_WCSTOD) && defined(HAVE_WCSFTIME) static void get_locale_w_strings(void) { int i; struct tm tm; wchar_t buff[DT_WBUFSIZE]; tm.tm_sec = tm.tm_min = tm.tm_hour = tm.tm_mday = tm.tm_mon = tm.tm_isdst = 0; tm.tm_year = 30; for(i = 0; i < 12; i++) { tm.tm_mon = i; wcsftime(w_ab_month_name[i], DT_WBUFSIZE, L"%b", &tm); w_ab_month_name[i][DT_WBUFSIZE - 1] = L'\0'; wcsftime(w_month_name[i], DT_WBUFSIZE, L"%B", &tm); w_month_name[i][DT_WBUFSIZE - 1] = L'\0'; } tm.tm_mon = 0; for(i = 0; i < 7; i++) { tm.tm_mday = tm.tm_yday = i+1; /* 2000-01-02 was a Sunday */ tm.tm_wday = i; wcsftime(w_ab_weekday_name[i], DT_WBUFSIZE, L"%a", &tm); w_ab_weekday_name[i][DT_WBUFSIZE - 1] = L'\0'; wcsftime(w_weekday_name[i], DT_WBUFSIZE, L"%A", &tm); w_weekday_name[i][DT_WBUFSIZE - 1] = L'\0'; } tm.tm_hour = 1; /* in locales where these are unused, they may be empty: better not to reset them then */ wcsftime(buff, DT_WBUFSIZE, L"%p", &tm); buff[DT_WBUFSIZE - 1] = L'\0'; if(wcslen(buff)) wcscpy(w_am_pm[0], buff); tm.tm_hour = 13; wcsftime(buff, DT_WBUFSIZE, L"%p", &tm); buff[DT_WBUFSIZE - 1] = L'\0'; if(wcslen(buff)) wcscpy(w_am_pm[1], buff); locale_w_strings_set = 1; } #endif /* We only care if the result is null or not */ static void * R_strptime (const char *buf, const char *format, stm *tm, double *psecs, int *poffset) { #if defined(HAVE_WCSTOD) if(mbcslocale) { wchar_t wbuf[1001], wfmt[1001]; size_t n; // GCC 12 does not ignore third arg, contradicting the glibc man page // but seems content with 0 rather than 1000. // (Not mentioned by C99/C11). n = mbstowcs(NULL, buf, 0); if(n > 1000) error(_("input string is too long")); n = mbstowcs(wbuf, buf, 1000); if(n == -1) error(_("invalid multibyte input string")); n = mbstowcs(NULL, format, 0); // ditto if(n > 1000) error(_("format string is too long")); n = mbstowcs(wfmt, format, 1000); if(n == -1) error(_("invalid multibyte format string")); return (void *) w_strptime_internal (wbuf, wfmt, tm, psecs, poffset); } else #endif { return (void *) strptime_internal (buf, format, tm, psecs, poffset); } }