1 /* $NetBSD: strptime.c,v 1.38 2013/05/17 12:55:57 joerg Exp $ */
4 * Copyright (c) 1997, 1998, 2005, 2008 The NetBSD Foundation, Inc.
7 * This code was contributed to The NetBSD Foundation by Klaus Klein.
8 * Heavily optimised by David Laight
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
32 #include <sys/cdefs.h>
33 #if defined(LIBC_SCCS) && !defined(lint)
34 __RCSID("$NetBSD: strptime.c,v 1.38 2013/05/17 12:55:57 joerg Exp $");
37 #include "namespace.h"
38 #include <sys/localedef.h>
45 #include "setlocale_local.h"
48 __weak_alias(strptime
,_strptime
)
49 __weak_alias(strptime_l
, _strptime_l
)
/*
 * Fetch the LC_TIME category data of locale `loc' as a _TimeLocale pointer.
 * The data is read from loc->part_impl[], indexed by LC_TIME.
 */
#define _TIME_LOCALE(loc) \
	((_TimeLocale *)((loc)->part_impl[(size_t)LC_TIME]))
/*
 * We do not implement alternate representations. However, we always
 * check whether a given modifier is allowed for a certain conversion.
 */
/*
 * Make the enclosing function return NULL when any modifier flag set in
 * `alt_format' is not contained in the allowed mask `x'.  Relies on a
 * variable named `alt_format' being in scope at the point of use, and on the
 * enclosing function returning a pointer.
 *
 * Wrapped in do { } while (0) so that `LEGAL_ALT(x);' is exactly one
 * statement and remains valid inside an unbraced if/else.
 */
#define LEGAL_ALT(x) \
	do { if (alt_format & ~(x)) return NULL; } while (0)
/*
 * Fixed zone-name strings.  strptime_l() compares the input against `gmt'
 * with strncmp(..., 3).  Both arrays are writable (non-const) char arrays of
 * four bytes including the terminating NUL.
 */
static char gmt[] = "GMT";
static char utc[] = "UTC";
/*
 * RFC-822/RFC-2822 North American zone abbreviations: standard time (nast)
 * and daylight time (nadt), in the order Eastern, Central, Mountain, Pacific.
 * Only the first four entries are names (the lookups in strptime_l() pass a
 * count of 4 to find_string()); the fifth entry is an empty-string filler.
 */
static const char * const nast[5] = {
	"EST", "CST", "MST", "PST", "\0\0\0"
};
static const char * const nadt[5] = {
	"EDT", "CDT", "MDT", "PDT", "\0\0\0"
};
73 static const u_char
*conv_num(const unsigned char *, int *, uint
, uint
);
74 static const u_char
*find_string(const u_char
*, int *, const char * const *,
75 const char * const *, int);
78 strptime(const char *buf
, const char *fmt
, struct tm
*tm
)
80 return strptime_l(buf
, fmt
, tm
, _current_locale());
84 strptime_l(const char *buf
, const char *fmt
, struct tm
*tm
, locale_t loc
)
87 const unsigned char *bp
, *ep
;
88 int alt_format
, i
, split_year
= 0, neg
= 0, offs
;
91 bp
= (const u_char
*)buf
;
93 while (bp
!= NULL
&& (c
= *fmt
++) != '\0') {
94 /* Clear `alternate' modifier prior to new conversion. */
98 /* Eat up white-space. */
109 again
: switch (c
= *fmt
++) {
110 case '%': /* "%%" is converted to "%". */
118 * "Alternative" modifiers. Just set the appropriate flag
119 * and start over again.
121 case 'E': /* "%E?" alternative conversion modifier. */
126 case 'O': /* "%O?" alternative conversion modifier. */
132 * "Complex" conversion rules, implemented through recursion.
134 case 'c': /* Date and time, using the locale's format. */
135 new_fmt
= _TIME_LOCALE(loc
)->d_t_fmt
;
138 case 'D': /* The date as "%m/%d/%y". */
139 new_fmt
= "%m/%d/%y";
143 case 'F': /* The date as "%Y-%m-%d". */
144 new_fmt
= "%Y-%m-%d";
148 case 'R': /* The time as "%H:%M". */
153 case 'r': /* The time in 12-hour clock representation. */
154 new_fmt
= _TIME_LOCALE(loc
)->t_fmt_ampm
;
158 case 'T': /* The time as "%H:%M:%S". */
159 new_fmt
= "%H:%M:%S";
163 case 'X': /* The time, using the locale's format. */
164 new_fmt
= _TIME_LOCALE(loc
)->t_fmt
;
167 case 'x': /* The date, using the locale's format. */
168 new_fmt
= _TIME_LOCALE(loc
)->d_fmt
;
170 bp
= (const u_char
*)strptime((const char *)bp
,
176 * "Elementary" conversion rules.
178 case 'A': /* The day of week, using the locale's form. */
180 bp
= find_string(bp
, &tm
->tm_wday
,
181 _TIME_LOCALE(loc
)->day
, _TIME_LOCALE(loc
)->abday
, 7);
185 case 'B': /* The month, using the locale's form. */
188 bp
= find_string(bp
, &tm
->tm_mon
,
189 _TIME_LOCALE(loc
)->mon
, _TIME_LOCALE(loc
)->abmon
,
194 case 'C': /* The century number. */
196 bp
= conv_num(bp
, &i
, 0, 99);
198 i
= i
* 100 - TM_YEAR_BASE
;
200 i
+= tm
->tm_year
% 100;
206 case 'd': /* The day of month. */
208 bp
= conv_num(bp
, &tm
->tm_mday
, 1, 31);
212 case 'k': /* The hour (24-hour clock representation). */
216 bp
= conv_num(bp
, &tm
->tm_hour
, 0, 23);
220 case 'l': /* The hour (12-hour clock representation). */
224 bp
= conv_num(bp
, &tm
->tm_hour
, 1, 12);
225 if (tm
->tm_hour
== 12)
230 case 'j': /* The day of year. */
232 bp
= conv_num(bp
, &i
, 1, 366);
237 case 'M': /* The minute. */
238 bp
= conv_num(bp
, &tm
->tm_min
, 0, 59);
242 case 'm': /* The month. */
244 bp
= conv_num(bp
, &i
, 1, 12);
249 case 'p': /* The locale's equivalent of AM/PM. */
250 bp
= find_string(bp
, &i
, _TIME_LOCALE(loc
)->am_pm
,
252 if (tm
->tm_hour
> 11)
254 tm
->tm_hour
+= i
* 12;
258 case 'S': /* The seconds. */
259 bp
= conv_num(bp
, &tm
->tm_sec
, 0, 61);
264 #define TIME_MAX INT64_MAX
266 case 's': /* seconds since the epoch */
269 uint64_t rulim
= TIME_MAX
;
271 if (*bp
< '0' || *bp
> '9') {
280 } while ((sse
* 10 <= TIME_MAX
) &&
281 rulim
&& *bp
>= '0' && *bp
<= '9');
283 if (sse
< 0 || (uint64_t)sse
> TIME_MAX
) {
288 if (localtime_r(&sse
, tm
) == NULL
)
293 case 'U': /* The week of year, beginning on sunday. */
294 case 'W': /* The week of year, beginning on monday. */
296 * XXX This is bogus, as we can not assume any valid
297 * information present in the tm structure at this
298 * point to calculate a real value, so just check the
301 bp
= conv_num(bp
, &i
, 0, 53);
305 case 'w': /* The day of week, beginning on sunday. */
306 bp
= conv_num(bp
, &tm
->tm_wday
, 0, 6);
310 case 'u': /* The day of week, monday = 1. */
311 bp
= conv_num(bp
, &i
, 1, 7);
316 case 'g': /* The year corresponding to the ISO week
317 * number but without the century.
319 bp
= conv_num(bp
, &i
, 0, 99);
322 case 'G': /* The year corresponding to the ISO week
323 * number with century.
327 while (isdigit(*bp
));
330 case 'V': /* The ISO 8601:1988 week number as decimal */
331 bp
= conv_num(bp
, &i
, 0, 53);
334 case 'Y': /* The year. */
335 i
= TM_YEAR_BASE
; /* just for data sanity... */
336 bp
= conv_num(bp
, &i
, 0, 9999);
337 tm
->tm_year
= i
- TM_YEAR_BASE
;
341 case 'y': /* The year within 100 years of the epoch. */
342 /* LEGAL_ALT(ALT_E | ALT_O); */
343 bp
= conv_num(bp
, &i
, 0, 99);
346 /* preserve century */
347 i
+= (tm
->tm_year
/ 100) * 100;
351 i
= i
+ 2000 - TM_YEAR_BASE
;
353 i
= i
+ 1900 - TM_YEAR_BASE
;
360 if (strncmp((const char *)bp
, gmt
, 3) == 0) {
370 ep
= find_string(bp
, &i
,
371 (const char * const *)tzname
,
376 tm
->TM_GMTOFF
= -(timezone
);
379 tm
->TM_ZONE
= tzname
[i
];
388 * We recognize all ISO 8601 formats:
393 * We recognize all RFC-822/RFC-2822 formats:
395 * North American : UTC offsets
396 * E[DS]T = Eastern : -4 | -5
397 * C[DS]T = Central : -5 | -6
398 * M[DS]T = Mountain: -6 | -7
399 * P[DS]T = Pacific : -7 | -8
401 * [A-IL-M] = -1 ... -9 (J not used)
433 ep
= find_string(bp
, &i
, nast
, NULL
, 4);
436 tm
->TM_GMTOFF
= -5 - i
;
439 tm
->TM_ZONE
= __UNCONST(nast
[i
]);
444 ep
= find_string(bp
, &i
, nadt
, NULL
, 4);
448 tm
->TM_GMTOFF
= -4 - i
;
451 tm
->TM_ZONE
= __UNCONST(nadt
[i
]);
457 if ((*bp
>= 'A' && *bp
<= 'I') ||
458 (*bp
>= 'L' && *bp
<= 'Y')) {
461 if (*bp
>= 'A' && *bp
<= 'I')
463 ('A' - 1) - (int)*bp
;
464 else if (*bp
>= 'L' && *bp
<= 'M')
465 tm
->TM_GMTOFF
= 'A' - (int)*bp
;
466 else if (*bp
>= 'N' && *bp
<= 'Y')
467 tm
->TM_GMTOFF
= (int)*bp
- 'M';
470 tm
->TM_ZONE
= NULL
; /* XXX */
478 for (i
= 0; i
< 4; ) {
480 offs
= offs
* 10 + (*bp
++ - '0');
484 if (i
== 2 && *bp
== ':') {
498 /* Convert minutes into decimal */
499 offs
= (offs
/ 100) * 100 + (i
* 50) / 30;
506 tm
->tm_isdst
= 0; /* XXX */
508 tm
->TM_GMTOFF
= offs
;
511 tm
->TM_ZONE
= NULL
; /* XXX */
516 * Miscellaneous conversions.
518 case 'n': /* Any kind of white-space. */
526 default: /* Unknown/unsupported conversion. */
531 return __UNCONST(bp
);
535 static const u_char
*
536 conv_num(const unsigned char *buf
, int *dest
, uint llim
, uint ulim
)
541 /* The limit also determines the number of valid digits. */
545 if (ch
< '0' || ch
> '9')
553 } while ((result
* 10 <= ulim
) && rulim
&& ch
>= '0' && ch
<= '9');
555 if (result
< llim
|| result
> ulim
)
562 static const u_char
*
563 find_string(const u_char
*bp
, int *tgt
, const char * const *n1
,
564 const char * const *n2
, int c
)
569 /* check full name - then abbreviated ones */
570 for (; n1
!= NULL
; n1
= n2
, n2
= NULL
) {
571 for (i
= 0; i
< c
; i
++, n1
++) {
573 if (strncasecmp(*n1
, (const char *)bp
, len
) == 0) {
580 /* Nothing matched */