]> diplodocus.org Git - nmh/blob - sbr/dtimep.l
Makefile.am: Add test/inc/test-eom-align to XFAIL_TESTS.
[nmh] / sbr / dtimep.l
1 /* dtimep.l -- parse dates and times.
2 *
3 * This exceeds the default table capacities for some old versions
4 * of lex (and the minimum defaults as specified by POSIX). The following
5 * choices meet or exceed the lex defaults for older SunOS4.x, Solaris,
6 * HPUX, and AIX.
7 */
8 %e4000
9 %p7000
10 %n2500
11 %a5000
12 %{
13 #include <h/nmh.h>
14 #include <h/tws.h>
15
16 /* Since we're looking at a string at a time, don't worry about
17 * wrapping to the next buffer.
18 */
19 #if YY_FLEX_MAJOR_VERSION == 2 && \
20 YY_FLEX_MINOR_VERSION == 6 && \
21 YY_FLEX_SUBMINOR_VERSION == 3
22 /* https://github.com/westes/flex/issues/162 */
23 #undef yywrap
24 #endif
25 #define yywrap() 1
26 #define YY_SKIP_YYWRAP
27
28 #define YY_NO_INPUT
29
30 /* This is the tricky thing that makes this function cool. We
31 * replace the traditional int yylex(void) declaration with our
32 * dparsetime() declaration, essentially piggy-backing off the
33 * utility of the yylex() function and adding what we need to make
34 * the parsing function useful to us.
35 */
36 #define YY_DECL struct tws *dparsetime(char *lexstr)
37
38 /* yyterminate() is called after the input string is matched to
39 * completion (actually, when the lexer reaches an EOF). The only
40 * thing that really needs to be in this macro function is the
41 * return call, which must be substituted inline into dparsetime.
42 */
43
/* Expands inside dparsetime(): releases the scan buffer and returns.
 *
 * Returns NULL unless a rule set TW_SUCC in tw.tw_flags; otherwise
 * returns the address of tw after normalizing abbreviated years.
 *
 * Only the 2-digit (00-99) and 3-digit "1dd" (100-199) year forms are
 * offsets that need a century added.  A 2-digit year is mapped into
 * 1970-2069; a 3-digit year is an offset from 1900.  Larger values are
 * explicit years and are left untouched, so a year such as 1965 is no
 * longer pushed to 3865.
 *
 * Wrapped in do { } while (0) so the expansion is a single statement.
 */
#define yyterminate() do { \
	yy_delete_buffer(lexhandle); \
	if (!(tw.tw_flags & TW_SUCC)) \
		return (struct tws *) NULL; \
	if (tw.tw_year < 200) { \
		tw.tw_year += 1900; \
		if (tw.tw_year < 1970) \
			tw.tw_year += 100; \
	} \
	return &tw; \
} while (0)
53
/*
 * Month-name lookup: hash -> month number (Jan = 0 ... Dec = 11).
 *
 * The hash is the low 5 bits of the sum of the 2nd and 3rd characters
 * of the name; it is collision-free for the 12 valid month names.
 * Flipping the case of a letter changes the sum by 32, which the 5-bit
 * mask discards, so any mix of upper and lower case hashes the same.
 * Slots not listed here are zero.
 */
static int month_map[] = {
	[15] = 0,	/* Jan */
	[7]  = 1,	/* Feb */
	[19] = 2,	/* Mar */
	[2]  = 3,	/* Apr */
	[26] = 4,	/* May */
	[3]  = 5,	/* Jun */
	[1]  = 6,	/* Jul */
	[28] = 7,	/* Aug */
	[21] = 8,	/* Sep */
	[23] = 9,	/* Oct */
	[5]  = 10,	/* Nov */
	[8]  = 11	/* Dec */
};
92
/*
 * Day-of-week lookup: hash -> weekday number (Sun = 0 ... Sat = 6).
 *
 * Same idea as the month table, but the hash is built from the first
 * two characters of the name:
 *
 *	index = (day_name[0] & 7) + (day_name[1] & 4)
 *
 * Slots not listed here are zero.
 */
static int day_map[] = {
	[7]  = 0,	/* Sun */
	[9]  = 1,	/* Mon */
	[8]  = 2,	/* Tue */
	[11] = 3,	/* Wed */
	[4]  = 4,	/* Thu */
	[6]  = 5,	/* Fri */
	[3]  = 6	/* Sat */
};
113
/* Field-extraction helpers for the rule actions.
 *
 * All of them work on the cursor `cp' and the result structure `tw'.
 * INIT() points cp at the start of the matched text (yytext).
 *
 * The SET* macros convert the field at cp, store it in tw, and leave
 * cp on the first character after that field.  Be careful with
 * variable-length fields or alpha-num mixes.
 *
 * The SKIP* macros advance cp over characters of one class and stop on
 * the first character outside it.  Correspondingly, the SKIPTO* macros
 * advance until a character of the class is reached.  Every scan also
 * stops at the terminating NUL, so cp never runs past the end of the
 * string when the wanted class is absent.
 *
 * Each macro expands to one do { } while (0) statement.
 */

#define INIT()		do { cp = yytext; } while (0)

/* cp must be on the first letter of the day name. */
#define SETWDAY()	do { \
	tw.tw_wday = day_map[(cp[0] & 7) + (cp[1] & 4)]; \
	tw.tw_flags &= ~TW_SDAY; \
	tw.tw_flags |= TW_SEXP; \
	SKIPA(); \
} while (0)

/* cp must be on the first letter of the month name; the hash is taken
 * from the 2nd and 3rd letters. */
#define SETMON()	do { \
	cp++; \
	tw.tw_mon = month_map[(((unsigned char) cp[0]) + ((unsigned char) cp[1])) & 0x1f]; \
	SKIPA(); \
} while (0)

/* Numeric month: 1-based in the input, 0-based in tw_mon. */
#define SETMON_NUM()	do { \
	tw.tw_mon = atoi(cp) - 1; \
	SKIPD(); \
} while (0)

#define SETYEAR()	do { \
	tw.tw_year = atoi(cp); \
	SKIPD(); \
} while (0)

/* Storing a day of month is what marks the parse as successful. */
#define SETDAY()	do { \
	tw.tw_mday = atoi(cp); \
	tw.tw_flags |= TW_SUCC; \
	SKIPD(); \
} while (0)

/* H:MM or HH:MM with optional :SS.  The first "cp += 2" steps over
 * either a two-digit hour or a one-digit hour plus its ':'; SKIPTOD()
 * then lands on the minutes in both cases. */
#define SETTIME()	do { \
	tw.tw_hour = atoi(cp); \
	cp += 2; \
	SKIPTOD(); \
	tw.tw_min = atoi(cp); \
	cp += 2; \
	if (*cp == ':') { \
		tw.tw_sec = atoi(++cp); \
		SKIPD(); \
	} \
} while (0)

/* x is a signed [H]HMM value; tw_zone is stored in minutes. */
#define SETZONE(x)	do { \
	tw.tw_zone = ((x) / 100) * 60 + (x) % 100; \
	tw.tw_flags |= TW_SZEXP; \
	SKIPD(); \
} while (0)

#define SETDST()	do { tw.tw_flags |= TW_DST; } while (0)

#define SKIPD()		do { \
	while (isdigit((unsigned char) *cp)) \
		cp++; \
} while (0)

#define SKIPTOD()	do { \
	while (*cp != '\0' && !isdigit((unsigned char) *cp)) \
		cp++; \
} while (0)

#define SKIPA()		do { \
	while (isalpha((unsigned char) *cp)) \
		cp++; \
} while (0)

#define SKIPTOA()	do { \
	while (*cp != '\0' && !isalpha((unsigned char) *cp)) \
		cp++; \
} while (0)

#define SKIPSP()	do { \
	while (isspace((unsigned char) *cp)) \
		cp++; \
} while (0)

#define SKIPTOSP()	do { \
	while (*cp != '\0' && !isspace((unsigned char) *cp)) \
		cp++; \
} while (0)
161
162 # ifdef HAVE_SYS_TIME_H
163 # include <sys/time.h>
164 # endif
165 #include <time.h>
166
167 static void
168 zonehack (struct tws *tw)
169 {
170 struct tm *tm;
171
172 if (dmktime (tw) == (time_t) -1)
173 return;
174
175 tm = localtime (&tw->tw_clock);
176 if (tm->tm_isdst) {
177 tw->tw_flags |= TW_DST;
178 tw->tw_zone -= 60;
179 }
180 }
181 %}
182
d	[0-9]
D	[0-9]?[0-9]
w	[ \t]*
W	[ \t]+
nl	[ \t\n()]

sun	[Ss]un(day)?
mon	[Mm]on(day)?
tue	[Tt]ue(sday)?
wed	[Ww]ed(nesday)?
thu	[Tt]hu(rsday)?
fri	[Ff]ri(day)?
sat	[Ss]at(urday)?

DAY	{sun}|{mon}|{tue}|{wed}|{thu}|{fri}|{sat}

jan	[Jj]an(uary)?
feb	[Ff]eb(ruary)?
mar	[Mm]ar(ch)?
apr	[Aa]pr(il)?
may	[Mm]ay
jun	[Jj]une?
jul	[Jj]uly?
aug	[Aa]ug(ust)?
sep	[Ss]ep(tember)?
oct	[Oo]ct(ober)?
nov	[Nn]ov(ember)?
dec	[Dd]ec(ember)?

MONTH	{jan}|{feb}|{mar}|{apr}|{may}|{jun}|{jul}|{aug}|{sep}|{oct}|{nov}|{dec}

TIME	{D}:{d}{d}(:{d}{d})?

 /* A year is written with either 2 or 4 digits.  After Y2K some MUAs
    were found to report the year as 100, hence the middle
    three-digit alternative.  The century for the short forms is
    resolved later, in yyterminate().
 */

YEAR	({d}{d})|(1{d}{d})|({d}{4})
223
224 %%
225 %{
226 /* This section begins the definition of dparsetime().
227 Put here any local variable definitions and initializations */
228
229 YY_BUFFER_STATE lexhandle;
230
231 char *cp;
232 static struct tws tw;
233
234 memset(&tw,0,sizeof(struct tws));
235
236 lexhandle = yy_scan_string(lexstr);
237 %}
238
{DAY}","?{W}{MONTH}{W}{D}{W}{TIME}{W}{YEAR}	{
		/* e.g. "Wed Jan 2 15:04:05 2006" */
		INIT();    SETWDAY();
		SKIPTOA(); SETMON();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETTIME();
		SKIPTOD(); SETYEAR();
		}

{DAY}","?{W}{D}{W}{MONTH}{W}{YEAR}{W}{TIME}	{
		/* e.g. "Wed, 2 Jan 2006 15:04:05" */
		INIT();    SETWDAY();
		SKIPTOD(); SETDAY();
		SKIPTOA(); SETMON();
		SKIPTOD(); SETYEAR();
		SKIPTOD(); SETTIME();
		}
{D}{W}{MONTH}{W}{YEAR}{W}{TIME}			{
		/* e.g. "2 Jan 2006 15:04:05" */
		INIT();    SETDAY();
		SKIPTOA(); SETMON();
		SKIPTOD(); SETYEAR();
		SKIPTOD(); SETTIME();
		}
{DAY}","?{W}{MONTH}{W}{D}","?{W}{YEAR}","?{W}{TIME}	{
		/* e.g. "Wed, Jan 2, 2006, 15:04:05" */
		INIT();    SETWDAY();
		SKIPTOA(); SETMON();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		SKIPTOD(); SETTIME();
		}
{DAY}","?{W}{MONTH}{W}{D}","?{W}{YEAR}		{
		/* e.g. "Wed, Jan 2, 2006" */
		INIT();    SETWDAY();
		SKIPTOA(); SETMON();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		}
{MONTH}{W}{D}","?{W}{YEAR}","?{W}{DAY}		{
		/* e.g. "Jan 2, 2006, Wed" */
		INIT();    SETMON();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		SKIPTOA(); SETWDAY();
		}
{MONTH}{W}{D}","?{W}{YEAR}			{
		/* e.g. "Jan 2, 2006" */
		INIT();    SETMON();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		}
{D}("-"|"/"){D}("-"|"/"){YEAR}{W}{TIME}		{
		/* MM/DD/YY followed by a time, e.g. "01/02/06 15:04" */
		INIT();    SETMON_NUM();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		SKIPTOD(); SETTIME();
		}
{D}("-"|"/"){D}("-"|"/"){YEAR}			{
		/* MM/DD/YY, e.g. "01/02/06" */
		INIT();    SETMON_NUM();
		SKIPTOD(); SETDAY();
		SKIPTOD(); SETYEAR();
		}
334
[Aa][Mm]	{
		/* The pattern is a bare character class: inside double
		   quotes the brackets are literal text and a real
		   "am" is never matched.  12 AM is hour 0. */
		if (tw.tw_hour == 12)
		    tw.tw_hour = 0;
		}
[Pp][Mm]	{
		/* 1 PM .. 11 PM become 13 .. 23; 12 PM stays 12. */
		if (tw.tw_hour < 12)
		    tw.tw_hour += 12;
		}
337
"+"{D}{d}{d}		{
			/* Numeric zone east of UTC, e.g. "+0530". */
			INIT(); SKIPTOD();
			SETZONE(atoi(cp));
			zonehack (&tw);
			yyterminate();
			}
"-"{D}{d}{d}		{
			/* Numeric zone west of UTC, e.g. "-0500". */
			INIT(); SKIPTOD();
			SETZONE(-atoi(cp));
			zonehack (&tw);
			yyterminate();
			}
{nl}("ut"|"UT")		{ INIT(); SETZONE(0); yyterminate(); }
{nl}("gmt"|"GMT")	{ INIT(); SETZONE(0); yyterminate(); }
{nl}("est"|"EST")	{ INIT(); SETZONE(-500); yyterminate(); }
{nl}("edt"|"EDT")	{ INIT(); SETDST(); SETZONE(-500); yyterminate(); }
{nl}("cst"|"CST")	{ INIT(); SETZONE(-600); yyterminate(); }
{nl}("cdt"|"CDT")	{ INIT(); SETDST(); SETZONE(-600); yyterminate(); }
{nl}("mst"|"MST")	{ INIT(); SETZONE(-700); yyterminate(); }
{nl}("mdt"|"MDT")	{ INIT(); SETDST(); SETZONE(-700); yyterminate(); }
{nl}("pst"|"PST")	{ INIT(); SETZONE(-800); yyterminate(); }
{nl}("pdt"|"PDT")	{ INIT(); SETDST(); SETZONE(-800); yyterminate(); }
{nl}("nst"|"NST")	{ INIT(); SETZONE(-330); yyterminate(); }
{nl}("ast"|"AST")	{ INIT(); SETZONE(-400); yyterminate(); }
{nl}("adt"|"ADT")	{ INIT(); SETDST(); SETZONE(-400); yyterminate(); }
{nl}("hst"|"HST")	{ INIT(); SETZONE(-1000); yyterminate(); }
{nl}("hdt"|"HDT")	{ INIT(); SETDST(); SETZONE(-1000); yyterminate(); }
.|\n			;
375
376 %%
/* Exists only so that the scanner's static yyunput() has a caller,
 * which portably silences the "defined but not used" warning.  The
 * price is a few bytes of extra code in the binary; the alternatives
 * were:
 *   - "%option nounput", which is flex-specific
 *   - makefile hackery just to compile dtimep.c with different flags
 */
void
dtimep_yyunput(int c)
{
    unput(c);
}