]> diplodocus.org Git - nmh/blob - sbr/datetime.c
Added mhshow-suffix-text entry.
[nmh] / sbr / datetime.c
1 /*
2 * datetime.c -- functions for manipulating RFC 5545 date-time values
3 *
4 * This code is Copyright (c) 2014, by the authors of nmh.
5 * See the COPYRIGHT file in the root directory of the nmh
6 * distribution for complete copyright information.
7 */
8
9 #include "h/mh.h"
10 #include "h/icalendar.h"
11 #include <h/fmt_scan.h>
12 #include "h/tws.h"
13 #include "h/utils.h"
14
15 /*
16 * This doesn't try to support all of the myriad date-time formats
17 * allowed by RFC 5545. It is only used for viewing date-times,
18 * so that shouldn't be a problem: if a particular format can't
19 * be handled by this code, just present it to the user in its
20 * original form.
21 *
22 * And, this assumes a valid iCalendar input file. E.g., it
23 * doesn't check that each BEGIN has a matching END and vice
24 * versa. That should be done in the parser, though it currently
25 * isn't.
26 */
27
/*
 * Parameters of one VTIMEZONE observance (a STANDARD or DAYLIGHT
 * sub-component).  The string members point at values held elsewhere
 * (load_timezones() stores the content line values directly); they
 * are not copies.
 */
typedef struct tzparams {
    /* TZOFFSETFROM: used to calculate the absolute time at which the
       transition to this observance takes place.  HHmm format. */
    char *offsetfrom;
    /* TZOFFSETTO: the timezone offset from UTC.  HHmm format. */
    char *offsetto;
    /* DTSTART value of the observance. */
    const char *dtstart;
    /* RRULE value of the observance. */
    const char *rrule;

    /* DTSTART in seconds since the epoch.  Only used to check that
       the timezone applies to a date-time, and not always: it is
       left unset when the timezone DTSTART is before the epoch, so
       no comparison is attempted in that case. */
    time_t start_dt;
} tzparams;
43
44 struct tzdesc {
45 char *tzid;
46
47 /* The following are translations of the pieces of RRULE and DTSTART
48 into seconds from beginning of year. */
49 tzparams standard_params;
50 tzparams daylight_params;
51
52 struct tzdesc *next;
53 };
54
55 /*
56 * Parse a datetime of the form YYYYMMDDThhmmss and a string
57 * representation of the timezone in units of [+-]hhmm and load the
58 * struct tws.
59 */
60 static int
61 parse_datetime (const char *datetime, const char *zone, int dst,
62 struct tws *tws) {
63 char utc_indicator;
64 int form_1 = 0;
65 int items_matched;
66
67 memset(tws, 0, sizeof *tws);
68 items_matched =
69 sscanf (datetime, "%4d%2d%2dT%2d%2d%2d%c",
70 &tws->tw_year, &tws->tw_mon, &tws->tw_mday,
71 &tws->tw_hour, &tws->tw_min, &tws->tw_sec,
72 &utc_indicator);
73 tws->tw_flags = TW_NULL;
74
75 if (items_matched == 7) {
76 /* The 'Z' must be capital according to RFC 5545 Sec. 3.3.5. */
77 if (utc_indicator != 'Z') {
78 advise (NULL, "%s has invalid timezone indicator of 0x%x",
79 datetime, utc_indicator);
80 return NOTOK;
81 }
82 } else if (zone == NULL) {
83 form_1 = 1;
84 }
85
86 /* items_matched of 3 is for, e.g., 20151230. Assume that means
87 the entire day. The time fields of the tws struct were
88 initialized to 0 by the memset() above. */
89 if (items_matched >= 6 || items_matched == 3) {
90 int offset = atoi (zone ? zone : "0");
91
92 /* struct tws defines tw_mon over [0, 11]. */
93 --tws->tw_mon;
94
95 /* Fill out rest of tws, i.e., its tw_wday and tw_flags. */
96 set_dotw (tws);
97 /* set_dotw() sets TW_SIMP. Replace that with TW_SEXP so that
98 dasctime() outputs the dotw before the date instead of after. */
99 tws->tw_flags &= ~TW_SDAY, tws->tw_flags |= TW_SEXP;
100
101 /* For the call to dmktime():
102 - don't need tw_yday
103 - tw_clock must be 0 on entry, and is set by dmktime()
104 - the only flag in tw_flags used is TW_DST
105 */
106 tws->tw_yday = tws->tw_clock = 0;
107 tws->tw_zone = 60 * (offset / 100) + offset % 100;
108 if (dst) {
109 tws->tw_zone -= 60; /* per dlocaltime() */
110 tws->tw_flags |= TW_DST;
111 }
112 /* dmktime() just sets tws->tw_clock. */
113 (void) dmktime (tws);
114
115 if (! form_1) {
116 /* Set TW_SZEXP so that dasctime outputs timezone, except
117 with local time (Form #1). */
118 tws->tw_flags |= TW_SZEXP;
119
120 /* Convert UTC time to time in local timezone. However,
121 don't try for years before 1970 because dlocatime()
122 doesn't handle them well. dlocaltime() will succeed if
123 tws->tw_clock is nonzero. */
124 if (tws->tw_year >= 1970 && tws->tw_clock > 0) {
125 const int was_dst = tws->tw_flags & TW_DST;
126
127 *tws = *dlocaltime (&tws->tw_clock);
128 if (was_dst && ! (tws->tw_flags & TW_DST)) {
129 /* dlocaltime() changed the DST flag from 1 to 0,
130 which means the time is in the hour (assumed to
131 be one hour) that is lost in the transition to
132 DST. So per RFC 5545 Sec. 3.3.5, "the
133 DATE-TIME value is interpreted using the UTC
134 offset before the gap in local times." In
135 other words, add an hour to it.
136 No adjustment is necessary for the transition
137 from DST to standard time, because dasctime()
138 shows the first occurrence of the time. */
139 tws->tw_clock += 3600;
140 *tws = *dlocaltime (&tws->tw_clock);
141 }
142 }
143 }
144
145 return OK;
146 }
147
148 return NOTOK;
149 }
150
151 tzdesc_t
152 load_timezones (const contentline *clines) {
153 tzdesc_t timezones = NULL, timezone = NULL;
154 int in_vtimezone, in_standard, in_daylight;
155 tzparams *params = NULL;
156 const contentline *node;
157
158 /* Interpret each VTIMEZONE section. */
159 in_vtimezone = in_standard = in_daylight = 0;
160 for (node = clines; node; node = node->next) {
161 /* node->name will be NULL if the line was "deleted". */
162 if (! node->name) { continue; }
163
164 if (in_daylight || in_standard) {
165 if (! strcasecmp ("END", node->name) &&
166 ((in_standard && ! strcasecmp ("STANDARD", node->value)) ||
167 (in_daylight && ! strcasecmp ("DAYLIGHT", node->value)))) {
168 struct tws tws;
169
170 if (in_standard) { in_standard = 0; }
171 else if (in_daylight) { in_daylight = 0; }
172 if (parse_datetime (params->dtstart, params->offsetfrom,
173 in_daylight ? 1 : 0,
174 &tws) == OK) {
175 if (tws.tw_year >= 1970) {
176 /* dmktime() falls apart for, e.g., the year 1601. */
177 params->start_dt = tws.tw_clock;
178 }
179 } else {
180 advise (NULL, "failed to parse start time %s for %s",
181 params->dtstart,
182 in_standard ? "standard" : "daylight");
183 return NULL;
184 }
185 params = NULL;
186 } else if (! strcasecmp ("DTSTART", node->name)) {
187 /* Save DTSTART for use after getting TZOFFSETFROM. */
188 params->dtstart = node->value;
189 } else if (! strcasecmp ("TZOFFSETFROM", node->name)) {
190 params->offsetfrom = node->value;
191 } else if (! strcasecmp ("TZOFFSETTO", node->name)) {
192 params->offsetto = node->value;
193 } else if (! strcasecmp ("RRULE", node->name)) {
194 params->rrule = node->value;
195 }
196 } else if (in_vtimezone) {
197 if (! strcasecmp ("END", node->name) &&
198 ! strcasecmp ("VTIMEZONE", node->value)) {
199 in_vtimezone = 0;
200 } else if (! strcasecmp ("BEGIN", node->name) &&
201 ! strcasecmp ("STANDARD", node->value)) {
202 in_standard = 1;
203 params = &timezone->standard_params;
204 } else if (! strcasecmp ("BEGIN", node->name) &&
205 ! strcasecmp ("DAYLIGHT", node->value)) {
206 in_daylight = 1;
207 params = &timezone->daylight_params;
208 } else if (! strcasecmp ("TZID", node->name)) {
209 /* See comment below in format_datetime() about removing any enclosing quotes from a
210 timezone identifier. */
211 char *buf = mh_xmalloc(strlen(node->value) + 1);
212 unquote_string(node->value, buf);
213 timezone->tzid = buf;
214 }
215 } else {
216 if (! strcasecmp ("BEGIN", node->name) &&
217 ! strcasecmp ("VTIMEZONE", node->value)) {
218
219 in_vtimezone = 1;
220 NEW0(timezone);
221 if (timezones) {
222 tzdesc_t t;
223
224 for (t = timezones; t && t->next; t = t->next) { continue; }
225 /* The loop terminated at, not after, the last
226 timezones node. */
227 t->next = timezone;
228 } else {
229 timezones = timezone;
230 }
231 }
232 }
233 }
234
235 return timezones;
236 }
237
238 void
239 free_timezones (tzdesc_t timezone) {
240 tzdesc_t next;
241
242 for ( ; timezone; timezone = next) {
243 free (timezone->tzid);
244 next = timezone->next;
245 free (timezone);
246 }
247 }
248
249 /*
250 * Convert time to local timezone, accounting for daylight saving time:
251 * - Detect which type of datetime the node contains:
252 * Form #1: DATE WITH LOCAL TIME
253 * Form #2: DATE WITH UTC TIME
254 * Form #3: DATE WITH LOCAL TIME AND TIME ZONE REFERENCE
255 * - Convert value to local time in seconds since epoch.
256 * - If there's a DST in the timezone, convert its start and end
257 * date-times to local time in seconds, also. Then determine
258 * if the value is between them, and therefore DST. Otherwise, it's
259 * not.
260 * - Format the time value.
261 */
262
263 /*
264 * Given a recurrence rule and year, calculate its time in seconds
265 * from 01 January UTC of the year.
266 */
267 time_t
268 rrule_clock (const char *rrule, const char *starttime, const char *zone,
269 unsigned int year) {
270 time_t clock = 0;
271
272 if (nmh_strcasestr (rrule, "FREQ=YEARLY;INTERVAL=1") ||
273 (nmh_strcasestr (rrule, "FREQ=YEARLY") && nmh_strcasestr(rrule, "INTERVAL") == NULL)) {
274 struct tws *tws;
275 const char *cp;
276 int wday = -1, month = -1;
277 int specific_day = 1; /* BYDAY integer (prefix) */
278 char buf[32];
279 int day;
280
281 if ((cp = nmh_strcasestr (rrule, "BYDAY="))) {
282 cp += 6;
283 /* BYDAY integers must be ASCII. */
284 if (*cp == '+') { ++cp; } /* +n specific day; don't support '-' */
285 else if (*cp == '-') { goto fail; }
286
287 if (isdigit ((unsigned char) *cp)) { specific_day = *cp++ - 0x30; }
288
289 if (! strncasecmp (cp, "SU", 2)) { wday = 0; }
290 else if (! strncasecmp (cp, "MO", 2)) { wday = 1; }
291 else if (! strncasecmp (cp, "TU", 2)) { wday = 2; }
292 else if (! strncasecmp (cp, "WE", 2)) { wday = 3; }
293 else if (! strncasecmp (cp, "TH", 2)) { wday = 4; }
294 else if (! strncasecmp (cp, "FR", 2)) { wday = 5; }
295 else if (! strncasecmp (cp, "SA", 2)) { wday = 6; }
296 }
297 if ((cp = nmh_strcasestr (rrule, "BYMONTH="))) {
298 month = atoi (cp + 8);
299 }
300
301 for (day = 1; day <= 7; ++day) {
302 /* E.g, 11-01-2014 02:00:00-0400 */
303 snprintf (buf, sizeof buf, "%02d-%02d-%04u %.2s:%.2s:%.2s%s",
304 month, day + 7 * (specific_day-1), year,
305 starttime, starttime + 2, starttime + 4,
306 zone ? zone : "0000");
307 if ((tws = dparsetime (buf))) {
308 if (! (tws->tw_flags & (TW_SEXP|TW_SIMP))) { set_dotw (tws); }
309
310 if (tws->tw_wday == wday) {
311 /* Found the day specified in the RRULE. */
312 break;
313 }
314 }
315 }
316
317 if (day <= 7) {
318 clock = tws->tw_clock;
319 }
320 }
321
322 fail:
323 if (clock == 0) {
324 admonish (NULL,
325 "Unsupported RRULE format: %s, assume local timezone",
326 rrule);
327 }
328
329 return clock;
330 }
331
332 char *
333 format_datetime (tzdesc_t timezones, const contentline *node) {
334 param_list *p;
335 char *dt_timezone = NULL;
336 int dst = 0;
337 struct tws tws[2]; /* [standard, daylight] */
338 tzdesc_t tz;
339 char *tp_std, *tp_dst, *tp_dt;
340
341 /* Extract the timezone, if specified (RFC 5545 Sec. 3.3.5 Form #3). */
342 for (p = node->params; p && p->param_name; p = p->next) {
343 if (! strcasecmp (p->param_name, "TZID") && p->values) {
344 /* Remove any enclosing quotes from the timezone identifier. I don't believe that it's
345 legal for it to be quoted, according to RFC 5545 ยง 3.2.19:
346 tzidparam = "TZID" "=" [tzidprefix] paramtext
347 tzidprefix = "/"
348 where paramtext includes SAFE-CHAR, which specifically excludes DQUOTE. But we'll
349 be generous and strip quotes. */
350 char *buf = mh_xmalloc(strlen(p->values->value) + 1);
351 unquote_string(p->values->value, buf);
352 dt_timezone = buf;
353 break;
354 }
355 }
356
357 if (! dt_timezone) {
358 /* Form #1: DATE WITH LOCAL TIME, i.e., no time zone, or
359 Form #2: DATE WITH UTC TIME */
360 if (parse_datetime (node->value, NULL, 0, &tws[0]) == OK) {
361 return strdup (dasctime (&tws[0], 0));
362 }
363 advise (NULL, "unable to parse datetime %s", node->value);
364 return NULL;
365 }
366
367 /*
368 * must be
369 * Form #3: DATE WITH LOCAL TIME AND TIME ZONE REFERENCE
370 */
371
372 /* Find the corresponding tzdesc. */
373 for (tz = timezones; dt_timezone && tz; tz = tz->next) {
374 /* Property parameter values are case insenstive (RFC 5545
375 Sec. 2) and time zone identifiers are property parameters
376 (RFC 5545 Sec. 3.8.2.4), though it would seem odd to use
377 different case in the same file for identifiers that are
378 supposed to be the same. */
379 if (tz->tzid && ! strcasecmp (dt_timezone, tz->tzid)) { break; }
380 }
381
382 if (tz) {
383 free(dt_timezone);
384 } else {
385 advise (NULL, "did not find VTIMEZONE section for %s", dt_timezone);
386 free(dt_timezone);
387 return NULL;
388 }
389
390 /* Determine if it's Daylight Saving. */
391 tp_std = strchr (tz->standard_params.dtstart, 'T');
392 tp_dt = strchr (node->value, 'T');
393
394 if (tz->daylight_params.dtstart) {
395 tp_dst = strchr (tz->daylight_params.dtstart, 'T');
396 } else {
397 /* No DAYLIGHT section. */
398 tp_dst = NULL;
399 dst = 0;
400 }
401
402 if (tp_std && tp_dt) {
403 time_t transition[2] = { 0, 0 }; /* [standard, daylight] */
404 time_t dt[2]; /* [standard, daylight] */
405 unsigned int year;
406 char buf[5];
407
408 /* Datetime is form YYYYMMDDThhmmss. Extract year. */
409 memcpy (buf, node->value, sizeof buf - 1);
410 buf[sizeof buf - 1] = '\0';
411 year = atoi (buf);
412
413 if (tz->standard_params.rrule) {
414 /* +1 to skip the T before the time */
415 transition[0] =
416 rrule_clock (tz->standard_params.rrule, tp_std + 1,
417 tz->standard_params.offsetfrom, year);
418 }
419 if (tp_dst && tz->daylight_params.rrule) {
420 /* +1 to skip the T before the time */
421 transition[1] =
422 rrule_clock (tz->daylight_params.rrule, tp_dst + 1,
423 tz->daylight_params.offsetfrom, year);
424 }
425
426 if (transition[0] < transition[1]) {
427 advise (NULL, "format_datetime() requires that daylight "
428 "saving time transition precede standard time "
429 "transition");
430 return NULL;
431 }
432
433 if (parse_datetime (node->value, tz->standard_params.offsetto,
434 0, &tws[0]) == OK) {
435 dt[0] = tws[0].tw_clock;
436 } else {
437 advise (NULL, "unable to parse datetime %s", node->value);
438 return NULL;
439 }
440
441 if (tp_dst) {
442 if (dt[0] < transition[1]) {
443 dst = 0;
444 } else {
445 if (parse_datetime (node->value,
446 tz->daylight_params.offsetto, 1,
447 &tws[1]) == OK) {
448 dt[1] = tws[1].tw_clock;
449 } else {
450 advise (NULL, "unable to parse datetime %s",
451 node->value);
452 return NULL;
453 }
454
455 dst = dt[1] > transition[0] ? 0 : 1;
456 }
457 }
458
459 if (dst) {
460 if (tz->daylight_params.start_dt > 0 &&
461 dt[dst] < tz->daylight_params.start_dt) {
462 advise (NULL, "date-time of %s is before VTIMEZONE start "
463 "of %s", node->value,
464 tz->daylight_params.dtstart);
465 return NULL;
466 }
467 } else {
468 if (tz->standard_params.start_dt > 0 &&
469 dt[dst] < tz->standard_params.start_dt) {
470 advise (NULL, "date-time of %s is before VTIMEZONE start "
471 "of %s", node->value,
472 tz->standard_params.dtstart);
473 return NULL;
474 }
475 }
476 } else {
477 if (! tp_std) {
478 advise (NULL, "unsupported date-time format: %s",
479 tz->standard_params.dtstart);
480 return NULL;
481 }
482 if (! tp_dt) {
483 advise (NULL, "unsupported date-time format: %s", node->value);
484 return NULL;
485 }
486 }
487
488 return strdup (dasctime (&tws[dst], 0));
489 }