]>
diplodocus.org Git - nmh/blob - sbr/fmt_compile.c
3 * fmt_compile.c -- "compile" format strings for fmt_scan
5 * This code is Copyright (c) 2002, by the authors of nmh. See the
6 * COPYRIGHT file in the root directory of the nmh distribution for
7 * complete copyright information.
9 * This code compiles the format strings (documented in mh-format(5)) into
10 * an internal form to be later processed by fmt_scan.c.
12 * What happens here is that the format strings are parsed and an array
13 * of struct format structures is returned. Each format structure is
14 * a single operation interpreted by the routines in fmt_scan.c.
16 * There is NOT a one-to-one correspondence between format strings and
17 * format instructions; some functions have side effects that can result
18 * in multiple instructions being generated. The exact list of instructions
19 * generated by a format string can be seen with the nmh fmttest utility.
21 * A list of format instructions can be found in fmt_compile.h.
23 * If you wish to add a new function, you will need to do the following
26 * - Add a new instruction to the list of instructions in fmt_compile.h.
27 * Note that test instructions (starting with FT_IF_S_NULL) have special
28 * handling, so if you are NOT writing a test function then you need
29 * to insert it into the list before that _and_ bump all of the
30 * following instruction numbers.
32 * - Add the function name to the functable[] array below, and write any
33 * special code that your function may require in terms of parsing
34 * (it very well may not need anything).
36 * - Add the code in fmt_scan.c to handle your new function.
38 * - Add code to fmttest.c to display your new function.
40 * - Document the new function in the mh-format(5) man page.
45 #include <h/addrsbr.h>
47 #include <h/fmt_scan.h>
48 #include <h/fmt_compile.h>
52 #ifdef HAVE_SYS_TIME_H
53 # include <sys/time.h>
58 * hash table for deciding if a component is "interesting"
60 static struct comp
*wantcomp
[128];
62 static struct format
*formatvec
; /* array to hold formats */
63 static struct format
*next_fp
; /* next free format slot */
64 static struct format
*fp
; /* current format slot */
65 static struct comp
*cm
; /* most recent comp ref */
66 static struct ftable
*ftbl
; /* most recent func ref */
68 static int infunction
; /* function nesting cnt */
70 extern struct mailname fmt_mnull
;
72 /* Values for ftable->type: the kind of argument a format function expects (see the functable[] entries) */
73 #define TF_COMP 0 /* component expected */
74 #define TF_NUM 1 /* number expected */
75 #define TF_STR 2 /* string expected */
76 #define TF_EXPR 3 /* component or func. expected */
77 #define TF_NONE 4 /* no argument */
78 #define TF_MYBOX 5 /* special - get current user's mbox */
79 #define TF_NOW 6 /* special - get current unix time */
80 #define TF_EXPR_SV 7 /* like expr but save current str reg */
81 #define TF_NOP 8 /* like expr but no result */
82 #define TF_MYNAME 9 /* special - get current name of user */
83 #define TF_MYHOST 10 /* special - get "local" hostname */
84 #define TF_LMBOX 11 /* special - get full local mailbox */
85 #define TF_BOLD 12 /* special - enter terminal bold mode */
86 #define TF_UNDERLN 13 /* special - enter underline mode */
87 #define TF_STNDOUT 14 /* special - enter standout mode */
88 #define TF_RESET 15 /* special - reset terminal modes */
89 #define TF_HASCLR 16 /* special - does the terminal have color? */
90 #define TF_FGCOLR 17 /* special - foreground term color */
91 #define TF_BGCOLR 18 /* special - background term color */
94 /* NB that TFL_PUTS is also used to decide whether the test
95 * in a "%<(function)..." should be a string or numeric one.
97 #define TFL_PUTS 1 /* implicit putstr if top level */
98 #define TFL_PUTN 2 /* implicit putnum if top level */
101 * The functable array maps between the text names of format functions and
102 * the format instructions interpreted by the engine in fmt_scan.c.
104 * The elements of this structure are as follows:
106 * name - The name of the function as seen in the format string. This is
107 * what maps a particular function name into a format instruction.
108 * type - The type of argument this function expects. Those types are
109 * listed above (with the TF_ prefix). This affects what gets
110 * placed in the format instruction (the f_un union). Also,
111 * instructions that require special handling are distinguished
112 * here (TF_MYBOX is one example).
113 * f_type - The instruction corresponding to this function (from the list
115 * extra - Used by some functions to provide extra data to the compiler.
117 * - Providing an alternate instruction to combine a load
118 * and test operation (see do_if()).
119 * - Passed in f_value in the format instruction to provide
120 * extra information for the engine (see FT_LV_DAT handling
122 * - Provide a hint as to preprocessing that is required for
123 * this instruction (see do_name()).
124 * flags - See the definitions for TFL_PUTS & TFL_PUTN above.
128 char *name
; /* function name */
129 char type
; /* argument type */
130 char f_type
; /* fmt type */
131 char extra
; /* arg. type dependent extra info */
135 static struct ftable functable
[] = {
136 { "nonzero", TF_EXPR
, FT_V_NE
, FT_IF_V_NE
, 0 },
137 { "zero", TF_EXPR
, FT_V_EQ
, FT_IF_V_EQ
, 0 },
138 { "eq", TF_NUM
, FT_V_EQ
, FT_IF_V_EQ
, 0 },
139 { "ne", TF_NUM
, FT_V_NE
, FT_IF_V_NE
, 0 },
140 { "gt", TF_NUM
, FT_V_GT
, FT_IF_V_GT
, 0 },
141 { "null", TF_EXPR
, FT_S_NULL
, FT_IF_S_NULL
, 0 },
142 { "nonnull", TF_EXPR
, FT_S_NONNULL
, FT_IF_S
, 0 },
143 { "match", TF_STR
, FT_V_MATCH
, FT_IF_MATCH
, 0 },
144 { "amatch", TF_STR
, FT_V_AMATCH
, FT_IF_AMATCH
, 0 },
146 { "putstr", TF_EXPR
, FT_STR
, 0, 0 },
147 { "putstrf", TF_EXPR
, FT_STRF
, 0, 0 },
148 { "putnum", TF_EXPR
, FT_NUM
, 0, 0 },
149 { "putnumf", TF_EXPR
, FT_NUMF
, 0, 0 },
150 { "putaddr", TF_STR
, FT_PUTADDR
, 0, 0 },
151 { "putlit", TF_EXPR
, FT_STRLIT
, 0, 0 },
152 { "zputlit", TF_EXPR
, FT_STRLITZ
, 0, 0 },
153 { "void", TF_NOP
, 0, 0, 0 },
155 { "comp", TF_COMP
, FT_LS_COMP
, 0, TFL_PUTS
},
156 { "lit", TF_STR
, FT_LS_LIT
, 0, TFL_PUTS
},
157 { "getenv", TF_STR
, FT_LS_GETENV
, 0, TFL_PUTS
},
158 { "profile", TF_STR
, FT_LS_CFIND
, 0, TFL_PUTS
},
159 { "decodecomp", TF_COMP
, FT_LS_DECODECOMP
, 0, TFL_PUTS
},
160 { "decode", TF_EXPR
, FT_LS_DECODE
, 0, TFL_PUTS
},
161 { "trim", TF_EXPR
, FT_LS_TRIM
, 0, 0 },
162 { "kilo", TF_EXPR
, FT_LS_KILO
, 0, TFL_PUTS
},
163 { "kibi", TF_EXPR
, FT_LS_KIBI
, 0, TFL_PUTS
},
164 { "compval", TF_COMP
, FT_LV_COMP
, 0, TFL_PUTN
},
165 { "compflag", TF_COMP
, FT_LV_COMPFLAG
, 0, TFL_PUTN
},
166 { "num", TF_NUM
, FT_LV_LIT
, 0, TFL_PUTN
},
167 { "msg", TF_NONE
, FT_LV_DAT
, 0, TFL_PUTN
},
168 { "cur", TF_NONE
, FT_LV_DAT
, 1, TFL_PUTN
},
169 { "size", TF_NONE
, FT_LV_DAT
, 2, TFL_PUTN
},
170 { "width", TF_NONE
, FT_LV_DAT
, 3, TFL_PUTN
},
171 { "unseen", TF_NONE
, FT_LV_DAT
, 4, TFL_PUTN
},
172 { "dat", TF_NUM
, FT_LV_DAT
, 0, TFL_PUTN
},
173 { "strlen", TF_NONE
, FT_LV_STRLEN
, 0, TFL_PUTN
},
174 { "me", TF_MYBOX
, FT_LS_LIT
, 0, TFL_PUTS
},
175 { "myname", TF_MYNAME
, FT_LS_LIT
, 0, TFL_PUTS
},
176 { "myhost", TF_MYHOST
, FT_LS_LIT
, 0, TFL_PUTS
},
177 { "localmbox", TF_LMBOX
, FT_LS_LIT
, 0, TFL_PUTS
},
178 { "plus", TF_NUM
, FT_LV_PLUS_L
, 0, TFL_PUTN
},
179 { "minus", TF_NUM
, FT_LV_MINUS_L
, 0, TFL_PUTN
},
180 { "multiply", TF_NUM
, FT_LV_MULTIPLY_L
, 0, TFL_PUTN
},
181 { "divide", TF_NUM
, FT_LV_DIVIDE_L
, 0, TFL_PUTN
},
182 { "modulo", TF_NUM
, FT_LV_MODULO_L
, 0, TFL_PUTN
},
183 { "charleft", TF_NONE
, FT_LV_CHAR_LEFT
, 0, TFL_PUTN
},
184 { "timenow", TF_NOW
, FT_LV_LIT
, 0, TFL_PUTN
},
186 { "month", TF_COMP
, FT_LS_MONTH
, FT_PARSEDATE
, TFL_PUTS
},
187 { "lmonth", TF_COMP
, FT_LS_LMONTH
, FT_PARSEDATE
, TFL_PUTS
},
188 { "tzone", TF_COMP
, FT_LS_ZONE
, FT_PARSEDATE
, TFL_PUTS
},
189 { "day", TF_COMP
, FT_LS_DAY
, FT_PARSEDATE
, TFL_PUTS
},
190 { "weekday", TF_COMP
, FT_LS_WEEKDAY
, FT_PARSEDATE
, TFL_PUTS
},
191 { "tws", TF_COMP
, FT_LS_822DATE
, FT_PARSEDATE
, TFL_PUTS
},
192 { "sec", TF_COMP
, FT_LV_SEC
, FT_PARSEDATE
, TFL_PUTN
},
193 { "min", TF_COMP
, FT_LV_MIN
, FT_PARSEDATE
, TFL_PUTN
},
194 { "hour", TF_COMP
, FT_LV_HOUR
, FT_PARSEDATE
, TFL_PUTN
},
195 { "mday", TF_COMP
, FT_LV_MDAY
, FT_PARSEDATE
, TFL_PUTN
},
196 { "mon", TF_COMP
, FT_LV_MON
, FT_PARSEDATE
, TFL_PUTN
},
197 { "year", TF_COMP
, FT_LV_YEAR
, FT_PARSEDATE
, TFL_PUTN
},
198 { "yday", TF_COMP
, FT_LV_YDAY
, FT_PARSEDATE
, TFL_PUTN
},
199 { "wday", TF_COMP
, FT_LV_WDAY
, FT_PARSEDATE
, TFL_PUTN
},
200 { "zone", TF_COMP
, FT_LV_ZONE
, FT_PARSEDATE
, TFL_PUTN
},
201 { "clock", TF_COMP
, FT_LV_CLOCK
, FT_PARSEDATE
, TFL_PUTN
},
202 { "rclock", TF_COMP
, FT_LV_RCLOCK
, FT_PARSEDATE
, TFL_PUTN
},
203 { "sday", TF_COMP
, FT_LV_DAYF
, FT_PARSEDATE
, TFL_PUTN
},
204 { "szone", TF_COMP
, FT_LV_ZONEF
, FT_PARSEDATE
, TFL_PUTN
},
205 { "dst", TF_COMP
, FT_LV_DST
, FT_PARSEDATE
, TFL_PUTN
},
206 { "pretty", TF_COMP
, FT_LS_PRETTY
, FT_PARSEDATE
, TFL_PUTS
},
207 { "nodate", TF_COMP
, FT_LV_COMPFLAG
, FT_PARSEDATE
, TFL_PUTN
},
208 { "date2local", TF_COMP
, FT_LOCALDATE
, FT_PARSEDATE
, 0 },
209 { "date2gmt", TF_COMP
, FT_GMTDATE
, FT_PARSEDATE
, 0 },
211 { "pers", TF_COMP
, FT_LS_PERS
, FT_PARSEADDR
, TFL_PUTS
},
212 { "mbox", TF_COMP
, FT_LS_MBOX
, FT_PARSEADDR
, TFL_PUTS
},
213 { "host", TF_COMP
, FT_LS_HOST
, FT_PARSEADDR
, TFL_PUTS
},
214 { "path", TF_COMP
, FT_LS_PATH
, FT_PARSEADDR
, TFL_PUTS
},
215 { "gname", TF_COMP
, FT_LS_GNAME
, FT_PARSEADDR
, TFL_PUTS
},
216 { "note", TF_COMP
, FT_LS_NOTE
, FT_PARSEADDR
, TFL_PUTS
},
217 { "addr", TF_COMP
, FT_LS_ADDR
, FT_PARSEADDR
, TFL_PUTS
},
218 { "proper", TF_COMP
, FT_LS_822ADDR
, FT_PARSEADDR
, TFL_PUTS
},
219 { "type", TF_COMP
, FT_LV_HOSTTYPE
, FT_PARSEADDR
, TFL_PUTN
},
220 { "ingrp", TF_COMP
, FT_LV_INGRPF
, FT_PARSEADDR
, TFL_PUTN
},
221 { "nohost", TF_COMP
, FT_LV_NOHOSTF
, FT_PARSEADDR
, TFL_PUTN
},
222 { "formataddr", TF_EXPR_SV
,FT_FORMATADDR
, FT_FORMATADDR
, 0 },
223 { "concataddr", TF_EXPR_SV
,FT_CONCATADDR
, FT_FORMATADDR
, 0 },
224 { "friendly", TF_COMP
, FT_LS_FRIENDLY
, FT_PARSEADDR
, TFL_PUTS
},
226 { "mymbox", TF_COMP
, FT_LV_COMPFLAG
, FT_MYMBOX
, TFL_PUTN
},
227 { "getmymbox", TF_COMP
, FT_STR
, FT_GETMYMBOX
, 0 },
228 { "getmyaddr", TF_COMP
, FT_LS_ADDR
, FT_GETMYADDR
, TFL_PUTS
},
230 { "unquote", TF_EXPR
, FT_LS_UNQUOTE
, 0, TFL_PUTS
},
232 { "bold", TF_BOLD
, FT_LS_LIT
, 0, TFL_PUTS
},
233 { "underline", TF_UNDERLN
,FT_LS_LIT
, 0, TFL_PUTS
},
234 { "standout", TF_STNDOUT
,FT_LS_LIT
, 0, TFL_PUTS
},
235 { "resetterm", TF_RESET
, FT_LS_LIT
, 0, TFL_PUTS
},
236 { "hascolor", TF_HASCLR
, FT_LV_LIT
, 0, 0 },
237 { "fgcolor", TF_FGCOLR
, FT_LS_LIT
, 0, TFL_PUTS
},
238 { "bgcolor", TF_BGCOLR
, FT_LS_LIT
, 0, TFL_PUTS
},
244 * A mapping of color names to terminfo color numbers.
246 * There are two sets of terminal-setting codes: 'setaf/setab' (ANSI) and
247 * 'setf/setb'. Different terminals support different capabilities, so
248 * we provide a mapping for both. I'm not crazy about putting numbers
249 * directly in here, but it seems these are well defined by terminfo
250 * so it should be okay.
254 char *colorname
; /* Name of color */
255 int ansinum
; /* The ANSI escape color number */
256 int nonansinum
; /* The non-ANSI escape color number */
259 static struct colormap colortable
[] = {
/*
 * Hash function for component name.  The function should be
 * case independent and probably shouldn't involve a routine
 * call.
 *
 * The result is always in the range 0..126: a 5-bit term (0..31)
 * plus a term masked with 0x5f (0..95).
 *
 * The hash is built from the first three characters of the name, but
 * never reads past the terminating NUL: a character beyond the end of
 * a short (empty or one/two character) name is treated as 0.  This
 * keeps the bucket stable for short names and avoids an out-of-bounds
 * read.  Names of two or more characters hash exactly as before.
 *
 * NOTE: the argument is evaluated several times, so it must not have
 * side effects.
 */
#define CHASH(nm) \
    ((((nm)[0] - ((nm)[0] ? (nm)[1] : 0)) & 0x1f) + \
     ((((nm)[0] && (nm)[1]) ? (nm)[2] : 0) & 0x5f))
280 * Find a component in the hash table.
282 #define FINDCOMP(comp,name) \
283 for (comp = wantcomp[CHASH(name)]; \
284 comp && strcmp(comp->c_name,name); \
285 comp = comp->c_next) \
288 /* Add new component to the hash table */
289 #define NEWCOMP(cm,name) do { \
290 cm = ((struct comp *) mh_xcalloc (1, sizeof (struct comp)));\
291 cm->c_name = getcpy(name);\
295 cm->c_next = wantcomp[i];\
/*
 * Claim the next free format instruction slot: evaluates to the current
 * value of next_fp and then advances next_fp by one.  The macro itself
 * performs no bounds checking.
 */
299 #define NEWFMT (next_fp++)
300 #define NEW(type,fill,wid) do {\
301 fp=NEWFMT; fp->f_type=(type); fp->f_fill=(fill); fp->f_width=(wid); \
304 /* Add (possibly new) component to the hash table */
305 #define ADDC(name) do { \
311 fp->f_flags |= FF_COMPREF; \
/*
 * Instruction-emitting helpers.  Each one starts a new instruction via
 * NEW() (which points the file-static "fp" at the new slot) and then
 * fills in the operand through fp.
 */

/* LV: emit an instruction of the given type (no fill, no width) whose f_value is "value". */
315 #define LV(type, value) do { NEW(type,0,0); fp->f_value = (value); } while (0)
/*
 * LS: emit an instruction of the given type whose f_text is the result of
 * getcpy(str); FF_STRALLOC is set on the instruction to record that f_text
 * came from getcpy().
 */
316 #define LS(type, str) do { NEW(type,0,0); fp->f_text = getcpy(str); fp->f_flags |= FF_STRALLOC; } while (0)
/* PUTCOMP: emit an FT_COMP instruction and attach the named component to it with ADDC(). */
318 #define PUTCOMP(comp) do { NEW(FT_COMP,0,0); ADDC(comp); } while (0)
/* PUTLIT: emit an FT_LIT instruction whose f_text is getcpy(str), flagged FF_STRALLOC. */
319 #define PUTLIT(str) do { NEW(FT_LIT,0,0); fp->f_text = getcpy(str); fp->f_flags |= FF_STRALLOC; } while (0)
/* PUTC: emit an FT_CHAR instruction carrying the single character "c" in f_char. */
320 #define PUTC(c) do { NEW(FT_CHAR,0,0); fp->f_char = (c); } while (0)
/*
 * format_string is set by fmt_compile() to a getcpy() of the caller's
 * format string and is what gets passed to compile(); compile_error()
 * computes the error offset as (cp - format_string).
 */
322 static char *format_string
;
/*
 * usr_fstring is the caller's original format string as passed to
 * fmt_compile().  compile_error() writes into it (terminating it at the
 * error offset and replacing control characters) to build the message.
 */
323 static char *usr_fstring
; /* used by compile_error(), which CERROR invokes */
/*
 * Report a compile error at the current parse position.  This expands to a
 * use of a variable named "cp", so a suitable "cp" must be in scope wherever
 * CERROR is used.
 */
325 #define CERROR(str) compile_error (str, cp)
330 static struct ftable
*lookup(char *);
331 static void compile_error(char *, char *);
332 static char *compile (char *);
333 static char *do_spec(char *);
334 static char *do_name(char *, int);
335 static char *do_func(char *);
336 static char *do_expr (char *, int);
337 static char *do_loop(char *);
338 static char *do_if(char *);
339 static void free_component(struct comp
*);
340 static void free_comptable(void);
343 * Lookup a function name in the functable
345 static struct ftable
*
348 register struct ftable
*t
= functable
;
350 register char c
= *name
;
352 while ((nm
= t
->name
)) {
353 if (*nm
== c
&& strcmp (nm
, name
) == 0)
358 return (struct ftable
*) 0;
363 compile_error(char *str
, char *cp
)
365 int i
, errpos
, errctx
;
367 errpos
= cp
- format_string
;
368 errctx
= errpos
> 20 ? 20 : errpos
;
369 usr_fstring
[errpos
] = '\0';
371 for (i
= errpos
-errctx
; i
< errpos
; i
++) {
372 if (iscntrl((unsigned char) usr_fstring
[i
]))
373 usr_fstring
[i
] = '_';
376 advise(NULL
, "\"%s\": format compile error - %s",
377 &usr_fstring
[errpos
-errctx
], str
);
378 adios (NULL
, "%*s", errctx
+1, "^");
382 * Compile format string "fstring" into format list "fmt".
383 * Return the number of header components found in the format
388 fmt_compile(char *fstring
, struct format
**fmt
, int reset_comptable
)
392 static int comptable_initialized
= 0;
394 format_string
= getcpy (fstring
);
395 usr_fstring
= fstring
;
397 if (reset_comptable
|| !comptable_initialized
) {
399 comptable_initialized
= 1;
402 memset((char *) &fmt_mnull
, 0, sizeof(fmt_mnull
));
404 /* it takes at least 4 char to generate one format so we
405 * allocate a worst-case format array using 1/4 the length
406 * of the format string. We actually need twice this much
407 * to handle both pre-processing (e.g., address parsing) and
410 i
= strlen(fstring
)/2 + 1;
412 next_fp
= formatvec
= (struct format
*)mh_xcalloc ((size_t) i
,
413 sizeof(struct format
));
415 adios (NULL
, "unable to allocate format storage");
419 cp
= compile(format_string
);
421 CERROR("extra '%>', '%|' or '%?'");
423 LV(FT_DONE
, 0); /* really done */
433 register char *cp
= sp
;
438 while ((c
= *cp
) && c
!= '%')
474 case ';': /* comment line */
476 while ((c
= *cp
++) && c
!= '\n')
489 * Process functions & components (handle field width here as well
494 register char *cp
= sp
;
497 register int ljust
= 0;
498 #endif /* not lint */
499 register int wid
= 0;
500 register char fill
= ' ';
512 wid
= wid
*10 + (c
- '0');
518 fp
->f_type
= wid
? FT_COMPF
: FT_COMP
;
523 if (ftbl
->flags
& TFL_PUTS
) {
524 LV( wid
? FT_STRF
: FT_STR
, ftbl
->extra
);
526 else if (ftbl
->flags
& TFL_PUTN
) {
527 LV( wid
? FT_NUMF
: FT_NUM
, ftbl
->extra
);
532 CERROR("component or function name expected");
543 * Process a component name. Normally this involves generating an FT_COMP
544 * instruction for the specified component. If preprocess is set, then we
545 * do some extra processing.
548 do_name(char *sp
, int preprocess
)
550 register char *cp
= sp
;
553 static int primed
= 0;
555 while (isalnum(c
= *cp
++) || c
== '-' || c
== '_')
558 CERROR("'}' expected");
562 switch (preprocess
) {
565 if (cm
->c_type
& CT_ADDR
) {
566 CERROR("component used as both date and address");
569 memset (cm
->c_tws
, 0, sizeof *cm
->c_tws
);
571 cm
->c_tws
= mh_xcalloc (1, sizeof *cm
->c_tws
);
573 fp
->f_type
= preprocess
;
575 cm
->c_type
|= CT_DATE
;
582 ismymbox ((struct mailname
*) 0);
587 if (cm
->c_type
& CT_DATE
) {
588 CERROR("component used as both date and address");
590 cm
->c_mn
= &fmt_mnull
;
591 fp
->f_type
= preprocess
;
593 cm
->c_type
|= CT_ADDR
;
597 if (cm
->c_type
& CT_DATE
) {
598 CERROR("component used as both date and address");
600 cm
->c_type
|= CT_ADDR
;
607 * Generate one or more instructions corresponding to the named function.
608 * The different type of function arguments are handled here.
613 register char *cp
= sp
;
615 register struct ftable
*t
;
617 int mflag
; /* minus sign in NUM */
621 while (isalnum(c
= *cp
++))
623 if (c
!= '(' && c
!= '{' && c
!= ' ' && c
!= ')') {
624 CERROR("'(', '{', ' ' or ')' expected");
627 if ((t
= lookup (sp
)) == 0) {
628 CERROR("unknown function");
637 CERROR("component name expected");
639 cp
= do_name(cp
, t
->extra
);
640 fp
->f_type
= t
->f_type
;
645 if ((mflag
= (c
== '-')))
649 n
= n
*10 + (c
- '0');
659 while (c
&& c
!= ')')
666 LV(t
->f_type
,t
->extra
);
670 LS(t
->f_type
, getusername());
674 LS(t
->f_type
, getfullname());
678 LS(t
->f_type
, LocalName(0));
682 LS(t
->f_type
, getlocalmbox());
686 LS(t
->f_type
, get_term_stringcap("bold"));
690 LS(t
->f_type
, get_term_stringcap("smul"));
694 LS(t
->f_type
, get_term_stringcap("smso"));
698 LS(t
->f_type
, get_term_stringcap("sgr0"));
702 LV(t
->f_type
, get_term_numcap("colors") > 1);
707 struct colormap
*cmap
= colortable
;
711 while (c
&& c
!= ')')
715 while (cmap
->colorname
!= NULL
) {
716 if (strcasecmp(sp
, cmap
->colorname
) == 0)
721 if (cmap
->colorname
== NULL
) {
722 CERROR("Unknown color name");
726 code
= get_term_stringparm(t
->type
== TF_FGCOLR
? "setaf" : "setab",
730 * If this doesn't have anything, try falling back to setf/setb
734 code
= get_term_stringparm(t
->type
== TF_FGCOLR
? "setf" : "setb",
735 cmap
->nonansinum
, 0);
742 LV(t
->f_type
, time((time_t *) 0));
750 cp
= do_expr(cp
, t
->extra
);
758 cp
= do_expr(cp
, t
->extra
);
764 CERROR("')' expected");
771 * Handle an expression as an argument. Basically we call one of do_name(),
772 * do_func(), or do_if()
775 do_expr (char *sp
, int preprocess
)
777 register char *cp
= sp
;
780 if ((c
= *cp
++) == '{') {
781 cp
= do_name (cp
, preprocess
);
782 fp
->f_type
= FT_LS_COMP
;
783 } else if (c
== '(') {
785 } else if (c
== ')') {
787 } else if (c
== '%' && *cp
== '<') {
790 CERROR ("'(', '{', '%<' or ')' expected");
796 * I am guessing this was for some kind of loop statement, which would have
797 * looked like %[ .... %]. It looks like the way this would have worked
798 * is that the format engine would have seen that FT_DONE had a 1 in the
799 * f_un.f_un_value and then decided whether or not to continue the loop.
800 * There is no support for this in the format engine, so right now if
801 * you try using it you will reach the FT_DONE and simply stop. I'm leaving
802 * this here in case someone wants to continue the work.
804 * Okay, got some more information on this from John L. Romine! From an
805 * email he sent to the nmh-workers mailing list on December 2, 2010, he
806 * explains it thusly:
808 * In this case (scan, formatsbr) it has to do with an extension to
809 * the mh-format syntax to allow for looping.
811 * The scan format is processed once for each message. Those #ifdef
812 * JLR changes allowed for the top part of the format file to be
813 * processed once, then a second, looping part to be processed
814 * once per message. As I recall, there were new mh-format escape
815 * sequences to delimit the loop. This would have allowed for things
816 * like per-format column headings in the scan output.
818 * Since existing format files didn't include the scan listing
819 * header (it was hard-coded in scan.c) it would not have been
820 * backward-compatible. All existing format files (including any
821 * local ones) would have needed to be changed to include the format
822 * codes for a header. The practice at the time was not to introduce
823 * incompatible changes in a minor release, and I never managed to
824 * put out a newer major release.
826 * I can see how this would work, and I suspect part of the motivation was
827 * because the format compiler routines (at the time) couldn't really be
828 * called multiple times on the same message because the memory management
829 * was so lousy. That's been reworked and things are now a lot cleaner,
830 * so I suspect if we're going to allow a format string to be used for the
831 * scan header it might be simpler to have a separate format string just
832 * for the header. But I'll leave this code in for now just in case we
833 * decide that we want some kind of looping support.
838 register char *cp
= sp
;
839 struct format
*floop
;
844 CERROR ("']' expected");
846 LV(FT_DONE
, 1); /* not yet done */
848 fp
->f_skip
= floop
- fp
; /* skip backwards */
854 * Handle an if-elsif-endif statement. Note here that the branching
855 * is handled by the f_skip member of the struct format (which is really
856 * just f_width overloaded). This number controls how far to move forward
857 * (or back) in the format instruction array.
862 register char *cp
= sp
;
863 register struct format
*fexpr
,
864 *fif
= (struct format
*)NULL
;
865 register int c
= '<';
868 if (c
== '<') { /* doing an IF */
869 if ((c
= *cp
++) == '{') /*}*/{
871 fp
->f_type
= FT_LS_COMP
;
876 /* see if we can merge the load and the "if" */
877 if (ftbl
->f_type
>= IF_FUNCS
)
878 fp
->f_type
= ftbl
->extra
;
880 /* Put out a string test or a value test depending
881 * on what this function's return type is.
883 if (ftbl
->flags
& TFL_PUTS
) {
891 CERROR("'(' or '{' expected"); /*}*/
895 fexpr
= fp
; /* loc of [ELS]IF */
896 cp
= compile (cp
); /* compile IF TRUE stmts */
898 fif
->f_skip
= next_fp
- fif
;
900 if ((c
= *cp
++) == '|') { /* the last ELSE */
902 fif
= fp
; /* loc of GOTO */
903 fexpr
->f_skip
= next_fp
- fexpr
;
905 fexpr
= (struct format
*)NULL
;/* no extra ENDIF */
907 cp
= compile (cp
); /* compile ELSE stmts */
908 fif
->f_skip
= next_fp
- fif
;
911 else if (c
== '?') { /* another ELSIF */
913 fif
= fp
; /* loc of GOTO */
914 fexpr
->f_skip
= next_fp
- fexpr
;
916 c
= '<'; /* impersonate an IF */
923 CERROR("'>' expected.");
926 if (fexpr
) /* IF ... [ELSIF ...] ENDIF */
927 fexpr
->f_skip
= next_fp
- fexpr
;
933 * Free a set of format instructions.
935 * What we do here is:
937 * - Iterate through the list of format instructions, freeing any references
938 * to allocated memory in each instruction.
939 * - Free component references.
940 * - If requested, reset the component hash table; that will also free any
941 * references to components stored there.
946 fmt_free(struct format
*fmt
, int reset_comptable
)
948 struct format
*fp
= fmt
;
951 while (! (fp
->f_type
== FT_DONE
&& fp
->f_value
== 0)) {
952 if (fp
->f_flags
& FF_STRALLOC
)
954 if (fp
->f_flags
& FF_COMPREF
)
955 free_component(fp
->f_comp
);
966 * Free just the text strings from all of the component hash table entries
970 fmt_freecomptext(void)
975 for (i
= 0; i
< sizeof(wantcomp
)/sizeof(wantcomp
[0]); i
++)
976 for (cm
= wantcomp
[i
]; cm
; cm
= cm
->c_next
)
984 * Find a component in our hash table. This is just a public interface to
985 * the FINDCOMP macro, so we don't have to expose our hash table.
989 fmt_findcomp(char *component
)
993 FINDCOMP(cm
, component
);
999 * Like fmt_findcomp, but case-insensitive.
1003 fmt_findcasecomp(char *component
)
1007 for (cm
= wantcomp
[CHASH(component
)]; cm
; cm
= cm
->c_next
)
1008 if (strcasecmp(component
, cm
->c_name
? cm
->c_name
: "") == 0)
1015 * Add an entry to the component hash table
1017 * Returns true if the component was added, 0 if it already existed.
1022 fmt_addcompentry(char *component
)
1027 FINDCOMP(cm
, component
);
1032 NEWCOMP(cm
, component
);
1035 * ncomp is really meant for fmt_compile() and this function is
1036 * meant to be used outside of it. So decrement it just to be safe
1037 * (internal callers should be using NEWCOMP()).
1046 * Add a string to a component hash table entry.
1048 * Note the special handling for components marked with CT_ADDR. The comments
1049 * in fmt_scan.h explain this in more detail.
1053 fmt_addcomptext(char *component
, char *text
)
1055 int i
, found
= 0, bucket
= CHASH(component
);
1056 struct comp
*cptr
= wantcomp
[bucket
];
1060 if (strcasecmp(component
, cptr
->c_name
? cptr
->c_name
: "") == 0) {
1062 if (! cptr
->c_text
) {
1063 cptr
->c_text
= getcpy(text
);
1065 i
= strlen(cp
= cptr
->c_text
) - 1;
1066 if (cp
[i
] == '\n') {
1067 if (cptr
->c_type
& CT_ADDR
) {
1069 cp
= add(",\n\t", cp
);
1074 cptr
->c_text
= add(text
, cp
);
1077 cptr
= cptr
->c_next
;
1080 return found
? bucket
: -1;
1084 * Append text to a component we've already found. See notes in fmt_scan.h
1085 * for more information.
1089 fmt_appendcomp(int bucket
, char *component
, char *text
)
1094 for (cptr
= wantcomp
[bucket
]; cptr
; cptr
= cptr
->c_next
)
1095 if (strcasecmp(component
, cptr
->c_name
? cptr
->c_name
: "") == 0)
1096 cptr
->c_text
= add(text
, cptr
->c_text
);
1101 * Iterate over our component hash table
1105 fmt_nextcomp(struct comp
*comp
, unsigned int *bucket
)
1110 comp
= comp
->c_next
;
1112 while (comp
== NULL
&& *bucket
< sizeof(wantcomp
)/sizeof(wantcomp
[0])) {
1113 comp
= wantcomp
[(*bucket
)++];
1120 * Free and reset our component hash table
1124 free_comptable(void)
1127 struct comp
*cm
, *cm2
;
1129 for (i
= 0; i
< sizeof(wantcomp
)/sizeof(wantcomp
[0]); i
++) {
1131 while (cm
!= NULL
) {
1143 * Decrement the reference count of a component structure. If it reaches
1148 free_component(struct comp
*cm
)
1150 if (--cm
->c_refcount
<= 0) {
1151 /* Shouldn't ever be NULL, but just in case ... */
1156 if (cm
->c_type
& CT_DATE
)
1158 if (cm
->c_type
& CT_ADDR
&& cm
->c_mn
&& cm
->c_mn
!= &fmt_mnull
)