File: | src/usr.bin/mandoc/eqn.c |
Warning: | line 527, column 22 Access to field 'next' results in a dereference of a null pointer (loaded from field 'last') |
Press '?' to see keyboard shortcuts
Keyboard shortcuts:
1 | /* $OpenBSD: eqn.c,v 1.49 2022/12/26 19:16:02 jmc Exp $ */ | |||
2 | /* | |||
3 | * Copyright (c) 2014, 2015, 2017, 2018, 2020, 2022 | |||
4 | * Ingo Schwarze <schwarze@openbsd.org> | |||
5 | * Copyright (c) 2011, 2014 Kristaps Dzonsons <kristaps@bsd.lv> | |||
6 | * | |||
7 | * Permission to use, copy, modify, and distribute this software for any | |||
8 | * purpose with or without fee is hereby granted, provided that the above | |||
9 | * copyright notice and this permission notice appear in all copies. | |||
10 | * | |||
11 | * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES | |||
12 | * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF | |||
13 | * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR | |||
14 | * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES | |||
15 | * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN | |||
16 | * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF | |||
17 | * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. | |||
18 | */ | |||
19 | #include <sys/types.h> | |||
20 | ||||
21 | #include <assert.h> | |||
22 | #include <ctype.h> | |||
23 | #include <limits.h> | |||
24 | #include <stdio.h> | |||
25 | #include <stdlib.h> | |||
26 | #include <string.h> | |||
27 | #include <time.h> | |||
28 | ||||
29 | #include "mandoc_aux.h" | |||
30 | #include "mandoc.h" | |||
31 | #include "roff.h" | |||
32 | #include "eqn.h" | |||
33 | #include "libmandoc.h" | |||
34 | #include "eqn_parse.h" | |||
35 | ||||
36 | #define EQN_NEST_MAX128 128 /* maximum nesting of defines */ | |||
37 | #define STRNEQ(p1, sz1, p2, sz2)((sz1) == (sz2) && 0 == strncmp((p1), (p2), (sz1))) \ | |||
38 | ((sz1) == (sz2) && 0 == strncmp((p1), (p2), (sz1))) | |||
39 | ||||
40 | enum eqn_tok { | |||
41 | EQN_TOK_DYAD = 0, | |||
42 | EQN_TOK_VEC, | |||
43 | EQN_TOK_UNDER, | |||
44 | EQN_TOK_BAR, | |||
45 | EQN_TOK_TILDE, | |||
46 | EQN_TOK_HAT, | |||
47 | EQN_TOK_DOT, | |||
48 | EQN_TOK_DOTDOT, | |||
49 | EQN_TOK_FWD, | |||
50 | EQN_TOK_BACK, | |||
51 | EQN_TOK_DOWN, | |||
52 | EQN_TOK_UP, | |||
53 | EQN_TOK_FAT, | |||
54 | EQN_TOK_ROMAN, | |||
55 | EQN_TOK_ITALIC, | |||
56 | EQN_TOK_BOLD, | |||
57 | EQN_TOK_SIZE, | |||
58 | EQN_TOK_SUB, | |||
59 | EQN_TOK_SUP, | |||
60 | EQN_TOK_SQRT, | |||
61 | EQN_TOK_OVER, | |||
62 | EQN_TOK_FROM, | |||
63 | EQN_TOK_TO, | |||
64 | EQN_TOK_BRACE_OPEN, | |||
65 | EQN_TOK_BRACE_CLOSE, | |||
66 | EQN_TOK_GSIZE, | |||
67 | EQN_TOK_GFONT, | |||
68 | EQN_TOK_MARK, | |||
69 | EQN_TOK_LINEUP, | |||
70 | EQN_TOK_LEFT, | |||
71 | EQN_TOK_RIGHT, | |||
72 | EQN_TOK_PILE, | |||
73 | EQN_TOK_LPILE, | |||
74 | EQN_TOK_RPILE, | |||
75 | EQN_TOK_CPILE, | |||
76 | EQN_TOK_MATRIX, | |||
77 | EQN_TOK_CCOL, | |||
78 | EQN_TOK_LCOL, | |||
79 | EQN_TOK_RCOL, | |||
80 | EQN_TOK_DELIM, | |||
81 | EQN_TOK_DEFINE, | |||
82 | EQN_TOK_TDEFINE, | |||
83 | EQN_TOK_NDEFINE, | |||
84 | EQN_TOK_UNDEF, | |||
85 | EQN_TOK_ABOVE, | |||
86 | EQN_TOK__MAX, | |||
87 | EQN_TOK_FUNC, | |||
88 | EQN_TOK_QUOTED, | |||
89 | EQN_TOK_SYM, | |||
90 | EQN_TOK_EOF | |||
91 | }; | |||
92 | ||||
93 | static const char *eqn_toks[EQN_TOK__MAX] = { | |||
94 | "dyad", /* EQN_TOK_DYAD */ | |||
95 | "vec", /* EQN_TOK_VEC */ | |||
96 | "under", /* EQN_TOK_UNDER */ | |||
97 | "bar", /* EQN_TOK_BAR */ | |||
98 | "tilde", /* EQN_TOK_TILDE */ | |||
99 | "hat", /* EQN_TOK_HAT */ | |||
100 | "dot", /* EQN_TOK_DOT */ | |||
101 | "dotdot", /* EQN_TOK_DOTDOT */ | |||
102 | "fwd", /* EQN_TOK_FWD * */ | |||
103 | "back", /* EQN_TOK_BACK */ | |||
104 | "down", /* EQN_TOK_DOWN */ | |||
105 | "up", /* EQN_TOK_UP */ | |||
106 | "fat", /* EQN_TOK_FAT */ | |||
107 | "roman", /* EQN_TOK_ROMAN */ | |||
108 | "italic", /* EQN_TOK_ITALIC */ | |||
109 | "bold", /* EQN_TOK_BOLD */ | |||
110 | "size", /* EQN_TOK_SIZE */ | |||
111 | "sub", /* EQN_TOK_SUB */ | |||
112 | "sup", /* EQN_TOK_SUP */ | |||
113 | "sqrt", /* EQN_TOK_SQRT */ | |||
114 | "over", /* EQN_TOK_OVER */ | |||
115 | "from", /* EQN_TOK_FROM */ | |||
116 | "to", /* EQN_TOK_TO */ | |||
117 | "{", /* EQN_TOK_BRACE_OPEN */ | |||
118 | "}", /* EQN_TOK_BRACE_CLOSE */ | |||
119 | "gsize", /* EQN_TOK_GSIZE */ | |||
120 | "gfont", /* EQN_TOK_GFONT */ | |||
121 | "mark", /* EQN_TOK_MARK */ | |||
122 | "lineup", /* EQN_TOK_LINEUP */ | |||
123 | "left", /* EQN_TOK_LEFT */ | |||
124 | "right", /* EQN_TOK_RIGHT */ | |||
125 | "pile", /* EQN_TOK_PILE */ | |||
126 | "lpile", /* EQN_TOK_LPILE */ | |||
127 | "rpile", /* EQN_TOK_RPILE */ | |||
128 | "cpile", /* EQN_TOK_CPILE */ | |||
129 | "matrix", /* EQN_TOK_MATRIX */ | |||
130 | "ccol", /* EQN_TOK_CCOL */ | |||
131 | "lcol", /* EQN_TOK_LCOL */ | |||
132 | "rcol", /* EQN_TOK_RCOL */ | |||
133 | "delim", /* EQN_TOK_DELIM */ | |||
134 | "define", /* EQN_TOK_DEFINE */ | |||
135 | "tdefine", /* EQN_TOK_TDEFINE */ | |||
136 | "ndefine", /* EQN_TOK_NDEFINE */ | |||
137 | "undef", /* EQN_TOK_UNDEF */ | |||
138 | "above", /* EQN_TOK_ABOVE */ | |||
139 | }; | |||
140 | ||||
141 | static const char *const eqn_func[] = { | |||
142 | "acos", "acsc", "and", "arc", "asec", "asin", "atan", | |||
143 | "cos", "cosh", "coth", "csc", "det", "exp", "for", | |||
144 | "if", "lim", "ln", "log", "max", "min", | |||
145 | "sec", "sin", "sinh", "tan", "tanh", "Im", "Re", | |||
146 | }; | |||
147 | ||||
148 | enum eqn_symt { | |||
149 | EQNSYM_alpha = 0, | |||
150 | EQNSYM_beta, | |||
151 | EQNSYM_chi, | |||
152 | EQNSYM_delta, | |||
153 | EQNSYM_epsilon, | |||
154 | EQNSYM_eta, | |||
155 | EQNSYM_gamma, | |||
156 | EQNSYM_iota, | |||
157 | EQNSYM_kappa, | |||
158 | EQNSYM_lambda, | |||
159 | EQNSYM_mu, | |||
160 | EQNSYM_nu, | |||
161 | EQNSYM_omega, | |||
162 | EQNSYM_omicron, | |||
163 | EQNSYM_phi, | |||
164 | EQNSYM_pi, | |||
165 | EQNSYM_ps, | |||
166 | EQNSYM_rho, | |||
167 | EQNSYM_sigma, | |||
168 | EQNSYM_tau, | |||
169 | EQNSYM_theta, | |||
170 | EQNSYM_upsilon, | |||
171 | EQNSYM_xi, | |||
172 | EQNSYM_zeta, | |||
173 | EQNSYM_DELTA, | |||
174 | EQNSYM_GAMMA, | |||
175 | EQNSYM_LAMBDA, | |||
176 | EQNSYM_OMEGA, | |||
177 | EQNSYM_PHI, | |||
178 | EQNSYM_PI, | |||
179 | EQNSYM_PSI, | |||
180 | EQNSYM_SIGMA, | |||
181 | EQNSYM_THETA, | |||
182 | EQNSYM_UPSILON, | |||
183 | EQNSYM_XI, | |||
184 | EQNSYM_inter, | |||
185 | EQNSYM_union, | |||
186 | EQNSYM_prod, | |||
187 | EQNSYM_int, | |||
188 | EQNSYM_sum, | |||
189 | EQNSYM_grad, | |||
190 | EQNSYM_del, | |||
191 | EQNSYM_times, | |||
192 | EQNSYM_cdot, | |||
193 | EQNSYM_nothing, | |||
194 | EQNSYM_approx, | |||
195 | EQNSYM_prime, | |||
196 | EQNSYM_half, | |||
197 | EQNSYM_partial, | |||
198 | EQNSYM_inf, | |||
199 | EQNSYM_muchgreat, | |||
200 | EQNSYM_muchless, | |||
201 | EQNSYM_larrow, | |||
202 | EQNSYM_rarrow, | |||
203 | EQNSYM_pm, | |||
204 | EQNSYM_nequal, | |||
205 | EQNSYM_equiv, | |||
206 | EQNSYM_lessequal, | |||
207 | EQNSYM_moreequal, | |||
208 | EQNSYM_minus, | |||
209 | EQNSYM__MAX | |||
210 | }; | |||
211 | ||||
212 | struct eqnsym { | |||
213 | const char *str; | |||
214 | const char *sym; | |||
215 | }; | |||
216 | ||||
217 | static const struct eqnsym eqnsyms[EQNSYM__MAX] = { | |||
218 | { "alpha", "*a" }, /* EQNSYM_alpha */ | |||
219 | { "beta", "*b" }, /* EQNSYM_beta */ | |||
220 | { "chi", "*x" }, /* EQNSYM_chi */ | |||
221 | { "delta", "*d" }, /* EQNSYM_delta */ | |||
222 | { "epsilon", "*e" }, /* EQNSYM_epsilon */ | |||
223 | { "eta", "*y" }, /* EQNSYM_eta */ | |||
224 | { "gamma", "*g" }, /* EQNSYM_gamma */ | |||
225 | { "iota", "*i" }, /* EQNSYM_iota */ | |||
226 | { "kappa", "*k" }, /* EQNSYM_kappa */ | |||
227 | { "lambda", "*l" }, /* EQNSYM_lambda */ | |||
228 | { "mu", "*m" }, /* EQNSYM_mu */ | |||
229 | { "nu", "*n" }, /* EQNSYM_nu */ | |||
230 | { "omega", "*w" }, /* EQNSYM_omega */ | |||
231 | { "omicron", "*o" }, /* EQNSYM_omicron */ | |||
232 | { "phi", "*f" }, /* EQNSYM_phi */ | |||
233 | { "pi", "*p" }, /* EQNSYM_pi */ | |||
234 | { "psi", "*q" }, /* EQNSYM_psi */ | |||
235 | { "rho", "*r" }, /* EQNSYM_rho */ | |||
236 | { "sigma", "*s" }, /* EQNSYM_sigma */ | |||
237 | { "tau", "*t" }, /* EQNSYM_tau */ | |||
238 | { "theta", "*h" }, /* EQNSYM_theta */ | |||
239 | { "upsilon", "*u" }, /* EQNSYM_upsilon */ | |||
240 | { "xi", "*c" }, /* EQNSYM_xi */ | |||
241 | { "zeta", "*z" }, /* EQNSYM_zeta */ | |||
242 | { "DELTA", "*D" }, /* EQNSYM_DELTA */ | |||
243 | { "GAMMA", "*G" }, /* EQNSYM_GAMMA */ | |||
244 | { "LAMBDA", "*L" }, /* EQNSYM_LAMBDA */ | |||
245 | { "OMEGA", "*W" }, /* EQNSYM_OMEGA */ | |||
246 | { "PHI", "*F" }, /* EQNSYM_PHI */ | |||
247 | { "PI", "*P" }, /* EQNSYM_PI */ | |||
248 | { "PSI", "*Q" }, /* EQNSYM_PSI */ | |||
249 | { "SIGMA", "*S" }, /* EQNSYM_SIGMA */ | |||
250 | { "THETA", "*H" }, /* EQNSYM_THETA */ | |||
251 | { "UPSILON", "*U" }, /* EQNSYM_UPSILON */ | |||
252 | { "XI", "*C" }, /* EQNSYM_XI */ | |||
253 | { "inter", "ca" }, /* EQNSYM_inter */ | |||
254 | { "union", "cu" }, /* EQNSYM_union */ | |||
255 | { "prod", "product" }, /* EQNSYM_prod */ | |||
256 | { "int", "integral" }, /* EQNSYM_int */ | |||
257 | { "sum", "sum" }, /* EQNSYM_sum */ | |||
258 | { "grad", "gr" }, /* EQNSYM_grad */ | |||
259 | { "del", "gr" }, /* EQNSYM_del */ | |||
260 | { "times", "mu" }, /* EQNSYM_times */ | |||
261 | { "cdot", "pc" }, /* EQNSYM_cdot */ | |||
262 | { "nothing", "&" }, /* EQNSYM_nothing */ | |||
263 | { "approx", "~~" }, /* EQNSYM_approx */ | |||
264 | { "prime", "fm" }, /* EQNSYM_prime */ | |||
265 | { "half", "12" }, /* EQNSYM_half */ | |||
266 | { "partial", "pd" }, /* EQNSYM_partial */ | |||
267 | { "inf", "if" }, /* EQNSYM_inf */ | |||
268 | { ">>", ">>" }, /* EQNSYM_muchgreat */ | |||
269 | { "<<", "<<" }, /* EQNSYM_muchless */ | |||
270 | { "<-", "<-" }, /* EQNSYM_larrow */ | |||
271 | { "->", "->" }, /* EQNSYM_rarrow */ | |||
272 | { "+-", "+-" }, /* EQNSYM_pm */ | |||
273 | { "!=", "!=" }, /* EQNSYM_nequal */ | |||
274 | { "==", "==" }, /* EQNSYM_equiv */ | |||
275 | { "<=", "<=" }, /* EQNSYM_lessequal */ | |||
276 | { ">=", ">=" }, /* EQNSYM_moreequal */ | |||
277 | { "-", "mi" }, /* EQNSYM_minus */ | |||
278 | }; | |||
279 | ||||
280 | enum parse_mode { | |||
281 | MODE_QUOTED, | |||
282 | MODE_NOSUB, | |||
283 | MODE_SUB, | |||
284 | MODE_TOK | |||
285 | }; | |||
286 | ||||
287 | struct eqn_def { | |||
288 | char *key; | |||
289 | size_t keysz; | |||
290 | char *val; | |||
291 | size_t valsz; | |||
292 | }; | |||
293 | ||||
294 | static struct eqn_box *eqn_box_alloc(struct eqn_node *, struct eqn_box *); | |||
295 | static struct eqn_box *eqn_box_makebinary(struct eqn_node *, | |||
296 | struct eqn_box *); | |||
297 | static void eqn_def(struct eqn_node *); | |||
298 | static struct eqn_def *eqn_def_find(struct eqn_node *); | |||
299 | static void eqn_delim(struct eqn_node *); | |||
300 | static enum eqn_tok eqn_next(struct eqn_node *, enum parse_mode); | |||
301 | static void eqn_undef(struct eqn_node *); | |||
302 | ||||
303 | ||||
304 | struct eqn_node * | |||
305 | eqn_alloc(void) | |||
306 | { | |||
307 | struct eqn_node *ep; | |||
308 | ||||
309 | ep = mandoc_calloc(1, sizeof(*ep)); | |||
310 | ep->gsize = EQN_DEFSIZE(-0x7fffffff-1); | |||
311 | return ep; | |||
312 | } | |||
313 | ||||
314 | void | |||
315 | eqn_reset(struct eqn_node *ep) | |||
316 | { | |||
317 | free(ep->data); | |||
318 | ep->data = ep->start = ep->end = NULL((void *)0); | |||
319 | ep->sz = ep->toksz = 0; | |||
320 | } | |||
321 | ||||
322 | void | |||
323 | eqn_read(struct eqn_node *ep, const char *p) | |||
324 | { | |||
325 | char *cp; | |||
326 | ||||
327 | if (ep->data == NULL((void *)0)) { | |||
328 | ep->sz = strlen(p); | |||
329 | ep->data = mandoc_strdup(p); | |||
330 | } else { | |||
331 | ep->sz = mandoc_asprintf(&cp, "%s %s", ep->data, p); | |||
332 | free(ep->data); | |||
333 | ep->data = cp; | |||
334 | } | |||
335 | ep->sz += 1; | |||
336 | } | |||
337 | ||||
338 | /* | |||
339 | * Find the key "key" of the give size within our eqn-defined values. | |||
340 | */ | |||
341 | static struct eqn_def * | |||
342 | eqn_def_find(struct eqn_node *ep) | |||
343 | { | |||
344 | int i; | |||
345 | ||||
346 | for (i = 0; i < (int)ep->defsz; i++) | |||
347 | if (ep->defs[i].keysz && STRNEQ(ep->defs[i].key,((ep->defs[i].keysz) == (ep->toksz) && 0 == strncmp ((ep->defs[i].key), (ep->start), (ep->defs[i].keysz) )) | |||
348 | ep->defs[i].keysz, ep->start, ep->toksz)((ep->defs[i].keysz) == (ep->toksz) && 0 == strncmp ((ep->defs[i].key), (ep->start), (ep->defs[i].keysz) ))) | |||
349 | return &ep->defs[i]; | |||
350 | ||||
351 | return NULL((void *)0); | |||
352 | } | |||
353 | ||||
354 | /* | |||
355 | * Parse a token from the input text. The modes are: | |||
356 | * MODE_QUOTED: Use *ep->start as the delimiter; the token ends | |||
357 | * before its next occurrence. Do not interpret the token in any | |||
358 | * way and return EQN_TOK_QUOTED. All other modes behave like | |||
359 | * MODE_QUOTED when *ep->start is '"'. | |||
360 | * MODE_NOSUB: If *ep->start is a curly brace, the token ends after it; | |||
361 | * otherwise, it ends before the next whitespace or brace. | |||
362 | * Do not interpret the token and return EQN_TOK__MAX. | |||
363 | * MODE_SUB: Like MODE_NOSUB, but try to interpret the token as an | |||
364 | * alias created with define. If it is an alias, replace it with | |||
365 | * its string value and reparse. | |||
366 | * MODE_TOK: Like MODE_SUB, but also check the token against the list | |||
367 | * of tokens, and if there is a match, return that token. Otherwise, | |||
368 | * if the token matches a symbol, return EQN_TOK_SYM; if it matches | |||
369 | * a function name, EQN_TOK_FUNC, or else EQN_TOK__MAX. Except for | |||
370 | * a token match, *ep->start is set to an allocated string that the | |||
371 | * caller is expected to free. | |||
372 | * All modes skip whitespace following the end of the token. | |||
373 | */ | |||
374 | static enum eqn_tok | |||
375 | eqn_next(struct eqn_node *ep, enum parse_mode mode) | |||
376 | { | |||
377 | struct eqn_def *def; | |||
378 | size_t start; | |||
379 | int diff, i, newlen, quoted; | |||
380 | enum eqn_tok tok; | |||
381 | ||||
382 | /* | |||
383 | * Reset the recursion counter after advancing | |||
384 | * beyond the end of the rightmost substitution. | |||
385 | */ | |||
386 | if (ep->end - ep->data >= ep->sublen) | |||
387 | ep->subcnt = 0; | |||
388 | ||||
389 | ep->start = ep->end; | |||
390 | quoted = mode == MODE_QUOTED; | |||
391 | for (;;) { | |||
392 | switch (*ep->start) { | |||
393 | case '\0': | |||
394 | ep->toksz = 0; | |||
395 | return EQN_TOK_EOF; | |||
396 | case '"': | |||
397 | quoted = 1; | |||
398 | break; | |||
399 | case ' ': | |||
400 | case '\t': | |||
401 | case '~': | |||
402 | case '^': | |||
403 | if (quoted) | |||
404 | break; | |||
405 | ep->start++; | |||
406 | continue; | |||
407 | default: | |||
408 | break; | |||
409 | } | |||
410 | if (quoted) { | |||
411 | ep->end = strchr(ep->start + 1, *ep->start); | |||
412 | ep->start++; /* Skip opening quote. */ | |||
413 | if (ep->end == NULL((void *)0)) { | |||
414 | mandoc_msg(MANDOCERR_ARG_QUOTE, | |||
415 | ep->node->line, ep->node->pos, NULL((void *)0)); | |||
416 | ep->end = strchr(ep->start, '\0'); | |||
417 | } | |||
418 | } else { | |||
419 | ep->end = ep->start + 1; | |||
420 | if (*ep->start != '{' && *ep->start != '}') | |||
421 | ep->end += strcspn(ep->end, " ^~\"{}\t"); | |||
422 | } | |||
423 | ep->toksz = ep->end - ep->start; | |||
424 | if (quoted && *ep->end != '\0') | |||
425 | ep->end++; /* Skip closing quote. */ | |||
426 | while (*ep->end != '\0' && strchr(" \t^~", *ep->end) != NULL((void *)0)) | |||
427 | ep->end++; | |||
428 | if (quoted) /* Cannot return, may have to strndup. */ | |||
429 | break; | |||
430 | if (mode == MODE_NOSUB) | |||
431 | return EQN_TOK__MAX; | |||
432 | if ((def = eqn_def_find(ep)) == NULL((void *)0)) | |||
433 | break; | |||
434 | if (++ep->subcnt > EQN_NEST_MAX128) { | |||
435 | mandoc_msg(MANDOCERR_ROFFLOOP, | |||
436 | ep->node->line, ep->node->pos, NULL((void *)0)); | |||
437 | break; | |||
438 | } | |||
439 | ||||
440 | /* Replace a defined name with its string value. */ | |||
441 | if ((diff = def->valsz - ep->toksz) > 0) { | |||
442 | start = ep->start - ep->data; | |||
443 | ep->sz += diff; | |||
444 | ep->data = mandoc_realloc(ep->data, ep->sz + 1); | |||
445 | ep->start = ep->data + start; | |||
446 | ep->sublen += diff; | |||
447 | } | |||
448 | if (diff) | |||
449 | memmove(ep->start + def->valsz, ep->start + ep->toksz, | |||
450 | strlen(ep->start + ep->toksz) + 1); | |||
451 | memcpy(ep->start, def->val, def->valsz); | |||
452 | newlen = ep->start - ep->data + def->valsz; | |||
453 | if (ep->sublen < newlen) | |||
454 | ep->sublen = newlen; | |||
455 | } | |||
456 | if (mode != MODE_TOK) | |||
457 | return quoted ? EQN_TOK_QUOTED : EQN_TOK__MAX; | |||
458 | if (quoted) { | |||
459 | ep->start = mandoc_strndup(ep->start, ep->toksz); | |||
460 | return EQN_TOK_QUOTED; | |||
461 | } | |||
462 | for (tok = 0; tok < EQN_TOK__MAX; tok++) | |||
463 | if (STRNEQ(ep->start, ep->toksz,((ep->toksz) == (strlen(eqn_toks[tok])) && 0 == strncmp ((ep->start), (eqn_toks[tok]), (ep->toksz))) | |||
464 | eqn_toks[tok], strlen(eqn_toks[tok]))((ep->toksz) == (strlen(eqn_toks[tok])) && 0 == strncmp ((ep->start), (eqn_toks[tok]), (ep->toksz)))) | |||
465 | return tok; | |||
466 | ||||
467 | for (i = 0; i < EQNSYM__MAX; i++) { | |||
468 | if (STRNEQ(ep->start, ep->toksz,((ep->toksz) == (strlen(eqnsyms[i].str)) && 0 == strncmp ((ep->start), (eqnsyms[i].str), (ep->toksz))) | |||
469 | eqnsyms[i].str, strlen(eqnsyms[i].str))((ep->toksz) == (strlen(eqnsyms[i].str)) && 0 == strncmp ((ep->start), (eqnsyms[i].str), (ep->toksz)))) { | |||
470 | mandoc_asprintf(&ep->start, | |||
471 | "\\[%s]", eqnsyms[i].sym); | |||
472 | return EQN_TOK_SYM; | |||
473 | } | |||
474 | } | |||
475 | ep->start = mandoc_strndup(ep->start, ep->toksz); | |||
476 | for (i = 0; i < (int)(sizeof(eqn_func)/sizeof(*eqn_func)); i++) | |||
477 | if (STRNEQ(ep->start, ep->toksz,((ep->toksz) == (strlen(eqn_func[i])) && 0 == strncmp ((ep->start), (eqn_func[i]), (ep->toksz))) | |||
478 | eqn_func[i], strlen(eqn_func[i]))((ep->toksz) == (strlen(eqn_func[i])) && 0 == strncmp ((ep->start), (eqn_func[i]), (ep->toksz)))) | |||
479 | return EQN_TOK_FUNC; | |||
480 | return EQN_TOK__MAX; | |||
481 | } | |||
482 | ||||
483 | void | |||
484 | eqn_box_free(struct eqn_box *bp) | |||
485 | { | |||
486 | if (bp == NULL((void *)0)) | |||
487 | return; | |||
488 | ||||
489 | if (bp->first) | |||
490 | eqn_box_free(bp->first); | |||
491 | if (bp->next) | |||
492 | eqn_box_free(bp->next); | |||
493 | ||||
494 | free(bp->text); | |||
495 | free(bp->left); | |||
496 | free(bp->right); | |||
497 | free(bp->top); | |||
498 | free(bp->bottom); | |||
499 | free(bp); | |||
500 | } | |||
501 | ||||
502 | struct eqn_box * | |||
503 | eqn_box_new(void) | |||
504 | { | |||
505 | struct eqn_box *bp; | |||
506 | ||||
507 | bp = mandoc_calloc(1, sizeof(*bp)); | |||
508 | bp->expectargs = UINT_MAX0xffffffffU; | |||
509 | return bp; | |||
510 | } | |||
511 | ||||
512 | /* | |||
513 | * Allocate a box as the last child of the parent node. | |||
514 | */ | |||
515 | static struct eqn_box * | |||
516 | eqn_box_alloc(struct eqn_node *ep, struct eqn_box *parent) | |||
517 | { | |||
518 | struct eqn_box *bp; | |||
519 | ||||
520 | bp = eqn_box_new(); | |||
521 | bp->parent = parent; | |||
522 | bp->parent->args++; | |||
523 | bp->font = bp->parent->font; | |||
524 | bp->size = ep->gsize; | |||
525 | ||||
526 | if (NULL((void *)0) != parent->first) { | |||
527 | parent->last->next = bp; | |||
| ||||
528 | bp->prev = parent->last; | |||
529 | } else | |||
530 | parent->first = bp; | |||
531 | ||||
532 | parent->last = bp; | |||
533 | return bp; | |||
534 | } | |||
535 | ||||
536 | /* | |||
537 | * Reparent the current last node (of the current parent) under a new | |||
538 | * EQN_SUBEXPR as the first element. | |||
539 | * Then return the new parent. | |||
540 | * The new EQN_SUBEXPR will have a two-child limit. | |||
541 | */ | |||
542 | static struct eqn_box * | |||
543 | eqn_box_makebinary(struct eqn_node *ep, struct eqn_box *parent) | |||
544 | { | |||
545 | struct eqn_box *b, *newb; | |||
546 | ||||
547 | assert(NULL != parent->last)((((void *)0) != parent->last) ? (void)0 : __assert2("/usr/src/usr.bin/mandoc/eqn.c" , 547, __func__, "NULL != parent->last")); | |||
548 | b = parent->last; | |||
549 | if (parent->last == parent->first) | |||
550 | parent->first = NULL((void *)0); | |||
551 | parent->args--; | |||
552 | parent->last = b->prev; | |||
553 | b->prev = NULL((void *)0); | |||
554 | newb = eqn_box_alloc(ep, parent); | |||
555 | newb->type = EQN_SUBEXPR; | |||
556 | newb->expectargs = 2; | |||
557 | newb->args = 1; | |||
558 | newb->first = newb->last = b; | |||
559 | newb->first->next = NULL((void *)0); | |||
560 | b->parent = newb; | |||
561 | return newb; | |||
562 | } | |||
563 | ||||
564 | /* | |||
565 | * Parse the "delim" control statement. | |||
566 | */ | |||
567 | static void | |||
568 | eqn_delim(struct eqn_node *ep) | |||
569 | { | |||
570 | if (ep->end[0] == '\0' || ep->end[1] == '\0') { | |||
571 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
572 | ep->node->line, ep->node->pos, "delim"); | |||
573 | if (ep->end[0] != '\0') | |||
574 | ep->end++; | |||
575 | } else if (strncmp(ep->end, "off", 3) == 0) { | |||
576 | ep->delim = 0; | |||
577 | ep->end += 3; | |||
578 | } else if (strncmp(ep->end, "on", 2) == 0) { | |||
579 | if (ep->odelim && ep->cdelim) | |||
580 | ep->delim = 1; | |||
581 | ep->end += 2; | |||
582 | } else { | |||
583 | ep->odelim = *ep->end++; | |||
584 | ep->cdelim = *ep->end++; | |||
585 | ep->delim = 1; | |||
586 | } | |||
587 | } | |||
588 | ||||
589 | /* | |||
590 | * Undefine a previously-defined string. | |||
591 | */ | |||
592 | static void | |||
593 | eqn_undef(struct eqn_node *ep) | |||
594 | { | |||
595 | struct eqn_def *def; | |||
596 | ||||
597 | if (eqn_next(ep, MODE_NOSUB) == EQN_TOK_EOF) { | |||
598 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
599 | ep->node->line, ep->node->pos, "undef"); | |||
600 | return; | |||
601 | } | |||
602 | if ((def = eqn_def_find(ep)) == NULL((void *)0)) | |||
603 | return; | |||
604 | free(def->key); | |||
605 | free(def->val); | |||
606 | def->key = def->val = NULL((void *)0); | |||
607 | def->keysz = def->valsz = 0; | |||
608 | } | |||
609 | ||||
610 | static void | |||
611 | eqn_def(struct eqn_node *ep) | |||
612 | { | |||
613 | struct eqn_def *def; | |||
614 | int i; | |||
615 | ||||
616 | if (eqn_next(ep, MODE_NOSUB) == EQN_TOK_EOF) { | |||
617 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
618 | ep->node->line, ep->node->pos, "define"); | |||
619 | return; | |||
620 | } | |||
621 | ||||
622 | /* | |||
623 | * Search for a key that already exists. | |||
624 | * Create a new key if none is found. | |||
625 | */ | |||
626 | if ((def = eqn_def_find(ep)) == NULL((void *)0)) { | |||
627 | /* Find holes in string array. */ | |||
628 | for (i = 0; i < (int)ep->defsz; i++) | |||
629 | if (0 == ep->defs[i].keysz) | |||
630 | break; | |||
631 | ||||
632 | if (i == (int)ep->defsz) { | |||
633 | ep->defsz++; | |||
634 | ep->defs = mandoc_reallocarray(ep->defs, | |||
635 | ep->defsz, sizeof(struct eqn_def)); | |||
636 | ep->defs[i].key = ep->defs[i].val = NULL((void *)0); | |||
637 | } | |||
638 | ||||
639 | def = ep->defs + i; | |||
640 | free(def->key); | |||
641 | def->key = mandoc_strndup(ep->start, ep->toksz); | |||
642 | def->keysz = ep->toksz; | |||
643 | } | |||
644 | ||||
645 | if (eqn_next(ep, MODE_QUOTED) == EQN_TOK_EOF) { | |||
646 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
647 | ep->node->line, ep->node->pos, "define %s", def->key); | |||
648 | free(def->key); | |||
649 | free(def->val); | |||
650 | def->key = def->val = NULL((void *)0); | |||
651 | def->keysz = def->valsz = 0; | |||
652 | return; | |||
653 | } | |||
654 | free(def->val); | |||
655 | def->val = mandoc_strndup(ep->start, ep->toksz); | |||
656 | def->valsz = ep->toksz; | |||
657 | } | |||
658 | ||||
659 | void | |||
660 | eqn_parse(struct eqn_node *ep) | |||
661 | { | |||
662 | struct eqn_box *cur, *nbox, *parent, *split; | |||
663 | const char *cp, *cpn; | |||
664 | char *p; | |||
665 | enum eqn_tok tok; | |||
666 | enum { CCL_LET, CCL_DIG, CCL_PUN } ccl, ccln; | |||
667 | int size; | |||
668 | ||||
669 | parent = ep->node->eqn; | |||
670 | assert(parent != NULL)((parent != ((void *)0)) ? (void)0 : __assert2("/usr/src/usr.bin/mandoc/eqn.c" , 670, __func__, "parent != NULL")); | |||
| ||||
671 | ||||
672 | /* | |||
673 | * Empty equation. | |||
674 | * Do not add it to the high-level syntax tree. | |||
675 | */ | |||
676 | ||||
677 | if (ep->data == NULL((void *)0)) | |||
678 | return; | |||
679 | ||||
680 | ep->start = ep->end = ep->data; | |||
681 | ep->sublen = 0; | |||
682 | ep->subcnt = 0; | |||
683 | ||||
684 | next_tok: | |||
685 | tok = eqn_next(ep, MODE_TOK); | |||
686 | switch (tok) { | |||
687 | case EQN_TOK_UNDEF: | |||
688 | eqn_undef(ep); | |||
689 | break; | |||
690 | case EQN_TOK_NDEFINE: | |||
691 | case EQN_TOK_DEFINE: | |||
692 | eqn_def(ep); | |||
693 | break; | |||
694 | case EQN_TOK_TDEFINE: | |||
695 | if (eqn_next(ep, MODE_NOSUB) == EQN_TOK_EOF || | |||
696 | eqn_next(ep, MODE_QUOTED) == EQN_TOK_EOF) | |||
697 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
698 | ep->node->line, ep->node->pos, "tdefine"); | |||
699 | break; | |||
700 | case EQN_TOK_DELIM: | |||
701 | eqn_delim(ep); | |||
702 | break; | |||
703 | case EQN_TOK_GFONT: | |||
704 | if (eqn_next(ep, MODE_SUB) == EQN_TOK_EOF) | |||
705 | mandoc_msg(MANDOCERR_REQ_EMPTY, ep->node->line, | |||
706 | ep->node->pos, "%s", eqn_toks[tok]); | |||
707 | break; | |||
708 | case EQN_TOK_MARK: | |||
709 | case EQN_TOK_LINEUP: | |||
710 | /* Ignore these. */ | |||
711 | break; | |||
712 | case EQN_TOK_DYAD: | |||
713 | case EQN_TOK_VEC: | |||
714 | case EQN_TOK_UNDER: | |||
715 | case EQN_TOK_BAR: | |||
716 | case EQN_TOK_TILDE: | |||
717 | case EQN_TOK_HAT: | |||
718 | case EQN_TOK_DOT: | |||
719 | case EQN_TOK_DOTDOT: | |||
720 | if (parent->last == NULL((void *)0)) { | |||
721 | mandoc_msg(MANDOCERR_EQN_NOBOX, ep->node->line, | |||
722 | ep->node->pos, "%s", eqn_toks[tok]); | |||
723 | cur = eqn_box_alloc(ep, parent); | |||
724 | cur->type = EQN_TEXT; | |||
725 | cur->text = mandoc_strdup(""); | |||
726 | } | |||
727 | parent = eqn_box_makebinary(ep, parent); | |||
728 | parent->type = EQN_LIST; | |||
729 | parent->expectargs = 1; | |||
730 | parent->font = EQNFONT_ROMAN; | |||
731 | switch (tok) { | |||
732 | case EQN_TOK_DOTDOT: | |||
733 | parent->top = mandoc_strdup("\\[ad]"); | |||
734 | break; | |||
735 | case EQN_TOK_VEC: | |||
736 | parent->top = mandoc_strdup("\\[->]"); | |||
737 | break; | |||
738 | case EQN_TOK_DYAD: | |||
739 | parent->top = mandoc_strdup("\\[<>]"); | |||
740 | break; | |||
741 | case EQN_TOK_TILDE: | |||
742 | parent->top = mandoc_strdup("\\[a~]"); | |||
743 | break; | |||
744 | case EQN_TOK_UNDER: | |||
745 | parent->bottom = mandoc_strdup("\\[ul]"); | |||
746 | break; | |||
747 | case EQN_TOK_BAR: | |||
748 | parent->top = mandoc_strdup("\\[rn]"); | |||
749 | break; | |||
750 | case EQN_TOK_DOT: | |||
751 | parent->top = mandoc_strdup("\\[a.]"); | |||
752 | break; | |||
753 | case EQN_TOK_HAT: | |||
754 | parent->top = mandoc_strdup("\\[ha]"); | |||
755 | break; | |||
756 | default: | |||
757 | abort(); | |||
758 | } | |||
759 | parent = parent->parent; | |||
760 | break; | |||
761 | case EQN_TOK_FWD: | |||
762 | case EQN_TOK_BACK: | |||
763 | case EQN_TOK_DOWN: | |||
764 | case EQN_TOK_UP: | |||
765 | if (eqn_next(ep, MODE_SUB) == EQN_TOK_EOF) | |||
766 | mandoc_msg(MANDOCERR_REQ_EMPTY, ep->node->line, | |||
767 | ep->node->pos, "%s", eqn_toks[tok]); | |||
768 | break; | |||
769 | case EQN_TOK_FAT: | |||
770 | case EQN_TOK_ROMAN: | |||
771 | case EQN_TOK_ITALIC: | |||
772 | case EQN_TOK_BOLD: | |||
773 | while (parent->args == parent->expectargs) | |||
774 | parent = parent->parent; | |||
775 | /* | |||
776 | * These values apply to the next word or sequence of | |||
777 | * words; thus, we mark that we'll have a child with | |||
778 | * exactly one of those. | |||
779 | */ | |||
780 | parent = eqn_box_alloc(ep, parent); | |||
781 | parent->type = EQN_LIST; | |||
782 | parent->expectargs = 1; | |||
783 | switch (tok) { | |||
784 | case EQN_TOK_FAT: | |||
785 | parent->font = EQNFONT_FAT; | |||
786 | break; | |||
787 | case EQN_TOK_ROMAN: | |||
788 | parent->font = EQNFONT_ROMAN; | |||
789 | break; | |||
790 | case EQN_TOK_ITALIC: | |||
791 | parent->font = EQNFONT_ITALIC; | |||
792 | break; | |||
793 | case EQN_TOK_BOLD: | |||
794 | parent->font = EQNFONT_BOLD; | |||
795 | break; | |||
796 | default: | |||
797 | abort(); | |||
798 | } | |||
799 | break; | |||
800 | case EQN_TOK_SIZE: | |||
801 | case EQN_TOK_GSIZE: | |||
802 | /* Accept two values: integral size and a single. */ | |||
803 | if (eqn_next(ep, MODE_SUB) == EQN_TOK_EOF) { | |||
804 | mandoc_msg(MANDOCERR_REQ_EMPTY, ep->node->line, | |||
805 | ep->node->pos, "%s", eqn_toks[tok]); | |||
806 | break; | |||
807 | } | |||
808 | size = mandoc_strntoi(ep->start, ep->toksz, 10); | |||
809 | if (-1 == size) { | |||
810 | mandoc_msg(MANDOCERR_IT_NONUM, ep->node->line, | |||
811 | ep->node->pos, "%s", eqn_toks[tok]); | |||
812 | break; | |||
813 | } | |||
814 | if (EQN_TOK_GSIZE == tok) { | |||
815 | ep->gsize = size; | |||
816 | break; | |||
817 | } | |||
818 | while (parent->args == parent->expectargs) | |||
819 | parent = parent->parent; | |||
820 | parent = eqn_box_alloc(ep, parent); | |||
821 | parent->type = EQN_LIST; | |||
822 | parent->expectargs = 1; | |||
823 | parent->size = size; | |||
824 | break; | |||
825 | case EQN_TOK_FROM: | |||
826 | case EQN_TOK_TO: | |||
827 | case EQN_TOK_SUB: | |||
828 | case EQN_TOK_SUP: | |||
829 | /* | |||
830 | * We have a left-right-associative expression. | |||
831 | * Repivot under a positional node, open a child scope | |||
832 | * and keep on reading. | |||
833 | */ | |||
834 | if (parent->last == NULL((void *)0)) { | |||
835 | mandoc_msg(MANDOCERR_EQN_NOBOX, ep->node->line, | |||
836 | ep->node->pos, "%s", eqn_toks[tok]); | |||
837 | cur = eqn_box_alloc(ep, parent); | |||
838 | cur->type = EQN_TEXT; | |||
839 | cur->text = mandoc_strdup(""); | |||
840 | } | |||
841 | while (parent->expectargs == 1 && parent->args == 1) | |||
842 | parent = parent->parent; | |||
843 | if (tok == EQN_TOK_FROM || tok == EQN_TOK_TO) { | |||
844 | for (cur = parent; cur != NULL((void *)0); cur = cur->parent) | |||
845 | if (cur->pos == EQNPOS_SUB || | |||
846 | cur->pos == EQNPOS_SUP || | |||
847 | cur->pos == EQNPOS_SUBSUP || | |||
848 | cur->pos == EQNPOS_SQRT || | |||
849 | cur->pos == EQNPOS_OVER) | |||
850 | break; | |||
851 | if (cur != NULL((void *)0)) | |||
852 | parent = cur->parent; | |||
853 | } | |||
854 | if (tok == EQN_TOK_SUP && parent->pos == EQNPOS_SUB) { | |||
855 | parent->expectargs = 3; | |||
856 | parent->pos = EQNPOS_SUBSUP; | |||
857 | break; | |||
858 | } | |||
859 | if (tok == EQN_TOK_TO && parent->pos == EQNPOS_FROM) { | |||
860 | parent->expectargs = 3; | |||
861 | parent->pos = EQNPOS_FROMTO; | |||
862 | break; | |||
863 | } | |||
864 | parent = eqn_box_makebinary(ep, parent); | |||
865 | switch (tok) { | |||
866 | case EQN_TOK_FROM: | |||
867 | parent->pos = EQNPOS_FROM; | |||
868 | break; | |||
869 | case EQN_TOK_TO: | |||
870 | parent->pos = EQNPOS_TO; | |||
871 | break; | |||
872 | case EQN_TOK_SUP: | |||
873 | parent->pos = EQNPOS_SUP; | |||
874 | break; | |||
875 | case EQN_TOK_SUB: | |||
876 | parent->pos = EQNPOS_SUB; | |||
877 | break; | |||
878 | default: | |||
879 | abort(); | |||
880 | } | |||
881 | break; | |||
882 | case EQN_TOK_SQRT: | |||
883 | while (parent->args == parent->expectargs) | |||
884 | parent = parent->parent; | |||
885 | /* | |||
886 | * Accept a left-right-associative set of arguments just | |||
887 | * like sub and sup and friends but without rebalancing | |||
888 | * under a pivot. | |||
889 | */ | |||
890 | parent = eqn_box_alloc(ep, parent); | |||
891 | parent->type = EQN_SUBEXPR; | |||
892 | parent->pos = EQNPOS_SQRT; | |||
893 | parent->expectargs = 1; | |||
894 | break; | |||
895 | case EQN_TOK_OVER: | |||
896 | /* | |||
897 | * We have a right-left-associative fraction. | |||
898 | * Close out anything that's currently open, then | |||
899 | * rebalance and continue reading. | |||
900 | */ | |||
901 | if (parent->last == NULL((void *)0)) { | |||
902 | mandoc_msg(MANDOCERR_EQN_NOBOX, ep->node->line, | |||
903 | ep->node->pos, "%s", eqn_toks[tok]); | |||
904 | cur = eqn_box_alloc(ep, parent); | |||
905 | cur->type = EQN_TEXT; | |||
906 | cur->text = mandoc_strdup(""); | |||
907 | } | |||
908 | while (parent->args == parent->expectargs) | |||
909 | parent = parent->parent; | |||
910 | while (EQN_SUBEXPR == parent->type) | |||
911 | parent = parent->parent; | |||
912 | parent = eqn_box_makebinary(ep, parent); | |||
913 | parent->pos = EQNPOS_OVER; | |||
914 | break; | |||
915 | case EQN_TOK_RIGHT: | |||
916 | case EQN_TOK_BRACE_CLOSE: | |||
917 | /* | |||
918 | * Close out the existing brace. | |||
919 | * FIXME: this is a shitty sentinel: we should really | |||
920 | * have a native EQN_BRACE type or whatnot. | |||
921 | */ | |||
922 | for (cur = parent; cur != NULL((void *)0); cur = cur->parent) | |||
923 | if (cur->type == EQN_LIST && | |||
924 | cur->expectargs > 1 && | |||
925 | (tok == EQN_TOK_BRACE_CLOSE || | |||
926 | cur->left != NULL((void *)0))) | |||
927 | break; | |||
928 | if (cur == NULL((void *)0)) { | |||
929 | mandoc_msg(MANDOCERR_BLK_NOTOPEN, ep->node->line, | |||
930 | ep->node->pos, "%s", eqn_toks[tok]); | |||
931 | break; | |||
932 | } | |||
933 | parent = cur; | |||
934 | if (EQN_TOK_RIGHT == tok) { | |||
935 | if (eqn_next(ep, MODE_SUB) == EQN_TOK_EOF) { | |||
936 | mandoc_msg(MANDOCERR_REQ_EMPTY, | |||
937 | ep->node->line, ep->node->pos, | |||
938 | "%s", eqn_toks[tok]); | |||
939 | break; | |||
940 | } | |||
941 | /* Handling depends on right/left. */ | |||
942 | if (STRNEQ(ep->start, ep->toksz, "ceiling", 7)((ep->toksz) == (7) && 0 == strncmp((ep->start) , ("ceiling"), (ep->toksz)))) | |||
943 | parent->right = mandoc_strdup("\\[rc]"); | |||
944 | else if (STRNEQ(ep->start, ep->toksz, "floor", 5)((ep->toksz) == (5) && 0 == strncmp((ep->start) , ("floor"), (ep->toksz)))) | |||
945 | parent->right = mandoc_strdup("\\[rf]"); | |||
946 | else | |||
947 | parent->right = | |||
948 | mandoc_strndup(ep->start, ep->toksz); | |||
949 | } | |||
950 | parent = parent->parent; | |||
951 | if (tok == EQN_TOK_BRACE_CLOSE && | |||
952 | (parent->type == EQN_PILE || | |||
953 | parent->type == EQN_MATRIX)) | |||
954 | parent = parent->parent; | |||
955 | /* Close out any "singleton" lists. */ | |||
956 | while (parent->type == EQN_LIST && | |||
957 | parent->expectargs == 1 && | |||
958 | parent->args == 1) | |||
959 | parent = parent->parent; | |||
960 | break; | |||
961 | case EQN_TOK_BRACE_OPEN: | |||
962 | case EQN_TOK_LEFT: | |||
963 | /* | |||
964 | * If we already have something in the stack and we're | |||
965 | * in an expression, then rewind til we're not any more | |||
966 | * (just like with the text node). | |||
967 | */ | |||
968 | while (parent->args == parent->expectargs) | |||
969 | parent = parent->parent; | |||
970 | if (EQN_TOK_LEFT == tok && | |||
971 | eqn_next(ep, MODE_SUB) == EQN_TOK_EOF) { | |||
972 | mandoc_msg(MANDOCERR_REQ_EMPTY, ep->node->line, | |||
973 | ep->node->pos, "%s", eqn_toks[tok]); | |||
974 | break; | |||
975 | } | |||
976 | parent = eqn_box_alloc(ep, parent); | |||
977 | parent->type = EQN_LIST; | |||
978 | if (EQN_TOK_LEFT == tok) { | |||
979 | if (STRNEQ(ep->start, ep->toksz, "ceiling", 7)((ep->toksz) == (7) && 0 == strncmp((ep->start) , ("ceiling"), (ep->toksz)))) | |||
980 | parent->left = mandoc_strdup("\\[lc]"); | |||
981 | else if (STRNEQ(ep->start, ep->toksz, "floor", 5)((ep->toksz) == (5) && 0 == strncmp((ep->start) , ("floor"), (ep->toksz)))) | |||
982 | parent->left = mandoc_strdup("\\[lf]"); | |||
983 | else | |||
984 | parent->left = | |||
985 | mandoc_strndup(ep->start, ep->toksz); | |||
986 | } | |||
987 | break; | |||
988 | case EQN_TOK_PILE: | |||
989 | case EQN_TOK_LPILE: | |||
990 | case EQN_TOK_RPILE: | |||
991 | case EQN_TOK_CPILE: | |||
992 | case EQN_TOK_CCOL: | |||
993 | case EQN_TOK_LCOL: | |||
994 | case EQN_TOK_RCOL: | |||
995 | while (parent->args == parent->expectargs) | |||
996 | parent = parent->parent; | |||
997 | parent = eqn_box_alloc(ep, parent); | |||
998 | parent->type = EQN_PILE; | |||
999 | parent->expectargs = 1; | |||
1000 | break; | |||
1001 | case EQN_TOK_ABOVE: | |||
1002 | for (cur = parent; cur != NULL((void *)0); cur = cur->parent) | |||
1003 | if (cur->type == EQN_PILE) | |||
1004 | break; | |||
1005 | if (cur == NULL((void *)0)) { | |||
1006 | mandoc_msg(MANDOCERR_IT_STRAY, ep->node->line, | |||
1007 | ep->node->pos, "%s", eqn_toks[tok]); | |||
1008 | break; | |||
1009 | } | |||
1010 | parent = eqn_box_alloc(ep, cur); | |||
1011 | parent->type = EQN_LIST; | |||
1012 | break; | |||
1013 | case EQN_TOK_MATRIX: | |||
1014 | while (parent->args == parent->expectargs) | |||
1015 | parent = parent->parent; | |||
1016 | parent = eqn_box_alloc(ep, parent); | |||
1017 | parent->type = EQN_MATRIX; | |||
1018 | parent->expectargs = 1; | |||
1019 | break; | |||
1020 | case EQN_TOK_EOF: | |||
1021 | return; | |||
1022 | case EQN_TOK__MAX: | |||
1023 | case EQN_TOK_FUNC: | |||
1024 | case EQN_TOK_QUOTED: | |||
1025 | case EQN_TOK_SYM: | |||
1026 | p = ep->start; | |||
1027 | assert(p != NULL)((p != ((void *)0)) ? (void)0 : __assert2("/usr/src/usr.bin/mandoc/eqn.c" , 1027, __func__, "p != NULL")); | |||
1028 | /* | |||
1029 | * If we already have something in the stack and we're | |||
1030 | * in an expression, then rewind til we're not any more. | |||
1031 | */ | |||
1032 | while (parent->args == parent->expectargs) | |||
1033 | parent = parent->parent; | |||
1034 | cur = eqn_box_alloc(ep, parent); | |||
1035 | cur->type = EQN_TEXT; | |||
1036 | cur->text = p; | |||
1037 | switch (tok) { | |||
1038 | case EQN_TOK_FUNC: | |||
1039 | cur->font = EQNFONT_ROMAN; | |||
1040 | break; | |||
1041 | case EQN_TOK_QUOTED: | |||
1042 | if (cur->font == EQNFONT_NONE) | |||
1043 | cur->font = EQNFONT_ITALIC; | |||
1044 | break; | |||
1045 | case EQN_TOK_SYM: | |||
1046 | break; | |||
1047 | default: | |||
1048 | if (cur->font != EQNFONT_NONE || *p == '\0') | |||
1049 | break; | |||
1050 | cpn = p - 1; | |||
1051 | ccln = CCL_LET; | |||
1052 | split = NULL((void *)0); | |||
1053 | for (;;) { | |||
1054 | /* Advance to next character. */ | |||
1055 | cp = cpn++; | |||
1056 | ccl = ccln; | |||
1057 | ccln = isalpha((unsigned char)*cpn) ? CCL_LET : | |||
1058 | isdigit((unsigned char)*cpn) || | |||
1059 | (*cpn == '.' && (ccl == CCL_DIG || | |||
1060 | isdigit((unsigned char)cpn[1]))) ? | |||
1061 | CCL_DIG : CCL_PUN; | |||
1062 | /* No boundary before first character. */ | |||
1063 | if (cp < p) | |||
1064 | continue; | |||
1065 | cur->font = ccl == CCL_LET ? | |||
1066 | EQNFONT_ITALIC : EQNFONT_ROMAN; | |||
1067 | if (*cp == '\\') | |||
1068 | mandoc_escape(&cpn, NULL((void *)0), NULL((void *)0)); | |||
1069 | /* No boundary after last character. */ | |||
1070 | if (*cpn == '\0') | |||
1071 | break; | |||
1072 | if (ccln == ccl && *cp != ',' && *cpn != ',') | |||
1073 | continue; | |||
1074 | /* Boundary found, split the text. */ | |||
1075 | if (parent->args == parent->expectargs) { | |||
1076 | /* Remove the text from the tree. */ | |||
1077 | if (cur->prev == NULL((void *)0)) | |||
1078 | parent->first = cur->next; | |||
1079 | else | |||
1080 | cur->prev->next = NULL((void *)0); | |||
1081 | parent->last = cur->prev; | |||
1082 | parent->args--; | |||
1083 | /* Set up a list instead. */ | |||
1084 | split = eqn_box_alloc(ep, parent); | |||
1085 | split->type = EQN_LIST; | |||
1086 | /* Insert the word into the list. */ | |||
1087 | split->first = split->last = cur; | |||
1088 | cur->parent = split; | |||
1089 | cur->prev = NULL((void *)0); | |||
1090 | parent = split; | |||
1091 | } | |||
1092 | /* Append a new text box. */ | |||
1093 | nbox = eqn_box_alloc(ep, parent); | |||
1094 | nbox->type = EQN_TEXT; | |||
1095 | nbox->text = mandoc_strdup(cpn); | |||
1096 | /* Truncate the old box. */ | |||
1097 | p = mandoc_strndup(cur->text, | |||
1098 | cpn - cur->text); | |||
1099 | free(cur->text); | |||
1100 | cur->text = p; | |||
1101 | /* Setup to process the new box. */ | |||
1102 | cur = nbox; | |||
1103 | p = nbox->text; | |||
1104 | cpn = p - 1; | |||
1105 | ccln = CCL_LET; | |||
1106 | } | |||
1107 | if (split != NULL((void *)0)) | |||
1108 | parent = split->parent; | |||
1109 | break; | |||
1110 | } | |||
1111 | break; | |||
1112 | default: | |||
1113 | abort(); | |||
1114 | } | |||
1115 | goto next_tok; | |||
1116 | } | |||
1117 | ||||
1118 | void | |||
1119 | eqn_free(struct eqn_node *p) | |||
1120 | { | |||
1121 | int i; | |||
1122 | ||||
1123 | if (p == NULL((void *)0)) | |||
1124 | return; | |||
1125 | ||||
1126 | for (i = 0; i < (int)p->defsz; i++) { | |||
1127 | free(p->defs[i].key); | |||
1128 | free(p->defs[i].val); | |||
1129 | } | |||
1130 | ||||
1131 | free(p->data); | |||
1132 | free(p->defs); | |||
1133 | free(p); | |||
1134 | } |