/* $Id: tbl_layout.c,v 1.50 2021/08/10 12:55:04 schwarze Exp $ */
/*
 * Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
 * Copyright (c) 2012, 2014, 2015, 2017, 2020, 2021
 *               Ingo Schwarze <schwarze@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
19a4c7eb57SSascha Wildner #include "config.h"
2054ba9607SSascha Wildner
2154ba9607SSascha Wildner #include <sys/types.h>
22a4c7eb57SSascha Wildner
2380387638SSascha Wildner #include <ctype.h>
2454ba9607SSascha Wildner #include <stdint.h>
2554ba9607SSascha Wildner #include <stdio.h>
2680387638SSascha Wildner #include <stdlib.h>
2780387638SSascha Wildner #include <string.h>
2880387638SSascha Wildner #include <time.h>
2980387638SSascha Wildner
30070c62a6SFranco Fichtner #include "mandoc_aux.h"
3154ba9607SSascha Wildner #include "mandoc.h"
3254ba9607SSascha Wildner #include "tbl.h"
3380387638SSascha Wildner #include "libmandoc.h"
3454ba9607SSascha Wildner #include "tbl_int.h"
3580387638SSascha Wildner
3680387638SSascha Wildner struct tbl_phrase {
3780387638SSascha Wildner char name;
3880387638SSascha Wildner enum tbl_cellt key;
3980387638SSascha Wildner };
4080387638SSascha Wildner
4154ba9607SSascha Wildner static const struct tbl_phrase keys[] = {
4280387638SSascha Wildner { 'c', TBL_CELL_CENTRE },
4380387638SSascha Wildner { 'r', TBL_CELL_RIGHT },
4480387638SSascha Wildner { 'l', TBL_CELL_LEFT },
4580387638SSascha Wildner { 'n', TBL_CELL_NUMBER },
4680387638SSascha Wildner { 's', TBL_CELL_SPAN },
4780387638SSascha Wildner { 'a', TBL_CELL_LONG },
4880387638SSascha Wildner { '^', TBL_CELL_DOWN },
4980387638SSascha Wildner { '-', TBL_CELL_HORIZ },
5080387638SSascha Wildner { '_', TBL_CELL_HORIZ },
51f88b6c16SFranco Fichtner { '=', TBL_CELL_DHORIZ }
5280387638SSascha Wildner };
5380387638SSascha Wildner
/* Number of entries in keys[], cast to int to match the index used in cell(). */
#define KEYS_MAX ((int)(sizeof(keys)/sizeof(keys[0])))
5554ba9607SSascha Wildner
/* Forward declarations of the file-local layout parsing helpers. */
static	void		 mods(struct tbl_node *tbl, struct tbl_cell *cp,
				int ln, const char *p, int *pos);
static	void		 cell(struct tbl_node *tbl, struct tbl_row *rp,
				int ln, const char *p, int *pos);
static	struct tbl_cell *cell_alloc(struct tbl_node *tbl,
				struct tbl_row *rp, enum tbl_cellt pos);
6280387638SSascha Wildner
63070c62a6SFranco Fichtner
6454ba9607SSascha Wildner static void
mods(struct tbl_node * tbl,struct tbl_cell * cp,int ln,const char * p,int * pos)6580387638SSascha Wildner mods(struct tbl_node *tbl, struct tbl_cell *cp,
6680387638SSascha Wildner int ln, const char *p, int *pos)
6780387638SSascha Wildner {
6854ba9607SSascha Wildner char *endptr;
69*99db7d0eSSascha Wildner unsigned long spacing;
7054ba9607SSascha Wildner size_t sz;
71*99db7d0eSSascha Wildner int isz;
72*99db7d0eSSascha Wildner enum mandoc_esc fontesc;
73a4c7eb57SSascha Wildner
7480387638SSascha Wildner mod:
7554ba9607SSascha Wildner while (p[*pos] == ' ' || p[*pos] == '\t')
7654ba9607SSascha Wildner (*pos)++;
7754ba9607SSascha Wildner
7854ba9607SSascha Wildner /* Row delimiters and cell specifiers end modifier lists. */
7954ba9607SSascha Wildner
8054ba9607SSascha Wildner if (strchr(".,-=^_ACLNRSaclnrs", p[*pos]) != NULL)
8154ba9607SSascha Wildner return;
8280387638SSascha Wildner
8380387638SSascha Wildner /* Throw away parenthesised expression. */
8480387638SSascha Wildner
8580387638SSascha Wildner if ('(' == p[*pos]) {
8680387638SSascha Wildner (*pos)++;
8780387638SSascha Wildner while (p[*pos] && ')' != p[*pos])
8880387638SSascha Wildner (*pos)++;
8980387638SSascha Wildner if (')' == p[*pos]) {
9080387638SSascha Wildner (*pos)++;
9180387638SSascha Wildner goto mod;
9280387638SSascha Wildner }
9354ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_PAR, ln, *pos, NULL);
9454ba9607SSascha Wildner return;
9580387638SSascha Wildner }
9680387638SSascha Wildner
9780387638SSascha Wildner /* Parse numerical spacing from modifier string. */
9880387638SSascha Wildner
9980387638SSascha Wildner if (isdigit((unsigned char)p[*pos])) {
100*99db7d0eSSascha Wildner if ((spacing = strtoul(p + *pos, &endptr, 10)) > 9)
101*99db7d0eSSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_SPC, ln, *pos,
102*99db7d0eSSascha Wildner "%lu", spacing);
103*99db7d0eSSascha Wildner else
104*99db7d0eSSascha Wildner cp->spacing = spacing;
10554ba9607SSascha Wildner *pos = endptr - p;
10680387638SSascha Wildner goto mod;
10780387638SSascha Wildner }
10880387638SSascha Wildner
10960e1e752SSascha Wildner switch (tolower((unsigned char)p[(*pos)++])) {
11054ba9607SSascha Wildner case 'b':
111*99db7d0eSSascha Wildner cp->font = ESCAPE_FONTBOLD;
11280387638SSascha Wildner goto mod;
113070c62a6SFranco Fichtner case 'd':
11480387638SSascha Wildner cp->flags |= TBL_CELL_BALIGN;
11580387638SSascha Wildner goto mod;
11654ba9607SSascha Wildner case 'e':
11754ba9607SSascha Wildner cp->flags |= TBL_CELL_EQUAL;
11880387638SSascha Wildner goto mod;
119070c62a6SFranco Fichtner case 'f':
12080387638SSascha Wildner break;
121070c62a6SFranco Fichtner case 'i':
122*99db7d0eSSascha Wildner cp->font = ESCAPE_FONTITALIC;
12380387638SSascha Wildner goto mod;
12454ba9607SSascha Wildner case 'm':
12554ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_MOD, ln, *pos, "m");
12654ba9607SSascha Wildner goto mod;
12754ba9607SSascha Wildner case 'p':
12854ba9607SSascha Wildner case 'v':
12954ba9607SSascha Wildner if (p[*pos] == '-' || p[*pos] == '+')
13054ba9607SSascha Wildner (*pos)++;
13154ba9607SSascha Wildner while (isdigit((unsigned char)p[*pos]))
13254ba9607SSascha Wildner (*pos)++;
13354ba9607SSascha Wildner goto mod;
13454ba9607SSascha Wildner case 't':
13554ba9607SSascha Wildner cp->flags |= TBL_CELL_TALIGN;
13654ba9607SSascha Wildner goto mod;
13754ba9607SSascha Wildner case 'u':
13854ba9607SSascha Wildner cp->flags |= TBL_CELL_UP;
13954ba9607SSascha Wildner goto mod;
14054ba9607SSascha Wildner case 'w':
14154ba9607SSascha Wildner sz = 0;
14254ba9607SSascha Wildner if (p[*pos] == '(') {
14354ba9607SSascha Wildner (*pos)++;
14454ba9607SSascha Wildner while (p[*pos + sz] != '\0' && p[*pos + sz] != ')')
14554ba9607SSascha Wildner sz++;
14654ba9607SSascha Wildner } else
14754ba9607SSascha Wildner while (isdigit((unsigned char)p[*pos + sz]))
14854ba9607SSascha Wildner sz++;
14954ba9607SSascha Wildner if (sz) {
15054ba9607SSascha Wildner free(cp->wstr);
15154ba9607SSascha Wildner cp->wstr = mandoc_strndup(p + *pos, sz);
15254ba9607SSascha Wildner *pos += sz;
15354ba9607SSascha Wildner if (p[*pos] == ')')
15454ba9607SSascha Wildner (*pos)++;
15554ba9607SSascha Wildner }
15654ba9607SSascha Wildner goto mod;
15754ba9607SSascha Wildner case 'x':
15854ba9607SSascha Wildner cp->flags |= TBL_CELL_WMAX;
15954ba9607SSascha Wildner goto mod;
16054ba9607SSascha Wildner case 'z':
16154ba9607SSascha Wildner cp->flags |= TBL_CELL_WIGN;
16254ba9607SSascha Wildner goto mod;
16354ba9607SSascha Wildner case '|':
16454ba9607SSascha Wildner if (cp->vert < 2)
16554ba9607SSascha Wildner cp->vert++;
16654ba9607SSascha Wildner else
16754ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_VERT,
16854ba9607SSascha Wildner ln, *pos - 1, NULL);
16936342e81SSascha Wildner goto mod;
17080387638SSascha Wildner default:
17154ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_CHAR,
17254ba9607SSascha Wildner ln, *pos - 1, "%c", p[*pos - 1]);
17354ba9607SSascha Wildner goto mod;
17480387638SSascha Wildner }
17580387638SSascha Wildner
176*99db7d0eSSascha Wildner while (p[*pos] == ' ' || p[*pos] == '\t')
177*99db7d0eSSascha Wildner (*pos)++;
178*99db7d0eSSascha Wildner
17954ba9607SSascha Wildner /* Ignore parenthised font names for now. */
18054ba9607SSascha Wildner
18154ba9607SSascha Wildner if (p[*pos] == '(')
18254ba9607SSascha Wildner goto mod;
18354ba9607SSascha Wildner
184*99db7d0eSSascha Wildner isz = 0;
185*99db7d0eSSascha Wildner if (p[*pos] != '\0')
186*99db7d0eSSascha Wildner isz++;
187*99db7d0eSSascha Wildner if (strchr(" \t.", p[*pos + isz]) == NULL)
188*99db7d0eSSascha Wildner isz++;
18954ba9607SSascha Wildner
190*99db7d0eSSascha Wildner fontesc = mandoc_font(p + *pos, isz);
191*99db7d0eSSascha Wildner
192*99db7d0eSSascha Wildner switch (fontesc) {
193*99db7d0eSSascha Wildner case ESCAPE_FONTPREV:
194*99db7d0eSSascha Wildner case ESCAPE_ERROR:
19554ba9607SSascha Wildner mandoc_msg(MANDOCERR_FT_BAD,
19654ba9607SSascha Wildner ln, *pos, "TS %s", p + *pos - 1);
197*99db7d0eSSascha Wildner break;
19854ba9607SSascha Wildner default:
199*99db7d0eSSascha Wildner cp->font = fontesc;
200*99db7d0eSSascha Wildner break;
20154ba9607SSascha Wildner }
202*99db7d0eSSascha Wildner *pos += isz;
203*99db7d0eSSascha Wildner goto mod;
20454ba9607SSascha Wildner }
20554ba9607SSascha Wildner
20654ba9607SSascha Wildner static void
cell(struct tbl_node * tbl,struct tbl_row * rp,int ln,const char * p,int * pos)20780387638SSascha Wildner cell(struct tbl_node *tbl, struct tbl_row *rp,
20880387638SSascha Wildner int ln, const char *p, int *pos)
20980387638SSascha Wildner {
21054ba9607SSascha Wildner int i;
21180387638SSascha Wildner enum tbl_cellt c;
21280387638SSascha Wildner
21354ba9607SSascha Wildner /* Handle leading vertical lines */
214f88b6c16SFranco Fichtner
21554ba9607SSascha Wildner while (p[*pos] == ' ' || p[*pos] == '\t' || p[*pos] == '|') {
21654ba9607SSascha Wildner if (p[*pos] == '|') {
21754ba9607SSascha Wildner if (rp->vert < 2)
21854ba9607SSascha Wildner rp->vert++;
21954ba9607SSascha Wildner else
22054ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_VERT,
22154ba9607SSascha Wildner ln, *pos, NULL);
22254ba9607SSascha Wildner }
22354ba9607SSascha Wildner (*pos)++;
22454ba9607SSascha Wildner }
22554ba9607SSascha Wildner
22654ba9607SSascha Wildner again:
22754ba9607SSascha Wildner while (p[*pos] == ' ' || p[*pos] == '\t')
228f88b6c16SFranco Fichtner (*pos)++;
229f88b6c16SFranco Fichtner
23054ba9607SSascha Wildner if (p[*pos] == '.' || p[*pos] == '\0')
23154ba9607SSascha Wildner return;
232070c62a6SFranco Fichtner
233f88b6c16SFranco Fichtner /* Parse the column position (`c', `l', `r', ...). */
23480387638SSascha Wildner
23580387638SSascha Wildner for (i = 0; i < KEYS_MAX; i++)
23660e1e752SSascha Wildner if (tolower((unsigned char)p[*pos]) == keys[i].name)
23780387638SSascha Wildner break;
23880387638SSascha Wildner
23954ba9607SSascha Wildner if (i == KEYS_MAX) {
24054ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_CHAR,
24154ba9607SSascha Wildner ln, *pos, "%c", p[*pos]);
24254ba9607SSascha Wildner (*pos)++;
24354ba9607SSascha Wildner goto again;
24480387638SSascha Wildner }
24580387638SSascha Wildner c = keys[i].key;
24680387638SSascha Wildner
24754ba9607SSascha Wildner /* Special cases of spanners. */
24880387638SSascha Wildner
24954ba9607SSascha Wildner if (c == TBL_CELL_SPAN) {
25054ba9607SSascha Wildner if (rp->last == NULL)
25154ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_SPAN, ln, *pos, NULL);
25254ba9607SSascha Wildner else if (rp->last->pos == TBL_CELL_HORIZ ||
25354ba9607SSascha Wildner rp->last->pos == TBL_CELL_DHORIZ)
25454ba9607SSascha Wildner c = rp->last->pos;
25554ba9607SSascha Wildner } else if (c == TBL_CELL_DOWN && rp == tbl->first_row)
25654ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_DOWN, ln, *pos, NULL);
25780387638SSascha Wildner
25880387638SSascha Wildner (*pos)++;
25980387638SSascha Wildner
26080387638SSascha Wildner /* Allocate cell then parse its modifiers. */
26180387638SSascha Wildner
26254ba9607SSascha Wildner mods(tbl, cell_alloc(tbl, rp, c), ln, p, pos);
26380387638SSascha Wildner }
26480387638SSascha Wildner
26554ba9607SSascha Wildner void
tbl_layout(struct tbl_node * tbl,int ln,const char * p,int pos)26654ba9607SSascha Wildner tbl_layout(struct tbl_node *tbl, int ln, const char *p, int pos)
26780387638SSascha Wildner {
26880387638SSascha Wildner struct tbl_row *rp;
26980387638SSascha Wildner
27054ba9607SSascha Wildner rp = NULL;
27154ba9607SSascha Wildner for (;;) {
27254ba9607SSascha Wildner /* Skip whitespace before and after each cell. */
27354ba9607SSascha Wildner
27454ba9607SSascha Wildner while (p[pos] == ' ' || p[pos] == '\t')
27554ba9607SSascha Wildner pos++;
27654ba9607SSascha Wildner
27754ba9607SSascha Wildner switch (p[pos]) {
27854ba9607SSascha Wildner case ',': /* Next row on this input line. */
27954ba9607SSascha Wildner pos++;
28054ba9607SSascha Wildner rp = NULL;
28154ba9607SSascha Wildner continue;
28254ba9607SSascha Wildner case '\0': /* Next row on next input line. */
28354ba9607SSascha Wildner return;
28454ba9607SSascha Wildner case '.': /* End of layout. */
28554ba9607SSascha Wildner pos++;
28654ba9607SSascha Wildner tbl->part = TBL_PART_DATA;
28754ba9607SSascha Wildner
28854ba9607SSascha Wildner /*
28954ba9607SSascha Wildner * When the layout is completely empty,
29054ba9607SSascha Wildner * default to one left-justified column.
29180387638SSascha Wildner */
29280387638SSascha Wildner
29354ba9607SSascha Wildner if (tbl->first_row == NULL) {
29454ba9607SSascha Wildner tbl->first_row = tbl->last_row =
29554ba9607SSascha Wildner mandoc_calloc(1, sizeof(*rp));
29654ba9607SSascha Wildner }
29754ba9607SSascha Wildner if (tbl->first_row->first == NULL) {
29854ba9607SSascha Wildner mandoc_msg(MANDOCERR_TBLLAYOUT_NONE,
29954ba9607SSascha Wildner ln, pos, NULL);
30054ba9607SSascha Wildner cell_alloc(tbl, tbl->first_row,
30154ba9607SSascha Wildner TBL_CELL_LEFT);
30254ba9607SSascha Wildner if (tbl->opts.lvert < tbl->first_row->vert)
30354ba9607SSascha Wildner tbl->opts.lvert = tbl->first_row->vert;
30454ba9607SSascha Wildner return;
30554ba9607SSascha Wildner }
30654ba9607SSascha Wildner
30754ba9607SSascha Wildner /*
30854ba9607SSascha Wildner * Search for the widest line
30954ba9607SSascha Wildner * along the left and right margins.
31054ba9607SSascha Wildner */
31154ba9607SSascha Wildner
31254ba9607SSascha Wildner for (rp = tbl->first_row; rp; rp = rp->next) {
31354ba9607SSascha Wildner if (tbl->opts.lvert < rp->vert)
31454ba9607SSascha Wildner tbl->opts.lvert = rp->vert;
31554ba9607SSascha Wildner if (rp->last != NULL &&
31654ba9607SSascha Wildner rp->last->col + 1 == tbl->opts.cols &&
31754ba9607SSascha Wildner tbl->opts.rvert < rp->last->vert)
31854ba9607SSascha Wildner tbl->opts.rvert = rp->last->vert;
31954ba9607SSascha Wildner
32054ba9607SSascha Wildner /* If the last line is empty, drop it. */
32154ba9607SSascha Wildner
32254ba9607SSascha Wildner if (rp->next != NULL &&
32354ba9607SSascha Wildner rp->next->first == NULL) {
32454ba9607SSascha Wildner free(rp->next);
32554ba9607SSascha Wildner rp->next = NULL;
32654ba9607SSascha Wildner tbl->last_row = rp;
32754ba9607SSascha Wildner }
32854ba9607SSascha Wildner }
32954ba9607SSascha Wildner return;
33054ba9607SSascha Wildner default: /* Cell. */
33154ba9607SSascha Wildner break;
33254ba9607SSascha Wildner }
33354ba9607SSascha Wildner
33454ba9607SSascha Wildner /*
33554ba9607SSascha Wildner * If the last line had at least one cell,
33654ba9607SSascha Wildner * start a new one; otherwise, continue it.
33754ba9607SSascha Wildner */
33854ba9607SSascha Wildner
33954ba9607SSascha Wildner if (rp == NULL) {
34054ba9607SSascha Wildner if (tbl->last_row == NULL ||
34154ba9607SSascha Wildner tbl->last_row->first != NULL) {
34254ba9607SSascha Wildner rp = mandoc_calloc(1, sizeof(*rp));
343f88b6c16SFranco Fichtner if (tbl->last_row)
34480387638SSascha Wildner tbl->last_row->next = rp;
345f88b6c16SFranco Fichtner else
346f88b6c16SFranco Fichtner tbl->first_row = rp;
34780387638SSascha Wildner tbl->last_row = rp;
34854ba9607SSascha Wildner } else
34954ba9607SSascha Wildner rp = tbl->last_row;
35080387638SSascha Wildner }
35154ba9607SSascha Wildner cell(tbl, rp, ln, p, &pos);
35280387638SSascha Wildner }
35380387638SSascha Wildner }
35480387638SSascha Wildner
35580387638SSascha Wildner static struct tbl_cell *
cell_alloc(struct tbl_node * tbl,struct tbl_row * rp,enum tbl_cellt pos)35654ba9607SSascha Wildner cell_alloc(struct tbl_node *tbl, struct tbl_row *rp, enum tbl_cellt pos)
35780387638SSascha Wildner {
35880387638SSascha Wildner struct tbl_cell *p, *pp;
35980387638SSascha Wildner
36054ba9607SSascha Wildner p = mandoc_calloc(1, sizeof(*p));
36154ba9607SSascha Wildner p->spacing = SIZE_MAX;
362*99db7d0eSSascha Wildner p->font = ESCAPE_FONTROMAN;
36354ba9607SSascha Wildner p->pos = pos;
36480387638SSascha Wildner
36554ba9607SSascha Wildner if ((pp = rp->last) != NULL) {
366f88b6c16SFranco Fichtner pp->next = p;
36754ba9607SSascha Wildner p->col = pp->col + 1;
36854ba9607SSascha Wildner } else
369f88b6c16SFranco Fichtner rp->first = p;
37080387638SSascha Wildner rp->last = p;
37180387638SSascha Wildner
37254ba9607SSascha Wildner if (tbl->opts.cols <= p->col)
37354ba9607SSascha Wildner tbl->opts.cols = p->col + 1;
37480387638SSascha Wildner
37554ba9607SSascha Wildner return p;
37680387638SSascha Wildner }
377