1 /* $Vendor-Id: man_validate.c,v 1.42 2010/05/25 12:44:53 kristaps Exp $ */ 2 /* 3 * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se> 4 * 5 * Permission to use, copy, modify, and distribute this software for any 6 * purpose with or without fee is hereby granted, provided that the above 7 * copyright notice and this permission notice appear in all copies. 8 * 9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES 10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF 11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR 12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES 13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN 14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF 15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. 16 */ 17 #ifdef HAVE_CONFIG_H 18 #include "config.h" 19 #endif 20 21 #include <sys/types.h> 22 23 #include <assert.h> 24 #include <ctype.h> 25 #include <errno.h> 26 #include <limits.h> 27 #include <stdarg.h> 28 #include <stdlib.h> 29 30 #include "mandoc.h" 31 #include "libman.h" 32 #include "libmandoc.h" 33 34 #define CHKARGS struct man *m, const struct man_node *n 35 36 typedef int (*v_check)(CHKARGS); 37 38 struct man_valid { 39 v_check *pres; 40 v_check *posts; 41 }; 42 43 static int check_bline(CHKARGS); 44 static int check_eq0(CHKARGS); 45 static int check_le1(CHKARGS); 46 static int check_ge2(CHKARGS); 47 static int check_le5(CHKARGS); 48 static int check_par(CHKARGS); 49 static int check_part(CHKARGS); 50 static int check_root(CHKARGS); 51 static int check_sec(CHKARGS); 52 static int check_text(CHKARGS); 53 static int check_title(CHKARGS); 54 55 static v_check posts_eq0[] = { check_eq0, NULL }; 56 static v_check posts_th[] = { check_ge2, check_le5, check_title, NULL }; 57 static v_check posts_par[] = { check_par, NULL }; 58 static v_check posts_part[] = { check_part, NULL }; 59 static v_check posts_sec[] = { check_sec, NULL }; 60 static v_check posts_le1[] = { check_le1, NULL }; 61 static v_check pres_bline[] = { check_bline, NULL }; 62 63 static const struct man_valid man_valids[MAN_MAX] = { 64 { NULL, posts_eq0 }, /* br */ 65 { pres_bline, posts_th }, /* TH */ 66 { pres_bline, posts_sec }, /* SH */ 67 { pres_bline, posts_sec }, /* SS */ 68 { pres_bline, posts_par }, /* TP */ 69 { pres_bline, posts_par }, /* LP */ 70 { pres_bline, posts_par }, /* PP */ 71 { pres_bline, posts_par }, /* P */ 72 { pres_bline, posts_par }, /* IP */ 73 { pres_bline, posts_par }, /* HP */ 74 { NULL, NULL }, /* SM */ 75 { NULL, NULL }, /* SB */ 76 { NULL, NULL }, /* BI */ 77 { NULL, NULL }, /* IB */ 78 { NULL, NULL }, /* BR */ 79 { NULL, NULL }, /* RB */ 80 { NULL, NULL }, /* R */ 81 { NULL, NULL }, /* B */ 82 { NULL, NULL }, /* I */ 83 { NULL, NULL }, /* IR */ 84 { NULL, NULL }, /* RI */ 85 { NULL, posts_eq0 }, /* na */ 86 { NULL, NULL }, /* i */ 87 { NULL, posts_le1 }, /* sp */ 88 { pres_bline, posts_eq0 }, /* nf */ 89 { pres_bline, posts_eq0 }, /* fi */ 90 { NULL, NULL }, /* r */ 91 { NULL, NULL }, /* RE */ 92 { NULL, posts_part }, /* RS */ 93 { NULL, NULL }, /* DT */ 94 { NULL, NULL }, /* UC */ 95 { NULL, NULL }, /* PD */ 96 { NULL, posts_le1 }, /* Sp */ 97 { pres_bline, posts_le1 }, /* Vb */ 98 { pres_bline, posts_eq0 }, /* Ve */ 99 { NULL, NULL }, /* AT */ 100 }; 101 102 103 int 104 man_valid_pre(struct man *m, const struct man_node *n) 105 { 106 v_check *cp; 107 108 if (MAN_TEXT == n->type) 109 return(1); 110 if (MAN_ROOT == n->type) 111 return(1); 112 113 if (NULL == (cp = man_valids[n->tok].pres)) 114 return(1); 115 for ( ; *cp; cp++) 116 if ( ! (*cp)(m, n)) 117 return(0); 118 return(1); 119 } 120 121 122 int 123 man_valid_post(struct man *m) 124 { 125 v_check *cp; 126 127 if (MAN_VALID & m->last->flags) 128 return(1); 129 m->last->flags |= MAN_VALID; 130 131 switch (m->last->type) { 132 case (MAN_TEXT): 133 return(check_text(m, m->last)); 134 case (MAN_ROOT): 135 return(check_root(m, m->last)); 136 default: 137 break; 138 } 139 140 if (NULL == (cp = man_valids[m->last->tok].posts)) 141 return(1); 142 for ( ; *cp; cp++) 143 if ( ! (*cp)(m, m->last)) 144 return(0); 145 146 return(1); 147 } 148 149 150 static int 151 check_root(CHKARGS) 152 { 153 154 if (MAN_BLINE & m->flags) 155 return(man_nmsg(m, n, MANDOCERR_SCOPEEXIT)); 156 if (MAN_ELINE & m->flags) 157 return(man_nmsg(m, n, MANDOCERR_SCOPEEXIT)); 158 159 m->flags &= ~MAN_BLINE; 160 m->flags &= ~MAN_ELINE; 161 162 if (NULL == m->first->child) { 163 man_nmsg(m, n, MANDOCERR_NODOCBODY); 164 return(0); 165 } else if (NULL == m->meta.title) { 166 if ( ! man_nmsg(m, n, MANDOCERR_NOTITLE)) 167 return(0); 168 /* 169 * If a title hasn't been set, do so now (by 170 * implication, date and section also aren't set). 171 * 172 * FIXME: this should be in man_action.c. 173 */ 174 m->meta.title = mandoc_strdup("unknown"); 175 m->meta.date = time(NULL); 176 m->meta.msec = mandoc_strdup("1"); 177 } 178 179 return(1); 180 } 181 182 183 static int 184 check_title(CHKARGS) 185 { 186 const char *p; 187 188 assert(n->child); 189 /* FIXME: is this sufficient? */ 190 if ('\0' == *n->child->string) { 191 man_nmsg(m, n, MANDOCERR_SYNTARGCOUNT); 192 return(0); 193 } 194 195 for (p = n->child->string; '\0' != *p; p++) 196 if (isalpha((u_char)*p) && ! isupper((u_char)*p)) 197 if ( ! man_nmsg(m, n, MANDOCERR_UPPERCASE)) 198 return(0); 199 200 return(1); 201 } 202 203 204 static int 205 check_text(CHKARGS) 206 { 207 const char *p; 208 int pos, c; 209 210 assert(n->string); 211 212 for (p = n->string, pos = n->pos + 1; *p; p++, pos++) { 213 if ('\\' == *p) { 214 c = mandoc_special(p); 215 if (c) { 216 p += c - 1; 217 pos += c - 1; 218 continue; 219 } 220 221 c = man_pmsg(m, n->line, pos, MANDOCERR_BADESCAPE); 222 if ( ! (MAN_IGN_ESCAPE & m->pflags) && ! c) 223 return(c); 224 } 225 226 if ('\t' == *p || isprint((u_char)*p) || ASCII_HYPH == *p) 227 continue; 228 if ( ! man_pmsg(m, n->line, pos, MANDOCERR_BADCHAR)) 229 return(0); 230 } 231 232 return(1); 233 } 234 235 236 #define INEQ_DEFINE(x, ineq, name) \ 237 static int \ 238 check_##name(CHKARGS) \ 239 { \ 240 if (n->nchild ineq (x)) \ 241 return(1); \ 242 man_vmsg(m, MANDOCERR_SYNTARGCOUNT, n->line, n->pos, \ 243 "line arguments %s %d (have %d)", \ 244 #ineq, (x), n->nchild); \ 245 return(0); \ 246 } 247 248 INEQ_DEFINE(0, ==, eq0) 249 INEQ_DEFINE(1, <=, le1) 250 INEQ_DEFINE(2, >=, ge2) 251 INEQ_DEFINE(5, <=, le5) 252 253 254 static int 255 check_sec(CHKARGS) 256 { 257 258 if (MAN_HEAD == n->type && 0 == n->nchild) { 259 man_nmsg(m, n, MANDOCERR_SYNTARGCOUNT); 260 return(0); 261 } else if (MAN_BODY == n->type && 0 == n->nchild) 262 return(man_nmsg(m, n, MANDOCERR_NOBODY)); 263 264 return(1); 265 } 266 267 268 static int 269 check_part(CHKARGS) 270 { 271 272 if (MAN_BODY == n->type && 0 == n->nchild) 273 return(man_nmsg(m, n, MANDOCERR_NOBODY)); 274 return(1); 275 } 276 277 278 static int 279 check_par(CHKARGS) 280 { 281 282 if (MAN_BODY == n->type) 283 switch (n->tok) { 284 case (MAN_IP): 285 /* FALLTHROUGH */ 286 case (MAN_HP): 287 /* FALLTHROUGH */ 288 case (MAN_TP): 289 /* Body-less lists are ok. */ 290 break; 291 default: 292 if (n->nchild) 293 break; 294 return(man_nmsg(m, n, MANDOCERR_NOBODY)); 295 } 296 if (MAN_HEAD == n->type) 297 switch (n->tok) { 298 case (MAN_PP): 299 /* FALLTHROUGH */ 300 case (MAN_P): 301 /* FALLTHROUGH */ 302 case (MAN_LP): 303 if (0 == n->nchild) 304 break; 305 return(man_nmsg(m, n, MANDOCERR_ARGSLOST)); 306 default: 307 if (n->nchild) 308 break; 309 return(man_nmsg(m, n, MANDOCERR_NOARGS)); 310 } 311 312 return(1); 313 } 314 315 316 static int 317 check_bline(CHKARGS) 318 { 319 320 assert( ! (MAN_ELINE & m->flags)); 321 if (MAN_BLINE & m->flags) { 322 man_nmsg(m, n, MANDOCERR_SYNTLINESCOPE); 323 return(0); 324 } 325 326 return(1); 327 } 328 329