1*893695ceSjsg /* $OpenBSD: fparseln.c,v 1.8 2023/01/04 13:00:11 jsg Exp $ */
203d4f44bSjakob /* $NetBSD: fparseln.c,v 1.7 1999/07/02 15:49:12 simonb Exp $ */
303d4f44bSjakob
403d4f44bSjakob /*
503d4f44bSjakob * Copyright (c) 1997 Christos Zoulas. All rights reserved.
603d4f44bSjakob *
703d4f44bSjakob * Redistribution and use in source and binary forms, with or without
803d4f44bSjakob * modification, are permitted provided that the following conditions
903d4f44bSjakob * are met:
1003d4f44bSjakob * 1. Redistributions of source code must retain the above copyright
1103d4f44bSjakob * notice, this list of conditions and the following disclaimer.
1203d4f44bSjakob * 2. Redistributions in binary form must reproduce the above copyright
1303d4f44bSjakob * notice, this list of conditions and the following disclaimer in the
1403d4f44bSjakob * documentation and/or other materials provided with the distribution.
1503d4f44bSjakob *
1603d4f44bSjakob * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
1703d4f44bSjakob * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
1803d4f44bSjakob * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
1903d4f44bSjakob * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
2003d4f44bSjakob * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
2103d4f44bSjakob * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
2203d4f44bSjakob * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
2303d4f44bSjakob * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
2403d4f44bSjakob * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
2503d4f44bSjakob * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
2603d4f44bSjakob */
2703d4f44bSjakob
2803d4f44bSjakob #include <stdio.h>
2903d4f44bSjakob #include <string.h>
3003d4f44bSjakob #include <stdlib.h>
3179822b59Smillert
3279822b59Smillert #include "util.h"
3303d4f44bSjakob
34c72b5b24Smillert static int isescaped(const char *, const char *, int);
3503d4f44bSjakob
3603d4f44bSjakob /* isescaped():
3703d4f44bSjakob * Return true if the character in *p that belongs to a string
3803d4f44bSjakob * that starts in *sp, is escaped by the escape character esc.
3903d4f44bSjakob */
4003d4f44bSjakob static int
isescaped(const char * sp,const char * p,int esc)411477552aSderaadt isescaped(const char *sp, const char *p, int esc)
4203d4f44bSjakob {
4303d4f44bSjakob const char *cp;
4403d4f44bSjakob size_t ne;
4503d4f44bSjakob
4603d4f44bSjakob /* No escape character */
4703d4f44bSjakob if (esc == '\0')
4803d4f44bSjakob return 1;
4903d4f44bSjakob
5003d4f44bSjakob /* Count the number of escape characters that precede ours */
5103d4f44bSjakob for (ne = 0, cp = p; --cp >= sp && *cp == esc; ne++)
5203d4f44bSjakob continue;
5303d4f44bSjakob
5403d4f44bSjakob /* Return true if odd number of escape characters */
5503d4f44bSjakob return (ne & 1) != 0;
5603d4f44bSjakob }
5703d4f44bSjakob
5803d4f44bSjakob
5903d4f44bSjakob /* fparseln():
6003d4f44bSjakob * Read a line from a file parsing continuations ending in \
6103d4f44bSjakob * and eliminating trailing newlines, or comments starting with
6203d4f44bSjakob * the comment char.
6303d4f44bSjakob */
6403d4f44bSjakob char *
fparseln(FILE * fp,size_t * size,size_t * lineno,const char str[3],int flags)651477552aSderaadt fparseln(FILE *fp, size_t *size, size_t *lineno, const char str[3],
661477552aSderaadt int flags)
6703d4f44bSjakob {
6803d4f44bSjakob static const char dstr[3] = { '\\', '\\', '#' };
691477552aSderaadt char *buf = NULL, *ptr, *cp, esc, con, nl, com;
701477552aSderaadt size_t s, len = 0;
711477552aSderaadt int cnt = 1;
7203d4f44bSjakob
7303d4f44bSjakob if (str == NULL)
7403d4f44bSjakob str = dstr;
7503d4f44bSjakob
7603d4f44bSjakob esc = str[0];
7703d4f44bSjakob con = str[1];
7803d4f44bSjakob com = str[2];
791477552aSderaadt
8003d4f44bSjakob /*
8103d4f44bSjakob * XXX: it would be cool to be able to specify the newline character,
8203d4f44bSjakob * but unfortunately, fgetln does not let us
8303d4f44bSjakob */
8403d4f44bSjakob nl = '\n';
8503d4f44bSjakob
8603d4f44bSjakob while (cnt) {
8703d4f44bSjakob cnt = 0;
8803d4f44bSjakob
8903d4f44bSjakob if (lineno)
9003d4f44bSjakob (*lineno)++;
9103d4f44bSjakob
9203d4f44bSjakob if ((ptr = fgetln(fp, &s)) == NULL)
9303d4f44bSjakob break;
9403d4f44bSjakob
9503d4f44bSjakob if (s && com) { /* Check and eliminate comments */
9603d4f44bSjakob for (cp = ptr; cp < ptr + s; cp++)
9703d4f44bSjakob if (*cp == com && !isescaped(ptr, cp, esc)) {
9803d4f44bSjakob s = cp - ptr;
9903d4f44bSjakob cnt = s == 0 && buf == NULL;
10003d4f44bSjakob break;
10103d4f44bSjakob }
10203d4f44bSjakob }
10303d4f44bSjakob
10403d4f44bSjakob if (s && nl) { /* Check and eliminate newlines */
10503d4f44bSjakob cp = &ptr[s - 1];
10603d4f44bSjakob
10703d4f44bSjakob if (*cp == nl)
10803d4f44bSjakob s--; /* forget newline */
10903d4f44bSjakob }
11003d4f44bSjakob
11103d4f44bSjakob if (s && con) { /* Check and eliminate continuations */
11203d4f44bSjakob cp = &ptr[s - 1];
11303d4f44bSjakob
11403d4f44bSjakob if (*cp == con && !isescaped(ptr, cp, esc)) {
11503d4f44bSjakob s--; /* forget escape */
11603d4f44bSjakob cnt = 1;
11703d4f44bSjakob }
11803d4f44bSjakob }
11903d4f44bSjakob
12003d4f44bSjakob if (s == 0 && buf != NULL)
12103d4f44bSjakob continue;
12203d4f44bSjakob
12303d4f44bSjakob if ((cp = realloc(buf, len + s + 1)) == NULL) {
12403d4f44bSjakob free(buf);
12503d4f44bSjakob return NULL;
12603d4f44bSjakob }
12703d4f44bSjakob buf = cp;
12803d4f44bSjakob
12903d4f44bSjakob (void) memcpy(buf + len, ptr, s);
13003d4f44bSjakob len += s;
13103d4f44bSjakob buf[len] = '\0';
13203d4f44bSjakob }
13303d4f44bSjakob
13403d4f44bSjakob if ((flags & FPARSELN_UNESCALL) != 0 && esc && buf != NULL &&
13503d4f44bSjakob strchr(buf, esc) != NULL) {
13603d4f44bSjakob ptr = cp = buf;
13703d4f44bSjakob while (cp[0] != '\0') {
13803d4f44bSjakob int skipesc;
13903d4f44bSjakob
14003d4f44bSjakob while (cp[0] != '\0' && cp[0] != esc)
14103d4f44bSjakob *ptr++ = *cp++;
14203d4f44bSjakob if (cp[0] == '\0' || cp[1] == '\0')
14303d4f44bSjakob break;
14403d4f44bSjakob
14503d4f44bSjakob skipesc = 0;
14603d4f44bSjakob if (cp[1] == com)
14703d4f44bSjakob skipesc += (flags & FPARSELN_UNESCCOMM);
14803d4f44bSjakob if (cp[1] == con)
14903d4f44bSjakob skipesc += (flags & FPARSELN_UNESCCONT);
15003d4f44bSjakob if (cp[1] == esc)
15103d4f44bSjakob skipesc += (flags & FPARSELN_UNESCESC);
15203d4f44bSjakob if (cp[1] != com && cp[1] != con && cp[1] != esc)
15303d4f44bSjakob skipesc = (flags & FPARSELN_UNESCREST);
15403d4f44bSjakob
15503d4f44bSjakob if (skipesc)
15603d4f44bSjakob cp++;
15703d4f44bSjakob else
15803d4f44bSjakob *ptr++ = *cp++;
15903d4f44bSjakob *ptr++ = *cp++;
16003d4f44bSjakob }
16103d4f44bSjakob *ptr = '\0';
16203d4f44bSjakob len = strlen(buf);
16303d4f44bSjakob }
16403d4f44bSjakob
16503d4f44bSjakob if (size)
16603d4f44bSjakob *size = len;
16703d4f44bSjakob return buf;
16803d4f44bSjakob }
16903d4f44bSjakob
17003d4f44bSjakob #ifdef TEST
17103d4f44bSjakob
172c72b5b24Smillert int main(int, char **);
17303d4f44bSjakob
17403d4f44bSjakob int
main(argc,argv)17503d4f44bSjakob main(argc, argv)
17603d4f44bSjakob int argc;
17703d4f44bSjakob char **argv;
17803d4f44bSjakob {
17903d4f44bSjakob char *ptr;
18003d4f44bSjakob size_t size, line;
18103d4f44bSjakob
18203d4f44bSjakob line = 0;
18303d4f44bSjakob while ((ptr = fparseln(stdin, &size, &line, NULL,
18403d4f44bSjakob FPARSELN_UNESCALL)) != NULL)
18503d4f44bSjakob printf("line %d (%d) |%s|\n", line, size, ptr);
18603d4f44bSjakob return 0;
18703d4f44bSjakob }
18803d4f44bSjakob
18903d4f44bSjakob /*
19003d4f44bSjakob
19103d4f44bSjakob # This is a test
19203d4f44bSjakob line 1
19303d4f44bSjakob line 2 \
19403d4f44bSjakob line 3 # Comment
19503d4f44bSjakob line 4 \# Not comment \\\\
19603d4f44bSjakob
19703d4f44bSjakob # And a comment \
19803d4f44bSjakob line 5 \\\
19903d4f44bSjakob line 6
20003d4f44bSjakob
20103d4f44bSjakob */
20203d4f44bSjakob
20303d4f44bSjakob #endif /* TEST */
204