13e12c5d1SDavid du Colombier #include <u.h>
23e12c5d1SDavid du Colombier #include <libc.h>
33e12c5d1SDavid du Colombier #include <bio.h>
43e12c5d1SDavid du Colombier #include <ctype.h>
53e12c5d1SDavid du Colombier
/*
 * fmt: block up paragraphs to a given line length,
 * possibly with extra indentation
 */
93e12c5d1SDavid du Colombier
103ff48bf5SDavid du Colombier int extraindent = 0; /* how many spaces to indent all lines */
113ff48bf5SDavid du Colombier int indent = 0; /* current value of indent, before extra indent */
123e12c5d1SDavid du Colombier int length = 70; /* how many columns per output line */
13117100efSDavid du Colombier int join = 1; /* can lines be joined? */
149a747e4fSDavid du Colombier int maxtab = 8;
153e12c5d1SDavid du Colombier Biobuf bin;
163e12c5d1SDavid du Colombier Biobuf bout;
173e12c5d1SDavid du Colombier
/*
 * One word of input.  A blank input line is recorded as a Word
 * with empty text and an indent of -1.
 */
typedef struct Word Word;
struct Word{
	int	bol;		/* non-zero if this word began its input line */
	int	indent;		/* indent of the word's input line, or -1 for a blank line */
	char	text[1];	/* NUL-terminated text; addword allocates room past the end */
};

/* format everything readable from bin onto bout */
void	fmt(void);
263ff48bf5SDavid du Colombier
273e12c5d1SDavid du Colombier void
usage(void)2859cc4ca5SDavid du Colombier usage(void)
2959cc4ca5SDavid du Colombier {
3059cc4ca5SDavid du Colombier fprint(2, "usage: %s [-j] [-i indent] [-l length] [file...]\n", argv0);
3159cc4ca5SDavid du Colombier exits("usage");
3259cc4ca5SDavid du Colombier }
3359cc4ca5SDavid du Colombier
3459cc4ca5SDavid du Colombier void
main(int argc,char ** argv)353e12c5d1SDavid du Colombier main(int argc, char **argv)
363e12c5d1SDavid du Colombier {
373e12c5d1SDavid du Colombier int i, f;
389a747e4fSDavid du Colombier char *s, *err;
399a747e4fSDavid du Colombier
403e12c5d1SDavid du Colombier ARGBEGIN{
413e12c5d1SDavid du Colombier case 'i':
423ff48bf5SDavid du Colombier extraindent = atoi(EARGF(usage()));
433e12c5d1SDavid du Colombier break;
44117100efSDavid du Colombier case 'j':
45117100efSDavid du Colombier join = 0;
46117100efSDavid du Colombier break;
473e12c5d1SDavid du Colombier case 'w':
483e12c5d1SDavid du Colombier case 'l':
4959cc4ca5SDavid du Colombier length = atoi(EARGF(usage()));
503e12c5d1SDavid du Colombier break;
513e12c5d1SDavid du Colombier default:
5259cc4ca5SDavid du Colombier usage();
533e12c5d1SDavid du Colombier }ARGEND
549a747e4fSDavid du Colombier
553e12c5d1SDavid du Colombier if(length <= indent){
563e12c5d1SDavid du Colombier fprint(2, "%s: line length<=indentation\n", argv0);
573e12c5d1SDavid du Colombier exits("length");
583e12c5d1SDavid du Colombier }
599a747e4fSDavid du Colombier
609a747e4fSDavid du Colombier s=getenv("tabstop");
619a747e4fSDavid du Colombier if(s!=nil && atoi(s)>0)
629a747e4fSDavid du Colombier maxtab=atoi(s);
639a747e4fSDavid du Colombier err = nil;
643e12c5d1SDavid du Colombier Binit(&bout, 1, OWRITE);
653e12c5d1SDavid du Colombier if(argc <= 0){
663e12c5d1SDavid du Colombier Binit(&bin, 0, OREAD);
673ff48bf5SDavid du Colombier fmt();
683e12c5d1SDavid du Colombier }else{
693e12c5d1SDavid du Colombier for(i=0; i<argc; i++){
703e12c5d1SDavid du Colombier f = open(argv[i], OREAD);
719a747e4fSDavid du Colombier if(f < 0){
729a747e4fSDavid du Colombier fprint(2, "%s: can't open %s: %r\n", argv0, argv[i]);
739a747e4fSDavid du Colombier err = "open";
749a747e4fSDavid du Colombier }else{
753e12c5d1SDavid du Colombier Binit(&bin, f, OREAD);
763ff48bf5SDavid du Colombier fmt();
77219b2ee8SDavid du Colombier Bterm(&bin);
783e12c5d1SDavid du Colombier if(i != argc-1)
793e12c5d1SDavid du Colombier Bputc(&bout, '\n');
803e12c5d1SDavid du Colombier }
813e12c5d1SDavid du Colombier }
823e12c5d1SDavid du Colombier }
839a747e4fSDavid du Colombier exits(err);
843e12c5d1SDavid du Colombier }
859a747e4fSDavid du Colombier
869a747e4fSDavid du Colombier int
indentof(char ** linep)873ff48bf5SDavid du Colombier indentof(char **linep)
889a747e4fSDavid du Colombier {
893ff48bf5SDavid du Colombier int i, ind;
903ff48bf5SDavid du Colombier char *line;
913e12c5d1SDavid du Colombier
923ff48bf5SDavid du Colombier ind = 0;
933ff48bf5SDavid du Colombier line = *linep;
943ff48bf5SDavid du Colombier for(i=0; line[i]; i++)
953ff48bf5SDavid du Colombier switch(line[i]){
963ff48bf5SDavid du Colombier default:
973ff48bf5SDavid du Colombier *linep = line;
983ff48bf5SDavid du Colombier return ind;
993e12c5d1SDavid du Colombier case ' ':
1003ff48bf5SDavid du Colombier ind++;
1013ff48bf5SDavid du Colombier break;
1023e12c5d1SDavid du Colombier case '\t':
1033ff48bf5SDavid du Colombier ind += maxtab;
1043ff48bf5SDavid du Colombier ind -= ind%maxtab;
1059a747e4fSDavid du Colombier break;
1063e12c5d1SDavid du Colombier }
1073ff48bf5SDavid du Colombier
1083ff48bf5SDavid du Colombier /* plain white space doesn't change the indent */
1093ff48bf5SDavid du Colombier *linep = "";
1103ff48bf5SDavid du Colombier return indent;
1113ff48bf5SDavid du Colombier }
1123ff48bf5SDavid du Colombier
1133ff48bf5SDavid du Colombier Word**
addword(Word ** words,int * nwordp,char * s,int l,int indent,int bol)114117100efSDavid du Colombier addword(Word **words, int *nwordp, char *s, int l, int indent, int bol)
1153ff48bf5SDavid du Colombier {
1163ff48bf5SDavid du Colombier Word *w;
1173ff48bf5SDavid du Colombier
1183ff48bf5SDavid du Colombier w = malloc(sizeof(Word)+l+1);
1193ff48bf5SDavid du Colombier memmove(w->text, s, l);
1203ff48bf5SDavid du Colombier w->text[l] = '\0';
1213ff48bf5SDavid du Colombier w->indent = indent;
122117100efSDavid du Colombier w->bol = bol;
1233ff48bf5SDavid du Colombier words = realloc(words, (*nwordp+1)*sizeof(Word*));
1243ff48bf5SDavid du Colombier words[(*nwordp)++] = w;
1253ff48bf5SDavid du Colombier return words;
1263ff48bf5SDavid du Colombier }
1273ff48bf5SDavid du Colombier
1283ff48bf5SDavid du Colombier Word**
parseline(char * line,Word ** words,int * nwordp)1293ff48bf5SDavid du Colombier parseline(char *line, Word **words, int *nwordp)
1303ff48bf5SDavid du Colombier {
131117100efSDavid du Colombier int ind, l, bol;
1323ff48bf5SDavid du Colombier
1333ff48bf5SDavid du Colombier ind = indentof(&line);
1343ff48bf5SDavid du Colombier indent = ind;
135117100efSDavid du Colombier bol = 1;
1363ff48bf5SDavid du Colombier for(;;){
1373ff48bf5SDavid du Colombier /* find next word */
1383ff48bf5SDavid du Colombier while(*line==' ' || *line=='\t')
1393ff48bf5SDavid du Colombier line++;
1403ff48bf5SDavid du Colombier if(*line == '\0'){
141117100efSDavid du Colombier if(bol)
142117100efSDavid du Colombier return addword(words, nwordp, "", 0, -1, bol);
1433e12c5d1SDavid du Colombier break;
1449a747e4fSDavid du Colombier }
1453ff48bf5SDavid du Colombier /* how long is this word? */
1463ff48bf5SDavid du Colombier for(l=0; line[l]; l++)
1473ff48bf5SDavid du Colombier if(line[l]==' ' || line[l]=='\t')
1483ff48bf5SDavid du Colombier break;
149117100efSDavid du Colombier words = addword(words, nwordp, line, l, indent, bol);
150117100efSDavid du Colombier bol = 0;
1513ff48bf5SDavid du Colombier line += l;
1529a747e4fSDavid du Colombier }
1533ff48bf5SDavid du Colombier return words;
1543e12c5d1SDavid du Colombier }
1553e12c5d1SDavid du Colombier
1563e12c5d1SDavid du Colombier void
printindent(int w)1573ff48bf5SDavid du Colombier printindent(int w)
1583e12c5d1SDavid du Colombier {
1593ff48bf5SDavid du Colombier while(w >= maxtab){
1603e12c5d1SDavid du Colombier Bputc(&bout, '\t');
1613ff48bf5SDavid du Colombier w -= maxtab;
1623e12c5d1SDavid du Colombier }
1633ff48bf5SDavid du Colombier while(w > 0){
1643e12c5d1SDavid du Colombier Bputc(&bout, ' ');
1653ff48bf5SDavid du Colombier w--;
1663e12c5d1SDavid du Colombier }
1673e12c5d1SDavid du Colombier }
1689a747e4fSDavid du Colombier
/*
 * Return the number of spaces to put after word s: 2 if it ends
 * in '.', '!' or '?', otherwise 1.  Words shorter than 2 bytes,
 * and words shorter than 4 bytes that start with an upper-case
 * letter (e.g. "Mr."), always get 1.
 */
int
nspaceafter(char *s)
{
	int n;

	n = strlen(s);
	if(n < 2)
		return 1;
	/*
	 * the cast keeps bytes >= 0x80 (e.g. UTF-8 lead bytes) from
	 * reaching isupper as negative values where char is signed
	 */
	if(n < 4 && isupper((unsigned char)s[0]))
		return 1;
	if(strchr(".!?", s[n-1]))
		return 2;
	return 1;
}
1843ff48bf5SDavid du Colombier
1853ff48bf5SDavid du Colombier
1863e12c5d1SDavid du Colombier void
printwords(Word ** w,int nw)1873ff48bf5SDavid du Colombier printwords(Word **w, int nw)
1889a747e4fSDavid du Colombier {
189117100efSDavid du Colombier int i, j, n, col, nsp;
1903ff48bf5SDavid du Colombier
1913ff48bf5SDavid du Colombier /* one output line per loop */
1923ff48bf5SDavid du Colombier for(i=0; i<nw; ){
1933ff48bf5SDavid du Colombier /* if it's a blank line, print it */
1943ff48bf5SDavid du Colombier if(w[i]->indent == -1){
1953e12c5d1SDavid du Colombier Bputc(&bout, '\n');
1963ff48bf5SDavid du Colombier if(++i == nw) /* out of words */
1973ff48bf5SDavid du Colombier break;
1983e12c5d1SDavid du Colombier }
1993ff48bf5SDavid du Colombier /* emit leading indent */
2003ff48bf5SDavid du Colombier col = extraindent+w[i]->indent;
2013ff48bf5SDavid du Colombier printindent(col);
2023ff48bf5SDavid du Colombier /* emit words until overflow; always emit at least one word */
203117100efSDavid du Colombier for(n=0;; n++){
2043ff48bf5SDavid du Colombier Bprint(&bout, "%s", w[i]->text);
205b280a0acSDavid du Colombier col += utflen(w[i]->text);
2063ff48bf5SDavid du Colombier if(++i == nw)
2073ff48bf5SDavid du Colombier break; /* out of words */
2083ff48bf5SDavid du Colombier if(w[i]->indent != w[i-1]->indent)
2093ff48bf5SDavid du Colombier break; /* indent change */
2103ff48bf5SDavid du Colombier nsp = nspaceafter(w[i-1]->text);
211b280a0acSDavid du Colombier if(col+nsp+utflen(w[i]->text) > extraindent+length)
2123ff48bf5SDavid du Colombier break; /* fold line */
213*2282df4eSDavid du Colombier if(!join && w[i]->bol)
214117100efSDavid du Colombier break;
2153ff48bf5SDavid du Colombier for(j=0; j<nsp; j++)
2163ff48bf5SDavid du Colombier Bputc(&bout, ' '); /* emit space; another word will follow */
2173ff48bf5SDavid du Colombier col += nsp;
2183ff48bf5SDavid du Colombier }
2193ff48bf5SDavid du Colombier /* emit newline */
2203ff48bf5SDavid du Colombier Bputc(&bout, '\n');
2213ff48bf5SDavid du Colombier }
2223ff48bf5SDavid du Colombier }
2233ff48bf5SDavid du Colombier
2249a747e4fSDavid du Colombier void
fmt(void)2253ff48bf5SDavid du Colombier fmt(void)
2269a747e4fSDavid du Colombier {
2273ff48bf5SDavid du Colombier char *s;
2283ff48bf5SDavid du Colombier int i, nw;
2293ff48bf5SDavid du Colombier Word **w;
2303ff48bf5SDavid du Colombier
2313ff48bf5SDavid du Colombier nw = 0;
2323ff48bf5SDavid du Colombier w = nil;
2333ff48bf5SDavid du Colombier while((s = Brdstr(&bin, '\n', 1)) != nil){
2343ff48bf5SDavid du Colombier w = parseline(s, w, &nw);
2353ff48bf5SDavid du Colombier free(s);
2363ff48bf5SDavid du Colombier }
2373ff48bf5SDavid du Colombier printwords(w, nw);
2383ff48bf5SDavid du Colombier for(i=0; i<nw; i++)
2393ff48bf5SDavid du Colombier free(w[i]);
2403ff48bf5SDavid du Colombier free(w);
2413e12c5d1SDavid du Colombier }
242