xref: /netbsd-src/external/bsd/nvi/dist/ex/ex_join.c (revision 7419ae3a042c9542a122772059cfe2b9f7b20546)
1 /*	$NetBSD: ex_join.c,v 1.5 2017/11/21 07:48:07 rin Exp $ */
2 /*-
3  * Copyright (c) 1992, 1993, 1994
4  *	The Regents of the University of California.  All rights reserved.
5  * Copyright (c) 1992, 1993, 1994, 1995, 1996
6  *	Keith Bostic.  All rights reserved.
7  *
8  * See the LICENSE file for redistribution information.
9  */
10 
11 #include "config.h"
12 
13 #include <sys/cdefs.h>
14 #if 0
15 #ifndef lint
16 static const char sccsid[] = "Id: ex_join.c,v 10.17 2004/03/16 14:14:04 skimo Exp  (Berkeley) Date: 2004/03/16 14:14:04 ";
17 #endif /* not lint */
18 #else
19 __RCSID("$NetBSD: ex_join.c,v 1.5 2017/11/21 07:48:07 rin Exp $");
20 #endif
21 
22 #include <sys/types.h>
23 #include <sys/queue.h>
24 
25 #include <bitstring.h>
26 #include <ctype.h>
27 #include <limits.h>
28 #include <stdio.h>
29 #include <stdlib.h>
30 #include <string.h>
31 
32 #include "../common/common.h"
33 
34 /*
35  * ex_join -- :[line [,line]] j[oin][!] [count] [flags]
36  *	Join lines.
37  *
38  * PUBLIC: int ex_join __P((SCR *, EXCMD *));
39  */
40 int
ex_join(SCR * sp,EXCMD * cmdp)41 ex_join(SCR *sp, EXCMD *cmdp)
42 {
43 	db_recno_t from, to;
44 	size_t blen, clen, len, tlen;
45 	int extra, first;
46 	ARG_CHAR_T echar = 0;
47 	CHAR_T *p, *bp, *tbp = NULL;
48 
49 	NEEDFILE(sp, cmdp);
50 
51 	from = cmdp->addr1.lno;
52 	to = cmdp->addr2.lno;
53 
54 	/* Check for no lines to join. */
55 	if (!db_exist(sp, from + 1)) {
56 		msgq(sp, M_ERR, "131|No following lines to join");
57 		return (1);
58 	}
59 
60 	GET_SPACE_RETW(sp, bp, blen, 256);
61 
62 	/*
63 	 * The count for the join command was off-by-one,
64 	 * historically, to other counts for other commands.
65 	 */
66 	if (F_ISSET(cmdp, E_ADDR_DEF) || cmdp->addrcnt == 1)
67 		++cmdp->addr2.lno;
68 
69 	clen = tlen = 0;
70         for (first = 1,
71 	    from = cmdp->addr1.lno, to = cmdp->addr2.lno; from <= to; ++from) {
72 		/*
73 		 * Get next line.  Historic versions of vi allowed "10J" while
74 		 * less than 10 lines from the end-of-file, so we do too.
75 		 */
76 		if (db_get(sp, from, 0, &p, &len)) {
77 			cmdp->addr2.lno = from - 1;
78 			break;
79 		}
80 
81 		/* Empty lines just go away. */
82 		if (len == 0)
83 			continue;
84 
85 		/*
86 		 * Get more space if necessary.  Note, tlen isn't the length
87 		 * of the new line, it's roughly the amount of space needed.
88 		 * tbp - bp is the length of the new line.
89 		 */
90 		tlen += len + 2;
91 		ADD_SPACE_RETW(sp, bp, blen, tlen);
92 		tbp = bp + clen;
93 
94 		/*
95 		 * Historic practice:
96 		 *
97 		 * If force specified, join without modification.
98 		 * If the current line ends with whitespace, strip leading
99 		 *    whitespace from the joined line.
100 		 * If the next line starts with a ), do nothing.
101 		 * If the current line ends with ., insert two spaces.
102 		 * Else, insert one space.
103 		 *
104 		 * One change -- add ? and ! to the list of characters for
105 		 * which we insert two spaces.  I expect that POSIX 1003.2
106 		 * will require this as well.
107 		 *
108 		 * Echar is the last character in the last line joined.
109 		 */
110 		extra = 0;
111 		if (!first && !FL_ISSET(cmdp->iflags, E_C_FORCE)) {
112 			/*
113 			 * Here we implement behavior just based on nvi-m17n.
114 			 *	last char	first char	behavior
115 			 *	---		---		---
116 			 *	multi-width	multi-width	nothing ins'ed
117 			 *	multi-width	single-width	1 spc ins'ed
118 			 *	single-width	multi-width	1 spc ins'ed
119 			 *	single-width	single-width	original
120 			 */
121 			if (ISMULTIWIDTH(sp, echar)) {
122 				if (ISMULTIWIDTH(sp, p[0])) {
123 					; /* nothing */
124 				} else {
125 					*tbp++ = ' ';
126 					++clen;
127 					for (; len && ISBLANK((UCHAR_T)*p);
128 					    --len, ++p);
129 				}
130 			} else if (ISMULTIWIDTH(sp, p[0])) {
131 				*tbp++ = ' ';
132 				++clen;
133 			} else if (ISBLANK(echar))
134 				for (; len && ISBLANK((UCHAR_T)*p); --len, ++p);
135 			else if (p[0] != ')') {
136 				if (STRCHR(L(".?!"), echar)) {
137 					*tbp++ = ' ';
138 					++clen;
139 					extra = 1;
140 				}
141 				*tbp++ = ' ';
142 				++clen;
143 				for (; len && ISBLANK((UCHAR_T)*p); --len, ++p);
144 			}
145 		}
146 
147 		if (len != 0) {
148 			MEMCPYW(tbp, p, len);
149 			tbp += len;
150 			clen += len;
151 			echar = p[len - 1];
152 		} else
153 			echar = ' ';
154 
155 		/*
156 		 * Historic practice for vi was to put the cursor at the first
157 		 * inserted whitespace character, if there was one, or the
158 		 * first character of the joined line, if there wasn't, or the
159 		 * last character of the line if joined to an empty line.  If
160 		 * a count was specified, the cursor was moved as described
161 		 * for the first line joined, ignoring subsequent lines.  If
162 		 * the join was a ':' command, the cursor was placed at the
163 		 * first non-blank character of the line unless the cursor was
164 		 * "attracted" to the end of line when the command was executed
165 		 * in which case it moved to the new end of line.  There are
166 		 * probably several more special cases, but frankly, my dear,
167 		 * I don't give a damn.  This implementation puts the cursor
168 		 * on the first inserted whitespace character, the first
169 		 * character of the joined line, or the last character of the
170 		 * line regardless.  Note, if the cursor isn't on the joined
171 		 * line (possible with : commands), it is reset to the starting
172 		 * line.
173 		 */
174 		if (first) {
175 			sp->cno = (tbp - bp) - (1 + extra);
176 			first = 0;
177 		} else
178 			sp->cno = (tbp - bp) - len - (1 + extra);
179 	}
180 	sp->lno = cmdp->addr1.lno;
181 
182 	/* Delete the joined lines. */
183         for (from = cmdp->addr1.lno, to = cmdp->addr2.lno; to > from; --to)
184 		if (db_delete(sp, to))
185 			goto err;
186 
187 	/* If the original line changed, reset it. */
188 	if (!first && db_set(sp, from, bp, tbp - bp)) {
189 err:		FREE_SPACEW(sp, bp, blen);
190 		return (1);
191 	}
192 	FREE_SPACEW(sp, bp, blen);
193 
194 	sp->rptlines[L_JOINED] += (cmdp->addr2.lno - cmdp->addr1.lno) + 1;
195 	return (0);
196 }
197