First test with an external encoding.
[nvi.git] / ex / ex_global.c
blob2da556f06aeb21c8ec782ee1982cb094a9bbe80b
1 /*-
2 * Copyright (c) 1992, 1993, 1994
3 * The Regents of the University of California. All rights reserved.
4 * Copyright (c) 1992, 1993, 1994, 1995, 1996
5 * Keith Bostic. All rights reserved.
7 * See the LICENSE file for redistribution information.
8 */
10 #include "config.h"
12 #ifndef lint
13 static const char sccsid[] = "$Id: ex_global.c,v 10.28 2000/07/16 20:49:32 skimo Exp $ (Berkeley) $Date: 2000/07/16 20:49:32 $";
14 #endif /* not lint */
16 #include <sys/types.h>
17 #include <sys/queue.h>
19 #include <bitstring.h>
20 #include <ctype.h>
21 #include <errno.h>
22 #include <limits.h>
23 #include <stdio.h>
24 #include <stdlib.h>
25 #include <string.h>
26 #include <unistd.h>
28 #include "../common/common.h"
/*
 * Selects the sense of the match in ex_g_setup: GLOBAL keeps the lines
 * that match the pattern, V keeps the lines that do not.
 */
30 enum which {GLOBAL, V};
/* Shared implementation behind ex_global and ex_v. */
32 static int ex_g_setup __P((SCR *, EXCMD *, enum which));
35 * ex_global -- [line [,line]] g[lobal][!] /pattern/ [commands]
36 * Exec on lines matching a pattern.
38 * PUBLIC: int ex_global __P((SCR *, EXCMD *));
40 int
41 ex_global(sp, cmdp)
42 SCR *sp;
43 EXCMD *cmdp;
45 return (ex_g_setup(sp,
46 cmdp, FL_ISSET(cmdp->iflags, E_C_FORCE) ? V : GLOBAL));
50 * ex_v -- [line [,line]] v /pattern/ [commands]
51 * Exec on lines not matching a pattern.
53 * PUBLIC: int ex_v __P((SCR *, EXCMD *));
55 int
56 ex_v(sp, cmdp)
57 SCR *sp;
58 EXCMD *cmdp;
60 return (ex_g_setup(sp, cmdp, V));
64 * ex_g_setup --
65 * Ex global and v commands.
67 static int
68 ex_g_setup(sp, cmdp, cmd)
69 SCR *sp;
70 EXCMD *cmdp;
71 enum which cmd;
73 CHAR_T *ptrn, *p, *t;
74 EXCMD *ecp;
75 MARK abs;
76 RANGE *rp;
77 busy_t btype;
78 db_recno_t start, end;
79 regex_t *re;
80 regmatch_t match[1];
81 size_t len;
82 int cnt, delim, eval;
83 CHAR_T *dbp;
85 NEEDFILE(sp, cmdp);
87 if (F_ISSET(sp, SC_EX_GLOBAL)) {
88 msgq(sp, M_ERR,
89 "124|The %s command can't be used as part of a global or v command",
90 cmdp->cmd->name);
91 return (1);
95 * Skip leading white space. Historic vi allowed any non-alphanumeric
96 * to serve as the global command delimiter.
98 if (cmdp->argc == 0)
99 goto usage;
100 for (p = cmdp->argv[0]->bp; isblank(*p); ++p);
101 if (*p == '\0' || isalnum(*p) ||
102 *p == '\\' || *p == '|' || *p == '\n') {
103 usage: ex_emsg(sp, cmdp->cmd->usage, EXM_USAGE);
104 return (1);
106 delim = *p++;
109 * Get the pattern string, toss escaped characters.
111 * QUOTING NOTE:
112 * Only toss an escaped character if it escapes a delimiter.
114 for (ptrn = t = p;;) {
115 if (p[0] == '\0' || p[0] == delim) {
116 if (p[0] == delim)
117 ++p;
119 * !!!
120 * Nul terminate the pattern string -- it's passed
121 * to regcomp which doesn't understand anything else.
123 *t = '\0';
124 break;
126 if (p[0] == '\\')
127 if (p[1] == delim)
128 ++p;
129 else if (p[1] == '\\')
130 *t++ = *p++;
131 *t++ = *p++;
134 /* If the pattern string is empty, use the last one. */
135 if (*ptrn == '\0') {
136 if (sp->re == NULL) {
137 ex_emsg(sp, NULL, EXM_NOPREVRE);
138 return (1);
141 /* Re-compile the RE if necessary. */
142 if (!F_ISSET(sp, SC_RE_SEARCH) &&
143 re_compile(sp, sp->re, sp->re_len,
144 NULL, NULL, &sp->re_c, SEARCH_CSEARCH | SEARCH_MSG))
145 return (1);
146 } else {
147 /* Compile the RE. */
148 if (re_compile(sp, ptrn, t - ptrn, &sp->re,
149 &sp->re_len, &sp->re_c, SEARCH_CSEARCH | SEARCH_MSG))
150 return (1);
153 * Set saved RE. Historic practice is that globals set
154 * direction as well as the RE.
156 sp->searchdir = FORWARD;
158 re = &sp->re_c;
160 /* The global commands always set the previous context mark. */
161 abs.lno = sp->lno;
162 abs.cno = sp->cno;
163 if (mark_set(sp, ABSMARK1, &abs, 1))
164 return (1);
166 /* Get an EXCMD structure. */
167 CALLOC_RET(sp, ecp, EXCMD *, 1, sizeof(EXCMD));
168 CIRCLEQ_INIT(&ecp->rq);
171 * Get a copy of the command string; the default command is print.
172 * Don't worry about a set of <blank>s with no command, that will
173 * default to print in the ex parser. We need to have two copies
174 * because the ex parser may step on the command string when it's
175 * parsing it.
177 if ((len = cmdp->argv[0]->len - (p - cmdp->argv[0]->bp)) == 0) {
178 static CHAR_T pp[] = {'p', 'p', 0};
179 p = pp;
180 len = 1;
183 MALLOC_RET(sp, ecp->cp, CHAR_T *, (len * 2) * sizeof(CHAR_T));
184 ecp->o_cp = ecp->cp;
185 ecp->o_clen = len;
186 MEMCPYW(ecp->cp + len, p, len);
187 ecp->range_lno = OOBLNO;
188 FL_SET(ecp->agv_flags, cmd == GLOBAL ? AGV_GLOBAL : AGV_V);
189 LIST_INSERT_HEAD(&sp->wp->ecq, ecp, q);
192 * For each line... The semantics of global matching are that we first
193 * have to decide which lines are going to get passed to the command,
194 * and then pass them to the command, ignoring other changes. There's
195 * really no way to do this in a single pass, since arbitrary line
196 * creation, deletion and movement can be done in the ex command. For
197 * example, a good vi clone test is ":g/X/mo.-3", or "g/X/.,.+1d".
198 * What we do is create linked list of lines that are tracked through
199 * each ex command. There's a callback routine which the DB interface
200 * routines call when a line is created or deleted. This doesn't help
201 * the layering much.
203 btype = BUSY_ON;
204 cnt = INTERRUPT_CHECK;
205 for (start = cmdp->addr1.lno,
206 end = cmdp->addr2.lno; start <= end; ++start) {
207 if (cnt-- == 0) {
208 if (INTERRUPTED(sp)) {
209 LIST_REMOVE(ecp, q);
210 free(ecp->cp);
211 free(ecp);
212 break;
214 search_busy(sp, btype);
215 btype = BUSY_UPDATE;
216 cnt = INTERRUPT_CHECK;
218 if (db_get(sp, start, DBG_FATAL, &dbp, &len))
219 return (1);
220 match[0].rm_so = 0;
221 match[0].rm_eo = len;
222 switch (eval =
223 regexec(&sp->re_c, dbp, 0, match, REG_STARTEND)) {
224 case 0:
225 if (cmd == V)
226 continue;
227 break;
228 case REG_NOMATCH:
229 if (cmd == GLOBAL)
230 continue;
231 break;
232 default:
233 re_error(sp, eval, &sp->re_c);
234 break;
237 /* If follows the last entry, extend the last entry's range. */
238 if ((rp = ecp->rq.cqh_last) != (void *)&ecp->rq &&
239 rp->stop == start - 1) {
240 ++rp->stop;
241 continue;
244 /* Allocate a new range, and append it to the list. */
245 CALLOC(sp, rp, RANGE *, 1, sizeof(RANGE));
246 if (rp == NULL)
247 return (1);
248 rp->start = rp->stop = start;
249 CIRCLEQ_INSERT_TAIL(&ecp->rq, rp, q);
251 search_busy(sp, BUSY_OFF);
252 return (0);
256 * ex_g_insdel --
257 * Update the ranges based on an insertion or deletion.
259 * PUBLIC: int ex_g_insdel __P((SCR *, lnop_t, db_recno_t));
262 ex_g_insdel(sp, op, lno)
263 SCR *sp;
264 lnop_t op;
265 db_recno_t lno;
267 EXCMD *ecp;
268 RANGE *nrp, *rp;
270 /* All insert/append operations are done as inserts. */
271 if (op == LINE_APPEND)
272 abort();
274 if (op == LINE_RESET)
275 return (0);
277 for (ecp = sp->wp->ecq.lh_first; ecp != NULL; ecp = ecp->q.le_next) {
278 if (!FL_ISSET(ecp->agv_flags, AGV_AT | AGV_GLOBAL | AGV_V))
279 continue;
280 for (rp = ecp->rq.cqh_first; rp != (void *)&ecp->rq; rp = nrp) {
281 nrp = rp->q.cqe_next;
283 /* If range less than the line, ignore it. */
284 if (rp->stop < lno)
285 continue;
288 * If range greater than the line, decrement or
289 * increment the range.
291 if (rp->start > lno) {
292 if (op == LINE_DELETE) {
293 --rp->start;
294 --rp->stop;
295 } else {
296 ++rp->start;
297 ++rp->stop;
299 continue;
303 * Lno is inside the range, decrement the end point
304 * for deletion, and split the range for insertion.
305 * In the latter case, since we're inserting a new
306 * element, neither range can be exhausted.
308 if (op == LINE_DELETE) {
309 if (rp->start > --rp->stop) {
310 CIRCLEQ_REMOVE(&ecp->rq, rp, q);
311 free(rp);
313 } else {
314 CALLOC_RET(sp, nrp, RANGE *, 1, sizeof(RANGE));
315 nrp->start = lno + 1;
316 nrp->stop = rp->stop + 1;
317 rp->stop = lno - 1;
318 CIRCLEQ_INSERT_AFTER(&ecp->rq, rp, nrp, q);
319 rp = nrp;
324 * If the command deleted/inserted lines, the cursor moves to
325 * the line after the deleted/inserted line.
327 ecp->range_lno = lno;
329 return (0);