xref: /dragonfly/contrib/nvi2/vi/v_search.c (revision 07bc39c2f4bbca56f12568e06d89da17f2eeb965)
1 /*-
2  * Copyright (c) 1992, 1993, 1994
3  *        The Regents of the University of California.  All rights reserved.
4  * Copyright (c) 1992, 1993, 1994, 1995, 1996
5  *        Keith Bostic.  All rights reserved.
6  *
7  * See the LICENSE file for redistribution information.
8  */
9 
10 #include "config.h"
11 
12 #include <sys/types.h>
13 #include <sys/queue.h>
14 #include <sys/time.h>
15 
16 #include <bitstring.h>
17 #include <ctype.h>
18 #include <errno.h>
19 #include <limits.h>
20 #include <stdio.h>
21 #include <stdlib.h>
22 #include <string.h>
23 
24 #include "../common/common.h"
25 #include "vi.h"
26 
27 static int v_exaddr(SCR *, VICMD *, dir_t);
28 static int v_search(SCR *, VICMD *, CHAR_T *, size_t, u_int, dir_t);
29 
30 /*
31  * v_srch -- [count]?RE[? offset]
32  *        Ex address search backward.
33  *
34  * PUBLIC: int v_searchb(SCR *, VICMD *);
35  */
36 int
v_searchb(SCR * sp,VICMD * vp)37 v_searchb(SCR *sp, VICMD *vp)
38 {
39           return (v_exaddr(sp, vp, BACKWARD));
40 }
41 
42 /*
43  * v_searchf -- [count]/RE[/ offset]
44  *        Ex address search forward.
45  *
46  * PUBLIC: int v_searchf(SCR *, VICMD *);
47  */
48 int
v_searchf(SCR * sp,VICMD * vp)49 v_searchf(SCR *sp, VICMD *vp)
50 {
51           return (v_exaddr(sp, vp, FORWARD));
52 }
53 
54 /*
55  * v_exaddr --
56  *        Do a vi search (which is really an ex address).
57  */
58 static int
v_exaddr(SCR * sp,VICMD * vp,dir_t dir)59 v_exaddr(SCR *sp, VICMD *vp, dir_t dir)
60 {
61           static EXCMDLIST fake = { L("search") };
62           EXCMD *cmdp;
63           GS *gp;
64           TEXT *tp;
65           recno_t s_lno;
66           size_t len, s_cno, tlen;
67           int err, nb, type;
68           char buf[20];
69           CHAR_T *cmd, *t;
70           CHAR_T *w;
71           size_t wlen;
72 
73           /*
74            * !!!
75            * If using the search command as a motion, any addressing components
76            * are lost, i.e. y/ptrn/+2, when repeated, is the same as y/ptrn/.
77            */
78           if (F_ISSET(vp, VC_ISDOT))
79                     return (v_search(sp, vp,
80                         NULL, 0, SEARCH_PARSE | SEARCH_MSG | SEARCH_SET, dir));
81 
82           /* Get the search pattern. */
83           if (v_tcmd(sp, vp, dir == BACKWARD ? CH_BSEARCH : CH_FSEARCH,
84               TXT_BS | TXT_CR | TXT_ESCAPE | TXT_PROMPT |
85               (O_ISSET(sp, O_SEARCHINCR) ? TXT_SEARCHINCR : 0)))
86                     return (1);
87 
88           tp = TAILQ_FIRST(sp->tiq);
89 
90           /* If the user backspaced over the prompt, do nothing. */
91           if (tp->term == TERM_BS)
92                     return (1);
93 
94           /*
95            * If the user was doing an incremental search, then we've already
96            * updated the cursor and moved to the right location.  Return the
97            * correct values, we're done.
98            */
99           if (tp->term == TERM_SEARCH) {
100                     vp->m_stop.lno = sp->lno;
101                     vp->m_stop.cno = sp->cno;
102                     if (ISMOTION(vp))
103                               return (v_correct(sp, vp, 0));
104                     vp->m_final = vp->m_stop;
105                     return (0);
106           }
107 
108           /*
109            * If the user entered <escape> or <carriage-return>, the length is
110            * 1 and the right thing will happen, i.e. the prompt will be used
111            * as a command character.
112            *
113            * Build a fake ex command structure.
114            */
115           gp = sp->gp;
116           gp->excmd.cp = tp->lb;
117           gp->excmd.clen = tp->len;
118           F_INIT(&gp->excmd, E_VISEARCH);
119 
120           /*
121            * XXX
122            * Warn if the search wraps.  This is a pretty special case, but it's
123            * nice feature that wasn't in the original implementations of ex/vi.
124            * (It was added at some point to System V's version.)  This message
125            * is only displayed if there are no keys in the queue. The problem is
126            * the command is going to succeed, and the message is informational,
127            * not an error.  If a macro displays it repeatedly, e.g., the pattern
128            * only occurs once in the file and wrapscan is set, you lose big.  For
129            * example, if the macro does something like:
130            *
131            *        :map K /pattern/^MjK
132            *
133            * Each search will display the message, but the following "/pattern/"
134            * will immediately overwrite it, with strange results.  The System V
135            * vi displays the "wrapped" message multiple times, but because it's
136            * overwritten each time, it's not as noticeable.  As we don't discard
137            * messages, it's a real problem for us.
138            */
139           if (!KEYS_WAITING(sp))
140                     F_SET(&gp->excmd, E_SEARCH_WMSG);
141 
142           /* Save the current line/column. */
143           s_lno = sp->lno;
144           s_cno = sp->cno;
145 
146           /*
147            * !!!
148            * Historically, vi / and ? commands were full-blown ex addresses,
149            * including ';' delimiters, trailing <blank>'s, multiple search
150            * strings (separated by semi-colons) and, finally, full-blown z
151            * commands after the / and ? search strings.  (If the search was
152            * being used as a motion, the trailing z command was ignored.
153            * Also, we do some argument checking on the z command, to be sure
154            * that it's not some other random command.) For multiple search
155            * strings, leading <blank>'s at the second and subsequent strings
156            * were eaten as well.  This has some (unintended?) side-effects:
157            * the command /ptrn/;3 is legal and results in moving to line 3.
158            * I suppose you could use it to optionally move to line 3...
159            *
160            * !!!
161            * Historically, if any part of the search command failed, the cursor
162            * remained unmodified (even if ; was used).  We have to play games
163            * because the underlying ex parser thinks we're modifying the cursor
164            * as we go, but I think we're compatible with historic practice.
165            *
166            * !!!
167            * Historically, the command "/STRING/;   " failed, apparently it
168            * confused the parser.  We're not that compatible.
169            */
170           cmdp = &gp->excmd;
171           if (ex_range(sp, cmdp, &err))
172                     return (1);
173 
174           /*
175            * Remember where any remaining command information is, and clean
176            * up the fake ex command.
177            */
178           cmd = cmdp->cp;
179           len = cmdp->clen;
180           gp->excmd.clen = 0;
181 
182           if (err)
183                     goto err2;
184 
185           /* Copy out the new cursor position and make sure it's okay. */
186           switch (cmdp->addrcnt) {
187           case 1:
188                     vp->m_stop = cmdp->addr1;
189                     break;
190           case 2:
191                     vp->m_stop = cmdp->addr2;
192                     break;
193           }
194           if (!db_exist(sp, vp->m_stop.lno)) {
195                     ex_badaddr(sp, &fake,
196                         vp->m_stop.lno == 0 ? A_ZERO : A_EOF, NUM_OK);
197                     goto err2;
198           }
199 
200           /*
201            * !!!
202            * Historic practice is that a trailing 'z' was ignored if it was a
203            * motion command.  Should probably be an error, but not worth the
204            * effort.
205            */
206           if (ISMOTION(vp))
207                     return (v_correct(sp, vp, F_ISSET(cmdp, E_DELTA)));
208 
209           /*
210            * !!!
211            * Historically, if it wasn't a motion command, a delta in the search
212            * pattern turns it into a first nonblank movement.
213            */
214           nb = F_ISSET(cmdp, E_DELTA);
215 
216           /* Check for the 'z' command. */
217           if (len != 0) {
218                     if (*cmd != 'z')
219                               goto err1;
220 
221                     /* No blanks, just like the z command. */
222                     for (t = cmd + 1, tlen = len - 1; tlen > 0; ++t, --tlen)
223                               if (!isdigit(*t))
224                                         break;
225                     if (tlen &&
226                         (*t == '-' || *t == '.' || *t == '+' || *t == '^')) {
227                               ++t;
228                               --tlen;
229                               type = 1;
230                     } else
231                               type = 0;
232                     if (tlen)
233                               goto err1;
234 
235                     /* The z command will do the nonblank for us. */
236                     nb = 0;
237 
238                     /* Default to z+. */
239                     if (!type &&
240                         v_event_push(sp, NULL, L("+"), 1, CH_NOMAP | CH_QUOTED))
241                               return (1);
242 
243                     /* Push the user's command. */
244                     if (v_event_push(sp, NULL, cmd, len, CH_NOMAP | CH_QUOTED))
245                               return (1);
246 
247                     /* Push line number so get correct z display. */
248                     tlen = snprintf(buf,
249                         sizeof(buf), "%lu", (u_long)vp->m_stop.lno);
250                     CHAR2INT(sp, buf, tlen, w, wlen);
251                     if (v_event_push(sp, NULL, w, wlen, CH_NOMAP | CH_QUOTED))
252                               return (1);
253 
254                     /* Don't refresh until after 'z' happens. */
255                     F_SET(VIP(sp), VIP_S_REFRESH);
256           }
257 
258           /* Non-motion commands move to the end of the range. */
259           vp->m_final = vp->m_stop;
260           if (nb) {
261                     F_CLR(vp, VM_RCM_MASK);
262                     F_SET(vp, VM_RCM_SETFNB);
263           }
264           return (0);
265 
266 err1:     msgq(sp, M_ERR,
267               "188|Characters after search string, line offset and/or z command");
268 err2:     vp->m_final.lno = s_lno;
269           vp->m_final.cno = s_cno;
270           return (1);
271 }
272 
273 /*
274  * v_searchN -- N
275  *        Reverse last search.
276  *
277  * PUBLIC: int v_searchN(SCR *, VICMD *);
278  */
279 int
v_searchN(SCR * sp,VICMD * vp)280 v_searchN(SCR *sp, VICMD *vp)
281 {
282           dir_t dir;
283 
284           switch (sp->searchdir) {
285           case BACKWARD:
286                     dir = FORWARD;
287                     break;
288           case FORWARD:
289                     dir = BACKWARD;
290                     break;
291           default:
292                     dir = sp->searchdir;
293                     break;
294           }
295           return (v_search(sp, vp, NULL, 0, SEARCH_PARSE, dir));
296 }
297 
298 /*
299  * v_searchn -- n
300  *        Repeat last search.
301  *
302  * PUBLIC: int v_searchn(SCR *, VICMD *);
303  */
304 int
v_searchn(SCR * sp,VICMD * vp)305 v_searchn(SCR *sp, VICMD *vp)
306 {
307           return (v_search(sp, vp, NULL, 0, SEARCH_PARSE, sp->searchdir));
308 }
309 
310 /*
311  * is_special --
312  *        Test if the character is special in a basic RE.
313  */
314 static int
is_special(CHAR_T c)315 is_special(CHAR_T c)
316 {
317           /*
318            * !!!
319            * `*' and `$' are ordinary when appear at the beginning of a RE,
320            * but it's safe to distinguish them from the ordinary characters.
321            * The tilde is vi-specific, of course.
322            */
323           return (STRCHR(L(".[*\\^$~"), c) && c);
324 }
325 
326 /*
327  * Rear delimiter for word search when the keyword ends in
328  * (i.e., consists of) a non-word character.  See v_searchw below.
329  */
330 #define RE_NWSTOP   L("([^[:alnum:]_]|$)")
331 #define RE_NWSTOP_LEN         (SIZE(RE_NWSTOP) - 1)
332 
333 /*
334  * v_searchw -- [count]^A
335  *        Search for the word under the cursor.
336  *
337  * PUBLIC: int v_searchw(SCR *, VICMD *);
338  */
339 int
v_searchw(SCR * sp,VICMD * vp)340 v_searchw(SCR *sp, VICMD *vp)
341 {
342           size_t blen, len;
343           int rval;
344           CHAR_T *bp, *p;
345 
346           /* An upper bound for the SIZE of the RE under construction. */
347           len = VIP(sp)->klen + MAX(RE_WSTART_LEN, 1)
348               + MAX(RE_WSTOP_LEN, RE_NWSTOP_LEN);
349           GET_SPACE_RETW(sp, bp, blen, len);
350           p = bp;
351 
352           /* Only the first character can be non-word, see v_curword. */
353           if (inword(VIP(sp)->keyw[0])) {
354                     MEMCPY(p, RE_WSTART, RE_WSTART_LEN);
355                     p += RE_WSTART_LEN;
356           } else if (is_special(VIP(sp)->keyw[0])) {
357                     MEMCPY(p, L("\\"), 1);
358                     p += 1;
359           }
360 
361           MEMCPY(p, VIP(sp)->keyw, VIP(sp)->klen);
362           p += VIP(sp)->klen;
363 
364           if (inword(p[-1])) {
365                     MEMCPY(p, RE_WSTOP, RE_WSTOP_LEN);
366                     p += RE_WSTOP_LEN;
367           } else {
368                     /*
369                      * The keyword is a single non-word character.
370                      * We want it to stay the same when typing ^A several times
371                      * in a row, just the way the other cases behave.
372                      */
373                     MEMCPY(p, RE_NWSTOP, RE_NWSTOP_LEN);
374                     p += RE_NWSTOP_LEN;
375           }
376 
377           len = p - bp;
378           rval = v_search(sp, vp, bp, len, SEARCH_SET, FORWARD);
379 
380           FREE_SPACEW(sp, bp, blen);
381           return (rval);
382 }
383 
384 /*
385  * v_search --
386  *        The search commands.
387  */
388 static int
v_search(SCR * sp,VICMD * vp,CHAR_T * ptrn,size_t plen,u_int flags,dir_t dir)389 v_search(SCR *sp, VICMD *vp, CHAR_T *ptrn, size_t plen, u_int flags, dir_t dir)
390 {
391           /* Display messages. */
392           LF_SET(SEARCH_MSG);
393 
394           /* If it's a motion search, offset past end-of-line is okay. */
395           if (ISMOTION(vp))
396                     LF_SET(SEARCH_EOL);
397 
398           /*
399            * XXX
400            * Warn if the search wraps.  See the comment above, in v_exaddr().
401            */
402           if (!KEYS_WAITING(sp))
403                     LF_SET(SEARCH_WMSG);
404 
405           switch (dir) {
406           case BACKWARD:
407                     if (b_search(sp,
408                         &vp->m_start, &vp->m_stop, ptrn, plen, NULL, flags))
409                               return (1);
410                     break;
411           case FORWARD:
412                     if (f_search(sp,
413                         &vp->m_start, &vp->m_stop, ptrn, plen, NULL, flags))
414                               return (1);
415                     break;
416           case NOTSET:
417                     msgq(sp, M_ERR, "189|No previous search pattern");
418                     return (1);
419           default:
420                     abort();
421           }
422 
423           /* Correct motion commands, otherwise, simply move to the location. */
424           if (ISMOTION(vp)) {
425                     if (v_correct(sp, vp, 0))
426                               return(1);
427           } else
428                     vp->m_final = vp->m_stop;
429           return (0);
430 }
431 
432 /*
433  * v_correct --
434  *        Handle command with a search as the motion.
435  *
436  * !!!
437  * Historically, commands didn't affect the line searched to/from if the
438  * motion command was a search and the final position was the start/end
439  * of the line.  There were some special cases and vi was not consistent;
440  * it was fairly easy to confuse it.  For example, given the two lines:
441  *
442  *        abcdefghi
443  *        ABCDEFGHI
444  *
445  * placing the cursor on the 'A' and doing y?$ would so confuse it that 'h'
446  * 'k' and put would no longer work correctly.  In any case, we try to do
447  * the right thing, but it's not going to exactly match historic practice.
448  *
449  * PUBLIC: int v_correct(SCR *, VICMD *, int);
450  */
451 int
v_correct(SCR * sp,VICMD * vp,int isdelta)452 v_correct(SCR *sp, VICMD *vp, int isdelta)
453 {
454           dir_t dir;
455           MARK m;
456           size_t len;
457 
458           /*
459            * !!!
460            * We may have wrapped if wrapscan was set, and we may have returned
461            * to the position where the cursor started.  Historic vi didn't cope
462            * with this well.  Yank wouldn't beep, but the first put after the
463            * yank would move the cursor right one column (without adding any
464            * text) and the second would put a copy of the current line.  The
465            * change and delete commands would beep, but would leave the cursor
466            * on the colon command line.  I believe that there are macros that
467            * depend on delete, at least, failing.  For now, commands that use
468            * search as a motion component fail when the search returns to the
469            * original cursor position.
470            */
471           if (vp->m_start.lno == vp->m_stop.lno &&
472               vp->m_start.cno == vp->m_stop.cno) {
473                     msgq(sp, M_BERR, "190|Search wrapped to original position");
474                     return (1);
475           }
476 
477           /*
478            * !!!
479            * Searches become line mode operations if there was a delta specified
480            * to the search pattern.
481            */
482           if (isdelta)
483                     F_SET(vp, VM_LMODE);
484 
485           /*
486            * If the motion is in the reverse direction, switch the start and
487            * stop MARK's so that it's in a forward direction.  (There's no
488            * reason for this other than to make the tests below easier.  The
489            * code in vi.c:vi() would have done the switch.)  Both forward
490            * and backward motions can happen for any kind of search command
491            * because of the wrapscan option.
492            */
493           if (vp->m_start.lno > vp->m_stop.lno ||
494               (vp->m_start.lno == vp->m_stop.lno &&
495               vp->m_start.cno > vp->m_stop.cno)) {
496                     m = vp->m_start;
497                     vp->m_start = vp->m_stop;
498                     vp->m_stop = m;
499                     dir = BACKWARD;
500           } else
501                     dir = FORWARD;
502 
503           /*
504            * BACKWARD:
505            *        Delete and yank commands move to the end of the range.
506            *        Ignore others.
507            *
508            * FORWARD:
509            *        Delete and yank commands don't move.  Ignore others.
510            */
511           vp->m_final = vp->m_start;
512 
513           /*
514            * !!!
515            * Delta'd searches don't correct based on column positions.
516            */
517           if (isdelta)
518                     return (0);
519 
520           /*
521            * !!!
522            * Backward searches starting at column 0, and forward searches ending
523            * at column 0 are corrected to the last column of the previous line.
524            * Otherwise, adjust the starting/ending point to the character before
525            * the current one (this is safe because we know the search had to move
526            * to succeed).
527            *
528            * Searches become line mode operations if they start at the first
529            * nonblank and end at column 0 of another line.
530            */
531           if (vp->m_start.lno < vp->m_stop.lno && vp->m_stop.cno == 0) {
532                     if (db_get(sp, --vp->m_stop.lno, DBG_FATAL, NULL, &len))
533                               return (1);
534                     vp->m_stop.cno = len ? len - 1 : 0;
535                     len = 0;
536                     if (nonblank(sp, vp->m_start.lno, &len))
537                               return (1);
538                     if (vp->m_start.cno <= len)
539                               F_SET(vp, VM_LMODE);
540           } else
541                     --vp->m_stop.cno;
542 
543           return (0);
544 }
545