1 /*
2 * Copyright (C) 1984-2017 Mark Nudelman
3 *
4 * You may distribute under the terms of either the GNU General Public
5 * License or the Less License, as specified in the README file.
6 *
7 * For more information, see the README file.
8 */
9
10
11 /*
12 * Routines to search a file for a pattern.
13 */
14
15 #include "less.h"
16 #include "position.h"
17 #include "charset.h"
18
19 #define MINPOS(a,b) (((a) < (b)) ? (a) : (b))
20 #define MAXPOS(a,b) (((a) > (b)) ? (a) : (b))
21
22 extern int sigs;
23 extern int how_search;
24 extern int caseless;
25 extern int linenums;
26 extern int sc_height;
27 extern int jump_sline;
28 extern int bs_mode;
29 extern int ctldisp;
30 extern int status_col;
31 extern void *ml_search;
32 extern POSITION start_attnpos;
33 extern POSITION end_attnpos;
34 extern int utf_mode;
35 extern int screen_trashed;
36 #if HILITE_SEARCH
37 extern int hilite_search;
38 extern int size_linebuf;
39 extern int squished;
40 extern int can_goto_line;
41 static int hide_hilite;
42 static POSITION prep_startpos;
43 static POSITION prep_endpos;
44 static int is_caseless;
45 static int is_ucase_pattern;
46
47 /*
48 * Structures for maintaining a set of ranges for hilites and filtered-out
49 * lines. Each range is stored as a node within a red-black tree, and we
50 * try to extend existing ranges (without creating overlaps) rather than
51 * create new nodes if possible. We remember the last node found by a
52 * search for constant-time lookup if the next search is near enough to
53 * the previous. To aid that, we overlay a secondary doubly-linked list
54 * on top of the red-black tree so we can find the preceding/succeeding
55 * nodes also in constant time.
56 *
57 * Each node is allocated from a series of pools, each pool double the size
58 * of the previous (for amortised constant time allocation). Since our only
59 * tree operations are clear and node insertion, not node removal, we don't
60 * need to maintain a usage bitmap or freelist and can just return nodes
61 * from the pool in-order until capacity is reached.
62 */
63 struct hilite
64 {
65 POSITION hl_startpos;
66 POSITION hl_endpos;
67 };
68 struct hilite_node
69 {
70 struct hilite_node *parent;
71 struct hilite_node *left;
72 struct hilite_node *right;
73 struct hilite_node *prev;
74 struct hilite_node *next;
75 int red;
76 struct hilite r;
77 };
78 struct hilite_storage
79 {
80 int capacity;
81 int used;
82 struct hilite_storage *next;
83 struct hilite_node *nodes;
84 };
85 struct hilite_tree
86 {
87 struct hilite_storage *first;
88 struct hilite_storage *current;
89 struct hilite_node *root;
90 struct hilite_node *lookaside;
91 };
92 #define HILITE_INITIALIZER() { NULL, NULL, NULL, NULL }
93 #define HILITE_LOOKASIDE_STEPS 2
94
95 static struct hilite_tree hilite_anchor = HILITE_INITIALIZER();
96 static struct hilite_tree filter_anchor = HILITE_INITIALIZER();
97
98 #endif
99
100 /*
101 * These are the static variables that represent the "remembered"
102 * search pattern and filter pattern.
103 */
104 struct pattern_info {
105 PATTERN_TYPE compiled;
106 char* text;
107 int search_type;
108 };
109
110 #if NO_REGEX
111 #define info_compiled(info) ((void*)0)
112 #else
113 #define info_compiled(info) ((info)->compiled)
114 #endif
115
116 static struct pattern_info search_info;
117 static struct pattern_info filter_info;
118
119 /*
120 * Are there any uppercase letters in this string?
121 */
122 static int
is_ucase(str)123 is_ucase(str)
124 char *str;
125 {
126 char *str_end = str + strlen(str);
127 LWCHAR ch;
128
129 while (str < str_end)
130 {
131 ch = step_char(&str, +1, str_end);
132 if (IS_UPPER(ch))
133 return (1);
134 }
135 return (0);
136 }
137
138 /*
139 * Compile and save a search pattern.
140 */
141 static int
set_pattern(info,pattern,search_type)142 set_pattern(info, pattern, search_type)
143 struct pattern_info *info;
144 char *pattern;
145 int search_type;
146 {
147 #if !NO_REGEX
148 if (pattern == NULL)
149 CLEAR_PATTERN(info->compiled);
150 else if (compile_pattern(pattern, search_type, &info->compiled) < 0)
151 return -1;
152 #endif
153 /* Pattern compiled successfully; save the text too. */
154 if (info->text != NULL)
155 free(info->text);
156 info->text = NULL;
157 if (pattern != NULL)
158 {
159 info->text = (char *) ecalloc(1, strlen(pattern)+1);
160 strcpy(info->text, pattern);
161 }
162 info->search_type = search_type;
163
164 /*
165 * Ignore case if -I is set OR
166 * -i is set AND the pattern is all lowercase.
167 */
168 is_ucase_pattern = is_ucase(pattern);
169 if (is_ucase_pattern && caseless != OPT_ONPLUS)
170 is_caseless = 0;
171 else
172 is_caseless = caseless;
173 return 0;
174 }
175
176 /*
177 * Discard a saved pattern.
178 */
179 static void
clear_pattern(info)180 clear_pattern(info)
181 struct pattern_info *info;
182 {
183 if (info->text != NULL)
184 free(info->text);
185 info->text = NULL;
186 #if !NO_REGEX
187 uncompile_pattern(&info->compiled);
188 #endif
189 }
190
191 /*
192 * Initialize saved pattern to nothing.
193 */
194 static void
init_pattern(info)195 init_pattern(info)
196 struct pattern_info *info;
197 {
198 CLEAR_PATTERN(info->compiled);
199 info->text = NULL;
200 info->search_type = 0;
201 }
202
203 /*
204 * Initialize search variables.
205 */
206 public void
init_search()207 init_search()
208 {
209 init_pattern(&search_info);
210 init_pattern(&filter_info);
211 }
212
213 /*
214 * Determine which text conversions to perform before pattern matching.
215 */
216 static int
get_cvt_ops()217 get_cvt_ops()
218 {
219 int ops = 0;
220 if (is_caseless || bs_mode == BS_SPECIAL)
221 {
222 if (is_caseless)
223 ops |= CVT_TO_LC;
224 if (bs_mode == BS_SPECIAL)
225 ops |= CVT_BS;
226 if (bs_mode != BS_CONTROL)
227 ops |= CVT_CRLF;
228 } else if (bs_mode != BS_CONTROL)
229 {
230 ops |= CVT_CRLF;
231 }
232 if (ctldisp == OPT_ONPLUS)
233 ops |= CVT_ANSI;
234 return (ops);
235 }
236
237 /*
238 * Is there a previous (remembered) search pattern?
239 */
240 static int
prev_pattern(info)241 prev_pattern(info)
242 struct pattern_info *info;
243 {
244 #if !NO_REGEX
245 if ((info->search_type & SRCH_NO_REGEX) == 0)
246 return (!is_null_pattern(info->compiled));
247 #endif
248 return (info->text != NULL);
249 }
250
251 #if HILITE_SEARCH
252 /*
253 * Repaint the hilites currently displayed on the screen.
254 * Repaint each line which contains highlighted text.
255 * If on==0, force all hilites off.
256 */
257 public void
repaint_hilite(on)258 repaint_hilite(on)
259 int on;
260 {
261 int sindex;
262 POSITION pos;
263 int save_hide_hilite;
264
265 if (squished)
266 repaint();
267
268 save_hide_hilite = hide_hilite;
269 if (!on)
270 {
271 if (hide_hilite)
272 return;
273 hide_hilite = 1;
274 }
275
276 if (!can_goto_line)
277 {
278 repaint();
279 hide_hilite = save_hide_hilite;
280 return;
281 }
282
283 for (sindex = TOP; sindex < TOP + sc_height-1; sindex++)
284 {
285 pos = position(sindex);
286 if (pos == NULL_POSITION)
287 continue;
288 (void) forw_line(pos);
289 goto_line(sindex);
290 put_line();
291 }
292 lower_left();
293 hide_hilite = save_hide_hilite;
294 }
295
296 /*
297 * Clear the attn hilite.
298 */
299 public void
clear_attn()300 clear_attn()
301 {
302 int sindex;
303 POSITION old_start_attnpos;
304 POSITION old_end_attnpos;
305 POSITION pos;
306 POSITION epos;
307 int moved = 0;
308
309 if (start_attnpos == NULL_POSITION)
310 return;
311 old_start_attnpos = start_attnpos;
312 old_end_attnpos = end_attnpos;
313 start_attnpos = end_attnpos = NULL_POSITION;
314
315 if (!can_goto_line)
316 {
317 repaint();
318 return;
319 }
320 if (squished)
321 repaint();
322
323 for (sindex = TOP; sindex < TOP + sc_height-1; sindex++)
324 {
325 pos = position(sindex);
326 if (pos == NULL_POSITION)
327 continue;
328 epos = position(sindex+1);
329 if (pos <= old_end_attnpos &&
330 (epos == NULL_POSITION || epos > old_start_attnpos))
331 {
332 (void) forw_line(pos);
333 goto_line(sindex);
334 put_line();
335 moved = 1;
336 }
337 }
338 if (moved)
339 lower_left();
340 }
341 #endif
342
343 /*
344 * Hide search string highlighting.
345 */
346 public void
undo_search()347 undo_search()
348 {
349 if (!prev_pattern(&search_info))
350 {
351 if (hilite_anchor.first == NULL)
352 {
353 error("No previous regular expression", NULL_PARG);
354 return;
355 }
356 clr_hilite(); /* Next time, hilite_anchor.first will be NULL. */
357 }
358 clear_pattern(&search_info);
359 #if HILITE_SEARCH
360 hide_hilite = !hide_hilite;
361 repaint_hilite(1);
362 #endif
363 }
364
365 #if HILITE_SEARCH
366 /*
367 * Clear the hilite list.
368 */
369 public void
clr_hlist(anchor)370 clr_hlist(anchor)
371 struct hilite_tree *anchor;
372 {
373 struct hilite_storage *hls;
374 struct hilite_storage *nexthls;
375
376 for (hls = anchor->first; hls != NULL; hls = nexthls)
377 {
378 nexthls = hls->next;
379 free((void*)hls->nodes);
380 free((void*)hls);
381 }
382 anchor->first = NULL;
383 anchor->current = NULL;
384 anchor->root = NULL;
385
386 anchor->lookaside = NULL;
387
388 prep_startpos = prep_endpos = NULL_POSITION;
389 }
390
391 public void
clr_hilite()392 clr_hilite()
393 {
394 clr_hlist(&hilite_anchor);
395 }
396
397 public void
clr_filter()398 clr_filter()
399 {
400 clr_hlist(&filter_anchor);
401 }
402
403 struct hilite_node*
hlist_last(anchor)404 hlist_last(anchor)
405 struct hilite_tree *anchor;
406 {
407 struct hilite_node *n = anchor->root;
408 while (n != NULL && n->right != NULL)
409 n = n->right;
410 return n;
411 }
412
413 struct hilite_node*
hlist_next(n)414 hlist_next(n)
415 struct hilite_node *n;
416 {
417 return n->next;
418 }
419
420 struct hilite_node*
hlist_prev(n)421 hlist_prev(n)
422 struct hilite_node *n;
423 {
424 return n->prev;
425 }
426
427 /*
428 * Find the node covering pos, or the node after it if no node covers it,
429 * or return NULL if pos is after the last range. Remember the found node,
430 * to speed up subsequent searches for the same or similar positions (if
431 * we return NULL, remember the last node.)
432 */
433 struct hilite_node*
hlist_find(anchor,pos)434 hlist_find(anchor, pos)
435 struct hilite_tree *anchor;
436 POSITION pos;
437 {
438 struct hilite_node *n, *m;
439
440 if (anchor->lookaside)
441 {
442 int steps = 0;
443 int hit = 0;
444
445 n = anchor->lookaside;
446
447 for (;;)
448 {
449 if (pos < n->r.hl_endpos)
450 {
451 if (n->prev == NULL || pos >= n->prev->r.hl_endpos)
452 {
453 hit = 1;
454 break;
455 }
456 } else if (n->next == NULL)
457 {
458 n = NULL;
459 hit = 1;
460 break;
461 }
462
463 /*
464 * If we don't find the right node within a small
465 * distance, don't keep doing a linear search!
466 */
467 if (steps >= HILITE_LOOKASIDE_STEPS)
468 break;
469 steps++;
470
471 if (pos < n->r.hl_endpos)
472 anchor->lookaside = n = n->prev;
473 else
474 anchor->lookaside = n = n->next;
475 }
476
477 if (hit)
478 return n;
479 }
480
481 n = anchor->root;
482 m = NULL;
483
484 while (n != NULL)
485 {
486 if (pos < n->r.hl_startpos)
487 {
488 if (n->left != NULL)
489 {
490 m = n;
491 n = n->left;
492 continue;
493 }
494 break;
495 }
496 if (pos >= n->r.hl_endpos)
497 {
498 if (n->right != NULL)
499 {
500 n = n->right;
501 continue;
502 }
503 if (m != NULL)
504 {
505 n = m;
506 } else
507 {
508 m = n;
509 n = NULL;
510 }
511 }
512 break;
513 }
514
515 if (n != NULL)
516 anchor->lookaside = n;
517 else if (m != NULL)
518 anchor->lookaside = m;
519
520 return n;
521 }
522
523 /*
524 * Should any characters in a specified range be highlighted?
525 */
526 static int
is_hilited_range(pos,epos)527 is_hilited_range(pos, epos)
528 POSITION pos;
529 POSITION epos;
530 {
531 struct hilite_node *n = hlist_find(&hilite_anchor, pos);
532 return (n != NULL && (epos == NULL_POSITION || epos > n->r.hl_startpos));
533 }
534
535 /*
536 * Is a line "filtered" -- that is, should it be hidden?
537 */
538 public int
is_filtered(pos)539 is_filtered(pos)
540 POSITION pos;
541 {
542 struct hilite_node *n;
543
544 if (ch_getflags() & CH_HELPFILE)
545 return (0);
546
547 n = hlist_find(&filter_anchor, pos);
548 return (n != NULL && pos >= n->r.hl_startpos);
549 }
550
551 /*
552 * If pos is hidden, return the next position which isn't, otherwise
553 * just return pos.
554 */
555 public POSITION
next_unfiltered(pos)556 next_unfiltered(pos)
557 POSITION pos;
558 {
559 struct hilite_node *n;
560
561 if (ch_getflags() & CH_HELPFILE)
562 return (pos);
563
564 n = hlist_find(&filter_anchor, pos);
565 while (n != NULL && pos >= n->r.hl_startpos)
566 {
567 pos = n->r.hl_endpos;
568 n = n->next;
569 }
570 return (pos);
571 }
572
573 /*
574 * If pos is hidden, return the previous position which isn't or 0 if
575 * we're filtered right to the beginning, otherwise just return pos.
576 */
577 public POSITION
prev_unfiltered(pos)578 prev_unfiltered(pos)
579 POSITION pos;
580 {
581 struct hilite_node *n;
582
583 if (ch_getflags() & CH_HELPFILE)
584 return (pos);
585
586 n = hlist_find(&filter_anchor, pos);
587 while (n != NULL && pos >= n->r.hl_startpos)
588 {
589 pos = n->r.hl_startpos;
590 if (pos == 0)
591 break;
592 pos--;
593 n = n->prev;
594 }
595 return (pos);
596 }
597
598
599 /*
600 * Should any characters in a specified range be highlighted?
601 * If nohide is nonzero, don't consider hide_hilite.
602 */
603 public int
is_hilited(pos,epos,nohide,p_matches)604 is_hilited(pos, epos, nohide, p_matches)
605 POSITION pos;
606 POSITION epos;
607 int nohide;
608 int *p_matches;
609 {
610 int match;
611
612 if (p_matches != NULL)
613 *p_matches = 0;
614
615 if (!status_col &&
616 start_attnpos != NULL_POSITION &&
617 pos < end_attnpos &&
618 (epos == NULL_POSITION || epos > start_attnpos))
619 /*
620 * The attn line overlaps this range.
621 */
622 return (1);
623
624 match = is_hilited_range(pos, epos);
625 if (!match)
626 return (0);
627
628 if (p_matches == NULL)
629 /*
630 * Kinda kludgy way to recognize that caller is checking for
631 * hilite in status column. In this case we want to return
632 * hilite status even if hiliting is disabled or hidden.
633 */
634 return (1);
635
636 /*
637 * Report matches, even if we're hiding highlights.
638 */
639 *p_matches = 1;
640
641 if (hilite_search == 0)
642 /*
643 * Not doing highlighting.
644 */
645 return (0);
646
647 if (!nohide && hide_hilite)
648 /*
649 * Highlighting is hidden.
650 */
651 return (0);
652
653 return (1);
654 }
655
656 /*
657 * Tree node storage: get the current block of nodes if it has spare
658 * capacity, or create a new one if not.
659 */
660 static struct hilite_storage*
hlist_getstorage(anchor)661 hlist_getstorage(anchor)
662 struct hilite_tree *anchor;
663 {
664 int capacity = 1;
665 struct hilite_storage *s;
666
667 if (anchor->current)
668 {
669 if (anchor->current->used < anchor->current->capacity)
670 return anchor->current;
671 capacity = anchor->current->capacity * 2;
672 }
673
674 s = (struct hilite_storage *) ecalloc(1, sizeof(struct hilite_storage));
675 s->nodes = (struct hilite_node *) ecalloc(capacity, sizeof(struct hilite_node));
676 s->capacity = capacity;
677 s->used = 0;
678 s->next = NULL;
679 if (anchor->current)
680 anchor->current->next = s;
681 else
682 anchor->first = s;
683 anchor->current = s;
684 return s;
685 }
686
687 /*
688 * Tree node storage: retrieve a new empty node to be inserted into the
689 * tree.
690 */
691 static struct hilite_node*
hlist_getnode(anchor)692 hlist_getnode(anchor)
693 struct hilite_tree *anchor;
694 {
695 struct hilite_storage *s = hlist_getstorage(anchor);
696 return &s->nodes[s->used++];
697 }
698
699 /*
700 * Rotate the tree left around a pivot node.
701 */
702 static void
hlist_rotate_left(anchor,n)703 hlist_rotate_left(anchor, n)
704 struct hilite_tree *anchor;
705 struct hilite_node *n;
706 {
707 struct hilite_node *np = n->parent;
708 struct hilite_node *nr = n->right;
709 struct hilite_node *nrl = n->right->left;
710
711 if (np != NULL)
712 {
713 if (n == np->left)
714 np->left = nr;
715 else
716 np->right = nr;
717 } else
718 {
719 anchor->root = nr;
720 }
721 nr->left = n;
722 n->right = nrl;
723
724 nr->parent = np;
725 n->parent = nr;
726 if (nrl != NULL)
727 nrl->parent = n;
728 }
729
730 /*
731 * Rotate the tree right around a pivot node.
732 */
733 static void
hlist_rotate_right(anchor,n)734 hlist_rotate_right(anchor, n)
735 struct hilite_tree *anchor;
736 struct hilite_node *n;
737 {
738 struct hilite_node *np = n->parent;
739 struct hilite_node *nl = n->left;
740 struct hilite_node *nlr = n->left->right;
741
742 if (np != NULL)
743 {
744 if (n == np->right)
745 np->right = nl;
746 else
747 np->left = nl;
748 } else
749 {
750 anchor->root = nl;
751 }
752 nl->right = n;
753 n->left = nlr;
754
755 nl->parent = np;
756 n->parent = nl;
757 if (nlr != NULL)
758 nlr->parent = n;
759 }
760
761
762 /*
763 * Add a new hilite to a hilite list.
764 */
765 static void
add_hilite(anchor,hl)766 add_hilite(anchor, hl)
767 struct hilite_tree *anchor;
768 struct hilite *hl;
769 {
770 struct hilite_node *p, *n, *u;
771
772 /* Ignore empty ranges. */
773 if (hl->hl_startpos >= hl->hl_endpos)
774 return;
775
776 p = anchor->root;
777
778 /* Inserting the very first node is trivial. */
779 if (p == NULL)
780 {
781 n = hlist_getnode(anchor);
782 n->r = *hl;
783 anchor->root = n;
784 anchor->lookaside = n;
785 return;
786 }
787
788 /*
789 * Find our insertion point. If we come across any overlapping
790 * or adjoining existing ranges, shrink our range and discard
791 * if it become empty.
792 */
793 for (;;)
794 {
795 if (hl->hl_startpos < p->r.hl_startpos)
796 {
797 if (hl->hl_endpos > p->r.hl_startpos)
798 hl->hl_endpos = p->r.hl_startpos;
799 if (p->left != NULL)
800 {
801 p = p->left;
802 continue;
803 }
804 break;
805 }
806 if (hl->hl_startpos < p->r.hl_endpos) {
807 hl->hl_startpos = p->r.hl_endpos;
808 if (hl->hl_startpos >= hl->hl_endpos)
809 return;
810 }
811 if (p->right != NULL)
812 {
813 p = p->right;
814 continue;
815 }
816 break;
817 }
818
819 /*
820 * Now we're at the right leaf, again check for contiguous ranges
821 * and extend the existing node if possible to avoid the
822 * insertion. Otherwise insert a new node at the leaf.
823 */
824 if (hl->hl_startpos < p->r.hl_startpos) {
825 if (hl->hl_endpos == p->r.hl_startpos)
826 {
827 p->r.hl_startpos = hl->hl_startpos;
828 return;
829 }
830 if (p->prev != NULL && p->prev->r.hl_endpos == hl->hl_startpos)
831 {
832 p->prev->r.hl_endpos = hl->hl_endpos;
833 return;
834 }
835
836 p->left = n = hlist_getnode(anchor);
837 n->next = p;
838 if (p->prev != NULL)
839 {
840 n->prev = p->prev;
841 p->prev->next = n;
842 }
843 p->prev = n;
844 } else {
845 if (p->r.hl_endpos == hl->hl_startpos)
846 {
847 p->r.hl_endpos = hl->hl_endpos;
848 return;
849 }
850 if (p->next != NULL && hl->hl_endpos == p->next->r.hl_startpos) {
851 p->next->r.hl_startpos = hl->hl_startpos;
852 return;
853 }
854
855 p->right = n = hlist_getnode(anchor);
856 n->prev = p;
857 if (p->next != NULL)
858 {
859 n->next = p->next;
860 p->next->prev = n;
861 }
862 p->next = n;
863 }
864 n->parent = p;
865 n->red = 1;
866 n->r = *hl;
867
868 /*
869 * The tree is in the correct order and covers the right ranges
870 * now, but may have become unbalanced. Rebalance it using the
871 * standard red-black tree constraints and operations.
872 */
873 for (;;)
874 {
875 /* case 1 - current is root, root is always black */
876 if (n->parent == NULL)
877 {
878 n->red = 0;
879 break;
880 }
881
882 /* case 2 - parent is black, we can always be red */
883 if (!n->parent->red)
884 break;
885
886 /*
887 * constraint: because the root must be black, if our
888 * parent is red it cannot be the root therefore we must
889 * have a grandparent
890 */
891
892 /*
893 * case 3 - parent and uncle are red, repaint them black,
894 * the grandparent red, and start again at the grandparent.
895 */
896 u = n->parent->parent->left;
897 if (n->parent == u)
898 u = n->parent->parent->right;
899 if (u != NULL && u->red)
900 {
901 n->parent->red = 0;
902 u->red = 0;
903 n = n->parent->parent;
904 n->red = 1;
905 continue;
906 }
907
908 /*
909 * case 4 - parent is red but uncle is black, parent and
910 * grandparent on opposite sides. We need to start
911 * changing the structure now. This and case 5 will shorten
912 * our branch and lengthen the sibling, between them
913 * restoring balance.
914 */
915 if (n == n->parent->right &&
916 n->parent == n->parent->parent->left)
917 {
918 hlist_rotate_left(anchor, n->parent);
919 n = n->left;
920 } else if (n == n->parent->left &&
921 n->parent == n->parent->parent->right)
922 {
923 hlist_rotate_right(anchor, n->parent);
924 n = n->right;
925 }
926
927 /*
928 * case 5 - parent is red but uncle is black, parent and
929 * grandparent on same side
930 */
931 n->parent->red = 0;
932 n->parent->parent->red = 1;
933 if (n == n->parent->left)
934 hlist_rotate_right(anchor, n->parent->parent);
935 else
936 hlist_rotate_left(anchor, n->parent->parent);
937 break;
938 }
939 }
940
941 /*
942 * Hilight every character in a range of displayed characters.
943 */
944 static void
create_hilites(linepos,start_index,end_index,chpos)945 create_hilites(linepos, start_index, end_index, chpos)
946 POSITION linepos;
947 int start_index;
948 int end_index;
949 int *chpos;
950 {
951 struct hilite hl;
952 int i;
953
954 /* Start the first hilite. */
955 hl.hl_startpos = linepos + chpos[start_index];
956
957 /*
958 * Step through the displayed chars.
959 * If the source position (before cvt) of the char is one more
960 * than the source pos of the previous char (the usual case),
961 * just increase the size of the current hilite by one.
962 * Otherwise (there are backspaces or something involved),
963 * finish the current hilite and start a new one.
964 */
965 for (i = start_index+1; i <= end_index; i++)
966 {
967 if (chpos[i] != chpos[i-1] + 1 || i == end_index)
968 {
969 hl.hl_endpos = linepos + chpos[i-1] + 1;
970 add_hilite(&hilite_anchor, &hl);
971 /* Start new hilite unless this is the last char. */
972 if (i < end_index)
973 {
974 hl.hl_startpos = linepos + chpos[i];
975 }
976 }
977 }
978 }
979
980 /*
981 * Make a hilite for each string in a physical line which matches
982 * the current pattern.
983 * sp,ep delimit the first match already found.
984 */
985 static void
hilite_line(linepos,line,line_len,chpos,sp,ep,cvt_ops)986 hilite_line(linepos, line, line_len, chpos, sp, ep, cvt_ops)
987 POSITION linepos;
988 char *line;
989 int line_len;
990 int *chpos;
991 char *sp;
992 char *ep;
993 int cvt_ops;
994 {
995 char *searchp;
996 char *line_end = line + line_len;
997
998 /*
999 * sp and ep delimit the first match in the line.
1000 * Mark the corresponding file positions, then
1001 * look for further matches and mark them.
1002 * {{ This technique, of calling match_pattern on subsequent
1003 * substrings of the line, may mark more than is correct
1004 * if the pattern starts with "^". This bug is fixed
1005 * for those regex functions that accept a notbol parameter
1006 * (currently POSIX, PCRE and V8-with-regexec2). }}
1007 */
1008 searchp = line;
1009 do {
1010 if (sp == NULL || ep == NULL)
1011 return;
1012 create_hilites(linepos, sp-line, ep-line, chpos);
1013 /*
1014 * If we matched more than zero characters,
1015 * move to the first char after the string we matched.
1016 * If we matched zero, just move to the next char.
1017 */
1018 if (ep > searchp)
1019 searchp = ep;
1020 else if (searchp != line_end)
1021 searchp++;
1022 else /* end of line */
1023 break;
1024 } while (match_pattern(info_compiled(&search_info), search_info.text,
1025 searchp, line_end - searchp, &sp, &ep, 1, search_info.search_type));
1026 }
1027 #endif
1028
1029 #if HILITE_SEARCH
1030 /*
1031 * Find matching text which is currently on screen and highlight it.
1032 */
1033 static void
hilite_screen()1034 hilite_screen()
1035 {
1036 struct scrpos scrpos;
1037
1038 get_scrpos(&scrpos, TOP);
1039 if (scrpos.pos == NULL_POSITION)
1040 return;
1041 prep_hilite(scrpos.pos, position(BOTTOM_PLUS_ONE), -1);
1042 repaint_hilite(1);
1043 }
1044
1045 /*
1046 * Change highlighting parameters.
1047 */
1048 public void
chg_hilite()1049 chg_hilite()
1050 {
1051 /*
1052 * Erase any highlights currently on screen.
1053 */
1054 clr_hilite();
1055 hide_hilite = 0;
1056
1057 if (hilite_search == OPT_ONPLUS)
1058 /*
1059 * Display highlights.
1060 */
1061 hilite_screen();
1062 }
1063 #endif
1064
1065 /*
1066 * Figure out where to start a search.
1067 */
1068 static POSITION
search_pos(search_type)1069 search_pos(search_type)
1070 int search_type;
1071 {
1072 POSITION pos;
1073 int sindex;
1074
1075 if (empty_screen())
1076 {
1077 /*
1078 * Start at the beginning (or end) of the file.
1079 * The empty_screen() case is mainly for
1080 * command line initiated searches;
1081 * for example, "+/xyz" on the command line.
1082 * Also for multi-file (SRCH_PAST_EOF) searches.
1083 */
1084 if (search_type & SRCH_FORW)
1085 {
1086 pos = ch_zero();
1087 } else
1088 {
1089 pos = ch_length();
1090 if (pos == NULL_POSITION)
1091 {
1092 (void) ch_end_seek();
1093 pos = ch_length();
1094 }
1095 }
1096 sindex = 0;
1097 } else
1098 {
1099 int add_one = 0;
1100
1101 if (how_search == OPT_ON)
1102 {
1103 /*
1104 * Search does not include current screen.
1105 */
1106 if (search_type & SRCH_FORW)
1107 sindex = sc_height-1; /* BOTTOM_PLUS_ONE */
1108 else
1109 sindex = 0; /* TOP */
1110 } else if (how_search == OPT_ONPLUS && !(search_type & SRCH_AFTER_TARGET))
1111 {
1112 /*
1113 * Search includes all of displayed screen.
1114 */
1115 if (search_type & SRCH_FORW)
1116 sindex = 0; /* TOP */
1117 else
1118 sindex = sc_height-1; /* BOTTOM_PLUS_ONE */
1119 } else
1120 {
1121 /*
1122 * Search includes the part of current screen beyond the jump target.
1123 * It starts at the jump target (if searching backwards),
1124 * or at the jump target plus one (if forwards).
1125 */
1126 sindex = sindex_from_sline(jump_sline);
1127 if (search_type & SRCH_FORW)
1128 add_one = 1;
1129 }
1130 pos = position(sindex);
1131 if (add_one)
1132 pos = forw_raw_line(pos, (char **)NULL, (int *)NULL);
1133 }
1134
1135 /*
1136 * If the line is empty, look around for a plausible starting place.
1137 */
1138 if (search_type & SRCH_FORW)
1139 {
1140 while (pos == NULL_POSITION)
1141 {
1142 if (++sindex >= sc_height)
1143 break;
1144 pos = position(sindex);
1145 }
1146 } else
1147 {
1148 while (pos == NULL_POSITION)
1149 {
1150 if (--sindex < 0)
1151 break;
1152 pos = position(sindex);
1153 }
1154 }
1155 return (pos);
1156 }
1157
1158 /*
1159 * Search a subset of the file, specified by start/end position.
1160 */
1161 static int
search_range(pos,endpos,search_type,matches,maxlines,plinepos,pendpos)1162 search_range(pos, endpos, search_type, matches, maxlines, plinepos, pendpos)
1163 POSITION pos;
1164 POSITION endpos;
1165 int search_type;
1166 int matches;
1167 int maxlines;
1168 POSITION *plinepos;
1169 POSITION *pendpos;
1170 {
1171 char *line;
1172 char *cline;
1173 int line_len;
1174 LINENUM linenum;
1175 char *sp, *ep;
1176 int line_match;
1177 int cvt_ops;
1178 int cvt_len;
1179 int *chpos;
1180 POSITION linepos, oldpos;
1181
1182 linenum = find_linenum(pos);
1183 oldpos = pos;
1184 for (;;)
1185 {
1186 /*
1187 * Get lines until we find a matching one or until
1188 * we hit end-of-file (or beginning-of-file if we're
1189 * going backwards), or until we hit the end position.
1190 */
1191 if (ABORT_SIGS())
1192 {
1193 /*
1194 * A signal aborts the search.
1195 */
1196 return (-1);
1197 }
1198
1199 if ((endpos != NULL_POSITION && pos >= endpos) || maxlines == 0)
1200 {
1201 /*
1202 * Reached end position without a match.
1203 */
1204 if (pendpos != NULL)
1205 *pendpos = pos;
1206 return (matches);
1207 }
1208 if (maxlines > 0)
1209 maxlines--;
1210
1211 if (search_type & SRCH_FORW)
1212 {
1213 /*
1214 * Read the next line, and save the
1215 * starting position of that line in linepos.
1216 */
1217 linepos = pos;
1218 pos = forw_raw_line(pos, &line, &line_len);
1219 if (linenum != 0)
1220 linenum++;
1221 } else
1222 {
1223 /*
1224 * Read the previous line and save the
1225 * starting position of that line in linepos.
1226 */
1227 pos = back_raw_line(pos, &line, &line_len);
1228 linepos = pos;
1229 if (linenum != 0)
1230 linenum--;
1231 }
1232
1233 if (pos == NULL_POSITION)
1234 {
1235 /*
1236 * Reached EOF/BOF without a match.
1237 */
1238 if (pendpos != NULL)
1239 *pendpos = oldpos;
1240 return (matches);
1241 }
1242
1243 /*
1244 * If we're using line numbers, we might as well
1245 * remember the information we have now (the position
1246 * and line number of the current line).
1247 * Don't do it for every line because it slows down
1248 * the search. Remember the line number only if
1249 * we're "far" from the last place we remembered it.
1250 */
1251 if (linenums && abs((int)(pos - oldpos)) > 2048)
1252 add_lnum(linenum, pos);
1253 oldpos = pos;
1254
1255 if (is_filtered(linepos))
1256 continue;
1257
1258 /*
1259 * If it's a caseless search, convert the line to lowercase.
1260 * If we're doing backspace processing, delete backspaces.
1261 */
1262 cvt_ops = get_cvt_ops();
1263 cvt_len = cvt_length(line_len, cvt_ops);
1264 cline = (char *) ecalloc(1, cvt_len);
1265 chpos = cvt_alloc_chpos(cvt_len);
1266 cvt_text(cline, line, chpos, &line_len, cvt_ops);
1267
1268 #if HILITE_SEARCH
1269 /*
1270 * Check to see if the line matches the filter pattern.
1271 * If so, add an entry to the filter list.
1272 */
1273 if (((search_type & SRCH_FIND_ALL) ||
1274 prep_startpos == NULL_POSITION ||
1275 linepos < prep_startpos || linepos >= prep_endpos) &&
1276 prev_pattern(&filter_info)) {
1277 int line_filter = match_pattern(info_compiled(&filter_info), filter_info.text,
1278 cline, line_len, &sp, &ep, 0, filter_info.search_type);
1279 if (line_filter)
1280 {
1281 struct hilite hl;
1282 hl.hl_startpos = linepos;
1283 hl.hl_endpos = pos;
1284 add_hilite(&filter_anchor, &hl);
1285 free(cline);
1286 free(chpos);
1287 continue;
1288 }
1289 }
1290 #endif
1291
1292 /*
1293 * Test the next line to see if we have a match.
1294 * We are successful if we either want a match and got one,
1295 * or if we want a non-match and got one.
1296 */
1297 if (prev_pattern(&search_info))
1298 {
1299 line_match = match_pattern(info_compiled(&search_info), search_info.text,
1300 cline, line_len, &sp, &ep, 0, search_type);
1301 if (line_match)
1302 {
1303 /*
1304 * Got a match.
1305 */
1306 if (search_type & SRCH_FIND_ALL)
1307 {
1308 #if HILITE_SEARCH
1309 /*
1310 * We are supposed to find all matches in the range.
1311 * Just add the matches in this line to the
1312 * hilite list and keep searching.
1313 */
1314 hilite_line(linepos, cline, line_len, chpos, sp, ep, cvt_ops);
1315 #endif
1316 } else if (--matches <= 0)
1317 {
1318 /*
1319 * Found the one match we're looking for.
1320 * Return it.
1321 */
1322 #if HILITE_SEARCH
1323 if (hilite_search == OPT_ON)
1324 {
1325 /*
1326 * Clear the hilite list and add only
1327 * the matches in this one line.
1328 */
1329 clr_hilite();
1330 hilite_line(linepos, cline, line_len, chpos, sp, ep, cvt_ops);
1331 }
1332 #endif
1333 free(cline);
1334 free(chpos);
1335 if (plinepos != NULL)
1336 *plinepos = linepos;
1337 return (0);
1338 }
1339 }
1340 }
1341 free(cline);
1342 free(chpos);
1343 }
1344 }
1345
1346 /*
1347 * search for a pattern in history. If found, compile that pattern.
1348 */
1349 static int
hist_pattern(search_type)1350 hist_pattern(search_type)
1351 int search_type;
1352 {
1353 #if CMD_HISTORY
1354 char *pattern;
1355
1356 set_mlist(ml_search, 0);
1357 pattern = cmd_lastpattern();
1358 if (pattern == NULL)
1359 return (0);
1360
1361 if (set_pattern(&search_info, pattern, search_type) < 0)
1362 return (0);
1363
1364 #if HILITE_SEARCH
1365 if (hilite_search == OPT_ONPLUS && !hide_hilite)
1366 hilite_screen();
1367 #endif
1368
1369 return (1);
1370 #else /* CMD_HISTORY */
1371 return (0);
1372 #endif /* CMD_HISTORY */
1373 }
1374
1375 /*
1376 * Change the caseless-ness of searches.
1377 * Updates the internal search state to reflect a change in the -i flag.
1378 */
1379 public void
chg_caseless()1380 chg_caseless()
1381 {
1382 if (!is_ucase_pattern)
1383 /*
1384 * Pattern did not have uppercase.
1385 * Just set the search caselessness to the global caselessness.
1386 */
1387 is_caseless = caseless;
1388 else
1389 {
1390 /*
1391 * Pattern did have uppercase.
1392 * Regenerate the pattern using the new state.
1393 */
1394 clear_pattern(&search_info);
1395 hist_pattern(search_info.search_type);
1396 }
1397 }
1398
1399 /*
1400 * Search for the n-th occurrence of a specified pattern,
1401 * either forward or backward.
1402 * Return the number of matches not yet found in this file
1403 * (that is, n minus the number of matches found).
1404 * Return -1 if the search should be aborted.
1405 * Caller may continue the search in another file
1406 * if less than n matches are found in this file.
1407 */
1408 public int
search(search_type,pattern,n)1409 search(search_type, pattern, n)
1410 int search_type;
1411 char *pattern;
1412 int n;
1413 {
1414 POSITION pos;
1415
1416 if (pattern == NULL || *pattern == '\0')
1417 {
1418 /*
1419 * A null pattern means use the previously compiled pattern.
1420 */
1421 search_type |= SRCH_AFTER_TARGET;
1422 if (!prev_pattern(&search_info) && !hist_pattern(search_type))
1423 {
1424 error("No previous regular expression", NULL_PARG);
1425 return (-1);
1426 }
1427 if ((search_type & SRCH_NO_REGEX) !=
1428 (search_info.search_type & SRCH_NO_REGEX))
1429 {
1430 error("Please re-enter search pattern", NULL_PARG);
1431 return -1;
1432 }
1433 #if HILITE_SEARCH
1434 if (hilite_search == OPT_ON || status_col)
1435 {
1436 /*
1437 * Erase the highlights currently on screen.
1438 * If the search fails, we'll redisplay them later.
1439 */
1440 repaint_hilite(0);
1441 }
1442 if (hilite_search == OPT_ONPLUS && hide_hilite)
1443 {
1444 /*
1445 * Highlight any matches currently on screen,
1446 * before we actually start the search.
1447 */
1448 hide_hilite = 0;
1449 hilite_screen();
1450 }
1451 hide_hilite = 0;
1452 #endif
1453 } else
1454 {
1455 /*
1456 * Compile the pattern.
1457 */
1458 if (set_pattern(&search_info, pattern, search_type) < 0)
1459 return (-1);
1460 #if HILITE_SEARCH
1461 if (hilite_search || status_col)
1462 {
1463 /*
1464 * Erase the highlights currently on screen.
1465 * Also permanently delete them from the hilite list.
1466 */
1467 repaint_hilite(0);
1468 hide_hilite = 0;
1469 clr_hilite();
1470 }
1471 if (hilite_search == OPT_ONPLUS || status_col)
1472 {
1473 /*
1474 * Highlight any matches currently on screen,
1475 * before we actually start the search.
1476 */
1477 hilite_screen();
1478 }
1479 #endif
1480 }
1481
1482 /*
1483 * Figure out where to start the search.
1484 */
1485 pos = search_pos(search_type);
1486 if (pos == NULL_POSITION)
1487 {
1488 /*
1489 * Can't find anyplace to start searching from.
1490 */
1491 if (search_type & SRCH_PAST_EOF)
1492 return (n);
1493 if (hilite_search == OPT_ON || status_col)
1494 repaint_hilite(1);
1495 error("Nothing to search", NULL_PARG);
1496 return (-1);
1497 }
1498
1499 n = search_range(pos, NULL_POSITION, search_type, n, -1,
1500 &pos, (POSITION*)NULL);
1501 if (n != 0)
1502 {
1503 /*
1504 * Search was unsuccessful.
1505 */
1506 #if HILITE_SEARCH
1507 if ((hilite_search == OPT_ON || status_col) && n > 0)
1508 /*
1509 * Redisplay old hilites.
1510 */
1511 repaint_hilite(1);
1512 #endif
1513 return (n);
1514 }
1515
1516 if (!(search_type & SRCH_NO_MOVE))
1517 {
1518 /*
1519 * Go to the matching line.
1520 */
1521 jump_loc(pos, jump_sline);
1522 }
1523
1524 #if HILITE_SEARCH
1525 if (hilite_search == OPT_ON || status_col)
1526 /*
1527 * Display new hilites in the matching line.
1528 */
1529 repaint_hilite(1);
1530 #endif
1531 return (0);
1532 }
1533
1534
1535 #if HILITE_SEARCH
1536 /*
1537 * Prepare hilites in a given range of the file.
1538 *
1539 * The pair (prep_startpos,prep_endpos) delimits a contiguous region
1540 * of the file that has been "prepared"; that is, scanned for matches for
1541 * the current search pattern, and hilites have been created for such matches.
1542 * If prep_startpos == NULL_POSITION, the prep region is empty.
1543 * If prep_endpos == NULL_POSITION, the prep region extends to EOF.
1544 * prep_hilite asks that the range (spos,epos) be covered by the prep region.
1545 */
1546 public void
prep_hilite(spos,epos,maxlines)1547 prep_hilite(spos, epos, maxlines)
1548 POSITION spos;
1549 POSITION epos;
1550 int maxlines;
1551 {
1552 POSITION nprep_startpos = prep_startpos;
1553 POSITION nprep_endpos = prep_endpos;
1554 POSITION new_epos;
1555 POSITION max_epos;
1556 int result;
1557 int i;
1558
1559 /*
1560 * Search beyond where we're asked to search, so the prep region covers
1561 * more than we need. Do one big search instead of a bunch of small ones.
1562 */
1563 #define SEARCH_MORE (3*size_linebuf)
1564
1565 if (!prev_pattern(&search_info) && !is_filtering())
1566 return;
1567
1568 /*
1569 * Make sure our prep region always starts at the beginning of
1570 * a line. (search_range takes care of the end boundary below.)
1571 */
1572 spos = back_raw_line(spos+1, (char **)NULL, (int *)NULL);
1573
1574 /*
1575 * If we're limited to a max number of lines, figure out the
1576 * file position we should stop at.
1577 */
1578 if (maxlines < 0)
1579 max_epos = NULL_POSITION;
1580 else
1581 {
1582 max_epos = spos;
1583 for (i = 0; i < maxlines; i++)
1584 max_epos = forw_raw_line(max_epos, (char **)NULL, (int *)NULL);
1585 }
1586
1587 /*
1588 * Find two ranges:
1589 * The range that we need to search (spos,epos); and the range that
1590 * the "prep" region will then cover (nprep_startpos,nprep_endpos).
1591 */
1592
1593 if (prep_startpos == NULL_POSITION ||
1594 (epos != NULL_POSITION && epos < prep_startpos) ||
1595 spos > prep_endpos)
1596 {
1597 /*
1598 * New range is not contiguous with old prep region.
1599 * Discard the old prep region and start a new one.
1600 */
1601 clr_hilite();
1602 clr_filter();
1603 if (epos != NULL_POSITION)
1604 epos += SEARCH_MORE;
1605 nprep_startpos = spos;
1606 } else
1607 {
1608 /*
1609 * New range partially or completely overlaps old prep region.
1610 */
1611 if (epos == NULL_POSITION)
1612 {
1613 /*
1614 * New range goes to end of file.
1615 */
1616 ;
1617 } else if (epos > prep_endpos)
1618 {
1619 /*
1620 * New range ends after old prep region.
1621 * Extend prep region to end at end of new range.
1622 */
1623 epos += SEARCH_MORE;
1624 } else /* (epos <= prep_endpos) */
1625 {
1626 /*
1627 * New range ends within old prep region.
1628 * Truncate search to end at start of old prep region.
1629 */
1630 epos = prep_startpos;
1631 }
1632
1633 if (spos < prep_startpos)
1634 {
1635 /*
1636 * New range starts before old prep region.
1637 * Extend old prep region backwards to start at
1638 * start of new range.
1639 */
1640 if (spos < SEARCH_MORE)
1641 spos = 0;
1642 else
1643 spos -= SEARCH_MORE;
1644 nprep_startpos = spos;
1645 } else /* (spos >= prep_startpos) */
1646 {
1647 /*
1648 * New range starts within or after old prep region.
1649 * Trim search to start at end of old prep region.
1650 */
1651 spos = prep_endpos;
1652 }
1653 }
1654
1655 if (epos != NULL_POSITION && max_epos != NULL_POSITION &&
1656 epos > max_epos)
1657 /*
1658 * Don't go past the max position we're allowed.
1659 */
1660 epos = max_epos;
1661
1662 if (epos == NULL_POSITION || epos > spos)
1663 {
1664 int search_type = SRCH_FORW | SRCH_FIND_ALL;
1665 search_type |= (search_info.search_type & SRCH_NO_REGEX);
1666 for (;;)
1667 {
1668 result = search_range(spos, epos, search_type, 0, maxlines, (POSITION*)NULL, &new_epos);
1669 if (result < 0)
1670 return;
1671 if (prep_endpos == NULL_POSITION || new_epos > prep_endpos)
1672 nprep_endpos = new_epos;
1673
1674 /*
1675 * Check both ends of the resulting prep region to
1676 * make sure they're not filtered. If they are,
1677 * keep going at least one more line until we find
1678 * something that isn't filtered, or hit the end.
1679 */
1680 if (prep_endpos == NULL_POSITION || nprep_endpos > prep_endpos)
1681 {
1682 if (new_epos >= nprep_endpos && is_filtered(new_epos-1))
1683 {
1684 spos = nprep_endpos;
1685 epos = forw_raw_line(nprep_endpos, (char **)NULL, (int *)NULL);
1686 if (epos == NULL_POSITION)
1687 break;
1688 maxlines = 1;
1689 continue;
1690 }
1691 }
1692
1693 if (prep_startpos == NULL_POSITION || nprep_startpos < prep_startpos)
1694 {
1695 if (nprep_startpos > 0 && is_filtered(nprep_startpos))
1696 {
1697 epos = nprep_startpos;
1698 spos = back_raw_line(nprep_startpos, (char **)NULL, (int *)NULL);
1699 if (spos == NULL_POSITION)
1700 break;
1701 nprep_startpos = spos;
1702 maxlines = 1;
1703 continue;
1704 }
1705 }
1706 break;
1707 }
1708 }
1709 prep_startpos = nprep_startpos;
1710 prep_endpos = nprep_endpos;
1711 }
1712
1713 /*
1714 * Set the pattern to be used for line filtering.
1715 */
1716 public void
set_filter_pattern(pattern,search_type)1717 set_filter_pattern(pattern, search_type)
1718 char *pattern;
1719 int search_type;
1720 {
1721 clr_filter();
1722 if (pattern == NULL || *pattern == '\0')
1723 clear_pattern(&filter_info);
1724 else
1725 set_pattern(&filter_info, pattern, search_type);
1726 screen_trashed = 1;
1727 }
1728
1729 /*
1730 * Is there a line filter in effect?
1731 */
1732 public int
is_filtering()1733 is_filtering()
1734 {
1735 if (ch_getflags() & CH_HELPFILE)
1736 return (0);
1737 return prev_pattern(&filter_info);
1738 }
1739 #endif
1740
1741 #if HAVE_V8_REGCOMP
1742 /*
1743 * This function is called by the V8 regcomp to report
1744 * errors in regular expressions.
1745 */
1746 public int reg_show_error = 1;
1747
1748 void
regerror(s)1749 regerror(s)
1750 char *s;
1751 {
1752 PARG parg;
1753
1754 if (!reg_show_error)
1755 return;
1756 parg.p_string = s;
1757 error("%s", &parg);
1758 }
1759 #endif
1760
1761