551 lines
13 KiB
C
551 lines
13 KiB
C
/* $NetBSD: search.c,v 1.4 2000/03/17 02:23:17 christos Exp $ */
|
|
|
|
/*-
|
|
* Copyright (c) 1992, 1993, 1994
|
|
* The Regents of the University of California. All rights reserved.
|
|
* Copyright (c) 1992, 1993, 1994, 1995, 1996
|
|
* Keith Bostic. All rights reserved.
|
|
*
|
|
* See the LICENSE file for redistribution information.
|
|
*/
|
|
|
|
#include "config.h"
|
|
|
|
#ifndef lint
|
|
static const char sccsid[] = "@(#)search.c 10.24 (Berkeley) 5/26/96";
|
|
#endif /* not lint */
|
|
|
|
#include <sys/types.h>
|
|
#include <sys/queue.h>
|
|
|
|
#include <bitstring.h>
|
|
#include <ctype.h>
|
|
#include <errno.h>
|
|
#include <limits.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <unistd.h>
|
|
|
|
#include "common.h"
|
|
|
|
typedef enum { S_EMPTY, S_EOF, S_NOPREV, S_NOTFOUND, S_SOF, S_WRAP } smsg_t;
|
|
|
|
static void search_msg __P((SCR *, smsg_t));
|
|
static int search_setup __P((SCR *, dir_t, char *, char **, u_int));
|
|
|
|
/*
|
|
* search_setup --
|
|
* Set up a search.
|
|
*/
|
|
static int
|
|
search_setup(sp, dir, ptrn, epp, flags)
|
|
SCR *sp;
|
|
dir_t dir;
|
|
char *ptrn, **epp;
|
|
u_int flags;
|
|
{
|
|
recno_t lno;
|
|
int delim;
|
|
char *p, *t;
|
|
|
|
/* If the file is empty, it's a fast search. */
|
|
if (sp->lno <= 1) {
|
|
if (db_last(sp, &lno))
|
|
return (1);
|
|
if (lno == 0) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_EMPTY);
|
|
return (1);
|
|
}
|
|
}
|
|
|
|
if (LF_ISSET(SEARCH_PARSE)) { /* Parse the string. */
|
|
/*
|
|
* Use the saved pattern if no pattern supplied, or if only
|
|
* the delimiter character supplied.
|
|
*
|
|
* !!!
|
|
* Only the pattern itself was saved, historically vi didn't
|
|
* reuse addressing or delta information.
|
|
*/
|
|
if (ptrn == NULL)
|
|
goto prev;
|
|
if (ptrn[1] == '\0') {
|
|
if (epp != NULL)
|
|
*epp = ptrn + 1;
|
|
goto prev;
|
|
}
|
|
if (ptrn[0] == ptrn[1]) {
|
|
if (epp != NULL)
|
|
*epp = ptrn + 2;
|
|
|
|
/* Complain if we don't have a previous pattern. */
|
|
prev: if (sp->re == NULL) {
|
|
search_msg(sp, S_NOPREV);
|
|
return (1);
|
|
}
|
|
/* Compile the search pattern if necessary. */
|
|
if (!F_ISSET(sp, SC_RE_SEARCH) &&
|
|
re_compile(sp, sp->re, NULL, NULL, &sp->re_c,
|
|
RE_C_SEARCH |
|
|
(LF_ISSET(SEARCH_MSG) ? 0 : RE_C_SILENT)))
|
|
return (1);
|
|
|
|
/* Set the search direction. */
|
|
if (LF_ISSET(SEARCH_SET))
|
|
sp->searchdir = dir;
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* Set the delimiter, and move forward to the terminating
|
|
* delimiter, handling escaped delimiters.
|
|
*
|
|
* QUOTING NOTE:
|
|
* Only discard an escape character if it escapes a delimiter.
|
|
*/
|
|
for (delim = *ptrn, p = t = ++ptrn;; *t++ = *p++) {
|
|
if (p[0] == '\0' || p[0] == delim) {
|
|
if (p[0] == delim)
|
|
++p;
|
|
*t = '\0';
|
|
break;
|
|
}
|
|
if (p[1] == delim && p[0] == '\\')
|
|
++p;
|
|
}
|
|
if (epp != NULL)
|
|
*epp = p;
|
|
}
|
|
|
|
/* Compile the RE. */
|
|
if (re_compile(sp, ptrn, &sp->re, &sp->re_len, &sp->re_c,
|
|
RE_C_SEARCH |
|
|
(LF_ISSET(SEARCH_MSG) ? 0 : RE_C_SILENT) |
|
|
(LF_ISSET(SEARCH_TAG) ? RE_C_TAG : 0) |
|
|
(LF_ISSET(SEARCH_CSCOPE) ? RE_C_CSCOPE : 0)))
|
|
return (1);
|
|
|
|
/* Set the search direction. */
|
|
if (LF_ISSET(SEARCH_SET))
|
|
sp->searchdir = dir;
|
|
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* f_search --
|
|
* Do a forward search.
|
|
*
|
|
* PUBLIC: int f_search __P((SCR *, MARK *, MARK *, char *, char **, u_int));
|
|
*/
|
|
int
|
|
f_search(sp, fm, rm, ptrn, eptrn, flags)
|
|
SCR *sp;
|
|
MARK *fm, *rm;
|
|
char *ptrn, **eptrn;
|
|
u_int flags;
|
|
{
|
|
busy_t btype;
|
|
recno_t lno;
|
|
regmatch_t match[1];
|
|
size_t coff, len;
|
|
int cnt, eval, rval, wrapped;
|
|
char *l;
|
|
#ifndef REG_STARTEND
|
|
char c;
|
|
#endif
|
|
|
|
if (search_setup(sp, FORWARD, ptrn, eptrn, flags))
|
|
return (1);
|
|
|
|
if (LF_ISSET(SEARCH_FILE)) {
|
|
lno = 1;
|
|
coff = 0;
|
|
} else {
|
|
if (db_get(sp, fm->lno, DBG_FATAL, &l, &len))
|
|
return (1);
|
|
lno = fm->lno;
|
|
|
|
/*
|
|
* If doing incremental search, start searching at the previous
|
|
* column, so that we search a minimal distance and still match
|
|
* special patterns, e.g., \< for beginning of a word.
|
|
*
|
|
* Otherwise, start searching immediately after the cursor. If
|
|
* at the end of the line, start searching on the next line.
|
|
* This is incompatible (read bug fix) with the historic vi --
|
|
* searches for the '$' pattern never moved forward, and the
|
|
* "-t foo" didn't work if the 'f' was the first character in
|
|
* the file.
|
|
*/
|
|
if (LF_ISSET(SEARCH_INCR)) {
|
|
if ((coff = fm->cno) != 0)
|
|
--coff;
|
|
} else if (fm->cno + 1 >= len) {
|
|
coff = 0;
|
|
lno = fm->lno + 1;
|
|
if (db_get(sp, lno, 0, &l, &len)) {
|
|
if (!O_ISSET(sp, O_WRAPSCAN)) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_EOF);
|
|
return (1);
|
|
}
|
|
lno = 1;
|
|
}
|
|
} else
|
|
coff = fm->cno + 1;
|
|
}
|
|
|
|
btype = BUSY_ON;
|
|
for (cnt = INTERRUPT_CHECK, rval = 1, wrapped = 0;; ++lno, coff = 0) {
|
|
if (cnt-- == 0) {
|
|
if (INTERRUPTED(sp))
|
|
break;
|
|
if (LF_ISSET(SEARCH_MSG)) {
|
|
search_busy(sp, btype);
|
|
btype = BUSY_UPDATE;
|
|
}
|
|
cnt = INTERRUPT_CHECK;
|
|
}
|
|
if (wrapped && lno > fm->lno || db_get(sp, lno, 0, &l, &len)) {
|
|
if (wrapped) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_NOTFOUND);
|
|
break;
|
|
}
|
|
if (!O_ISSET(sp, O_WRAPSCAN)) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_EOF);
|
|
break;
|
|
}
|
|
lno = 0;
|
|
wrapped = 1;
|
|
continue;
|
|
}
|
|
|
|
/* If already at EOL, just keep going. */
|
|
if (len != 0 && coff == len)
|
|
continue;
|
|
|
|
#ifdef REG_STARTEND
|
|
/* Set the termination. */
|
|
match[0].rm_so = coff;
|
|
match[0].rm_eo = len;
|
|
#else
|
|
c = l[len];
|
|
l[len] = '\0';
|
|
#endif
|
|
|
|
#if defined(DEBUG) && 0
|
|
TRACE(sp, "F search: %lu from %u to %u\n",
|
|
lno, coff, len != 0 ? len - 1 : len);
|
|
#endif
|
|
/* Search the line. */
|
|
#ifdef REG_STARTEND
|
|
eval = regexec(&sp->re_c, l, 1, match,
|
|
(match[0].rm_so == 0 ? 0 : REG_NOTBOL) | REG_STARTEND);
|
|
#else
|
|
eval = regexec(&sp->re_c, &l[coff], 1, match,
|
|
(match[0].rm_so == 0 ? 0 : REG_NOTBOL));
|
|
l[len] = c;
|
|
#endif
|
|
if (eval == REG_NOMATCH)
|
|
continue;
|
|
if (eval != 0) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
re_error(sp, eval, &sp->re_c);
|
|
else
|
|
(void)sp->gp->scr_bell(sp);
|
|
break;
|
|
}
|
|
|
|
/*
|
|
* XXX
|
|
* Warn if the search wrapped. This message is only displayed
|
|
* if we're in interactive mode and there are no keys in the
|
|
* queue. The problem is that the command is going to succeed,
|
|
* and the message isn't an error, it's merely informational.
|
|
* So, if we're reading the .exrc file, displaying it causes
|
|
* the screen to pause before entering the file, which is bad.
|
|
* Or, if a macro causes it to be repeatedly displayed, e.g.,
|
|
* the pattern only occurs once in the file and wrapscan is set,
|
|
* you lose, particularly if the macro does something like:
|
|
* :map K /pattern/^MjK
|
|
* Each new search will display the message and the /pattern/
|
|
* will immediately overwrite it, with strange results. The
|
|
* System V vi displays the "wrapped" message multiple times,
|
|
* but it's overwritten each time, so it's not as noticeable.
|
|
* Since we don't discard messages, it's a real problem.
|
|
*
|
|
* XXX
|
|
* The test for SC_SCR_EX or SC_SCR_VI feels wrong to me. I
|
|
* didn't originally intend for that bit to reflect that the
|
|
* user has "gone interactive", but that's the only solution
|
|
* I see.
|
|
*/
|
|
if (wrapped && LF_ISSET(SEARCH_MSG) &&
|
|
F_ISSET(sp, SC_SCR_EX | SC_SCR_VI) && !KEYS_WAITING(sp))
|
|
search_msg(sp, S_WRAP);
|
|
|
|
#if defined(DEBUG) && 0
|
|
TRACE(sp, "F search: %qu to %qu\n",
|
|
match[0].rm_so, match[0].rm_eo);
|
|
#endif
|
|
rm->lno = lno;
|
|
rm->cno = match[0].rm_so;
|
|
|
|
/*
|
|
* If a change command, it's possible to move beyond the end
|
|
* of a line. Historic vi generally got this wrong (e.g. try
|
|
* "c?$<cr>"). Not all that sure this gets it right, there
|
|
* are lots of strange cases.
|
|
*/
|
|
if (!LF_ISSET(SEARCH_EOL) && rm->cno >= len)
|
|
rm->cno = len != 0 ? len - 1 : 0;
|
|
|
|
rval = 0;
|
|
break;
|
|
}
|
|
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_busy(sp, BUSY_OFF);
|
|
return (rval);
|
|
}
|
|
|
|
/*
|
|
* b_search --
|
|
* Do a backward search.
|
|
*
|
|
* PUBLIC: int b_search __P((SCR *, MARK *, MARK *, char *, char **, u_int));
|
|
*/
|
|
int
|
|
b_search(sp, fm, rm, ptrn, eptrn, flags)
|
|
SCR *sp;
|
|
MARK *fm, *rm;
|
|
char *ptrn, **eptrn;
|
|
u_int flags;
|
|
{
|
|
busy_t btype;
|
|
recno_t lno;
|
|
regmatch_t match[1];
|
|
size_t coff, last, len;
|
|
int cnt, eval, rval, wrapped;
|
|
char *l;
|
|
#ifndef REG_STARTEND
|
|
char c;
|
|
#endif
|
|
|
|
if (search_setup(sp, BACKWARD, ptrn, eptrn, flags))
|
|
return (1);
|
|
|
|
/*
|
|
* If doing incremental search, set the "starting" position past the
|
|
* current column, so that we search a minimal distance and still
|
|
* match special patterns, e.g., \> for the end of a word. This is
|
|
* safe when the cursor is at the end of a line because we only use
|
|
* it for comparison with the location of the match.
|
|
*
|
|
* Otherwise, start searching immediately before the cursor. If in
|
|
* the first column, start search on the previous line.
|
|
*/
|
|
if (LF_ISSET(SEARCH_INCR)) {
|
|
lno = fm->lno;
|
|
coff = fm->cno + 1;
|
|
} else {
|
|
if (fm->cno == 0) {
|
|
if (fm->lno == 1 && !O_ISSET(sp, O_WRAPSCAN)) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_SOF);
|
|
return (1);
|
|
}
|
|
lno = fm->lno - 1;
|
|
} else
|
|
lno = fm->lno;
|
|
coff = fm->cno;
|
|
}
|
|
|
|
btype = BUSY_ON;
|
|
for (cnt = INTERRUPT_CHECK, rval = 1, wrapped = 0;; --lno, coff = 0) {
|
|
if (cnt-- == 0) {
|
|
if (INTERRUPTED(sp))
|
|
break;
|
|
if (LF_ISSET(SEARCH_MSG)) {
|
|
search_busy(sp, btype);
|
|
btype = BUSY_UPDATE;
|
|
}
|
|
cnt = INTERRUPT_CHECK;
|
|
}
|
|
if (wrapped && lno < fm->lno || lno == 0) {
|
|
if (wrapped) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_NOTFOUND);
|
|
break;
|
|
}
|
|
if (!O_ISSET(sp, O_WRAPSCAN)) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_SOF);
|
|
break;
|
|
}
|
|
if (db_last(sp, &lno))
|
|
break;
|
|
if (lno == 0) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
search_msg(sp, S_EMPTY);
|
|
break;
|
|
}
|
|
++lno;
|
|
wrapped = 1;
|
|
continue;
|
|
}
|
|
|
|
if (db_get(sp, lno, 0, &l, &len))
|
|
break;
|
|
|
|
/* Set the termination. */
|
|
#ifdef REG_STARTEND
|
|
match[0].rm_so = 0;
|
|
match[0].rm_eo = len;
|
|
#else
|
|
c = l[len];
|
|
l[len] = '\0';
|
|
#endif
|
|
|
|
#if defined(DEBUG) && 0
|
|
TRACE(sp, "B search: %lu from 0 to %qu\n", lno, match[0].rm_eo);
|
|
#endif
|
|
/* Search the line. */
|
|
#ifdef REG_STARTEND
|
|
eval = regexec(&sp->re_c, l, 1, match,
|
|
(match[0].rm_eo == len ? 0 : REG_NOTEOL) | REG_STARTEND);
|
|
#else
|
|
eval = regexec(&sp->re_c, l, 1, match,
|
|
(match[0].rm_eo == len ? 0 : REG_NOTEOL));
|
|
l[len] = c;
|
|
#endif
|
|
if (eval == REG_NOMATCH)
|
|
continue;
|
|
if (eval != 0) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
re_error(sp, eval, &sp->re_c);
|
|
else
|
|
(void)sp->gp->scr_bell(sp);
|
|
break;
|
|
}
|
|
|
|
/* Check for a match starting past the cursor. */
|
|
if (coff != 0 && match[0].rm_so >= coff)
|
|
continue;
|
|
|
|
/*
|
|
* XXX
|
|
* See the comment in f_search() for more information.
|
|
*/
|
|
if (wrapped && LF_ISSET(SEARCH_MSG) &&
|
|
F_ISSET(sp, SC_SCR_EX | SC_SCR_VI) && !KEYS_WAITING(sp))
|
|
search_msg(sp, S_WRAP);
|
|
|
|
#if defined(DEBUG) && 0
|
|
TRACE(sp, "B found: %qu to %qu\n",
|
|
match[0].rm_so, match[0].rm_eo);
|
|
#endif
|
|
/*
|
|
* We now have the first match on the line. Step through the
|
|
* line character by character until find the last acceptable
|
|
* match. This is painful, we need a better interface to regex
|
|
* to make this work.
|
|
*/
|
|
for (;;) {
|
|
last = match[0].rm_so++;
|
|
if (match[0].rm_so >= len)
|
|
break;
|
|
#ifdef REG_STARTEND
|
|
match[0].rm_eo = len;
|
|
eval = regexec(&sp->re_c, l, 1, match,
|
|
(match[0].rm_so == 0 ? 0 : REG_NOTBOL) |
|
|
REG_STARTEND);
|
|
#else
|
|
c = l[len];
|
|
l[len] = '\0';
|
|
eval = regexec(&sp->re_c, &l[last + 1], 1, match,
|
|
(match[0].rm_so == 0 ? 0 : REG_NOTBOL));
|
|
l[len] = c;
|
|
#endif
|
|
if (eval == REG_NOMATCH)
|
|
break;
|
|
if (eval != 0) {
|
|
if (LF_ISSET(SEARCH_MSG))
|
|
re_error(sp, eval, &sp->re_c);
|
|
else
|
|
(void)sp->gp->scr_bell(sp);
|
|
goto err;
|
|
}
|
|
if (coff && match[0].rm_so >= coff)
|
|
break;
|
|
}
|
|
rm->lno = lno;
|
|
|
|
/* See comment in f_search(). */
|
|
if (!LF_ISSET(SEARCH_EOL) && last >= len)
|
|
rm->cno = len != 0 ? len - 1 : 0;
|
|
else
|
|
rm->cno = last;
|
|
rval = 0;
|
|
break;
|
|
}
|
|
|
|
err: if (LF_ISSET(SEARCH_MSG))
|
|
search_busy(sp, BUSY_OFF);
|
|
return (rval);
|
|
}
|
|
|
|
/*
|
|
* search_msg --
|
|
* Display one of the search messages.
|
|
*/
|
|
static void
|
|
search_msg(sp, msg)
|
|
SCR *sp;
|
|
smsg_t msg;
|
|
{
|
|
switch (msg) {
|
|
case S_EMPTY:
|
|
msgq(sp, M_ERR, "072|File empty; nothing to search");
|
|
break;
|
|
case S_EOF:
|
|
msgq(sp, M_ERR,
|
|
"073|Reached end-of-file without finding the pattern");
|
|
break;
|
|
case S_NOPREV:
|
|
msgq(sp, M_ERR, "074|No previous search pattern");
|
|
break;
|
|
case S_NOTFOUND:
|
|
msgq(sp, M_ERR, "075|Pattern not found");
|
|
break;
|
|
case S_SOF:
|
|
msgq(sp, M_ERR,
|
|
"076|Reached top-of-file without finding the pattern");
|
|
break;
|
|
case S_WRAP:
|
|
msgq(sp, M_ERR, "077|Search wrapped");
|
|
break;
|
|
default:
|
|
abort();
|
|
}
|
|
}
|
|
|
|
/*
|
|
* search_busy --
|
|
* Put up the busy searching message.
|
|
*
|
|
* PUBLIC: void search_busy __P((SCR *, busy_t));
|
|
*/
|
|
void
|
|
search_busy(sp, btype)
|
|
SCR *sp;
|
|
busy_t btype;
|
|
{
|
|
sp->gp->scr_busy(sp, "078|Searching...", btype);
|
|
}
|