mc/lib/search/glob.c
Slava Zanko 3facc59837 use g_string_sized_new() instread of g_string_new() to avoid often reallocation action
Signed-off-by: Slava Zanko <slavazanko@gmail.com>
2010-07-07 14:12:45 +03:00

206 lines
6.0 KiB
C

/*
Search text engine.
Glob-style pattern matching
Copyright (C) 2009 The Free Software Foundation, Inc.
Written by:
Slava Zanko <slavazanko@gmail.com>, 2009.
This file is part of the Midnight Commander.
The Midnight Commander is free software; you can redistribute it
and/or modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version.
The Midnight Commander is distributed in the hope that it will be
useful, but WITHOUT ANY WARRANTY; without even the implied warranty
of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
MA 02110-1301, USA.
*/
#include <config.h>
#include "lib/global.h"
#include "lib/strutil.h"
#include "lib/search.h"
#include "lib/strescape.h"
#include "src/charsets.h"
#include "internal.h"
/*** global variables ****************************************************************************/
/*** file scope macro definitions ****************************************************************/
/*** file scope type declarations ****************************************************************/
/*** file scope variables ************************************************************************/
/*** file scope functions ************************************************************************/
static GString *
mc_search__glob_translate_to_regex (gchar * str, gsize * len)
{
GString *buff = g_string_new ("");
gsize orig_len = *len;
gsize loop = 0;
gboolean inside_group = FALSE;
while (loop < orig_len)
{
switch (str[loop])
{
case '*':
if (!strutils_is_char_escaped (str, &(str[loop])))
{
g_string_append (buff, (inside_group) ? ".*" : "(.*)");
loop++;
continue;
}
break;
case '?':
if (!strutils_is_char_escaped (str, &(str[loop])))
{
g_string_append (buff, (inside_group) ? "." : "(.)");
loop++;
continue;
}
break;
case ',':
if (!strutils_is_char_escaped (str, &(str[loop])))
{
g_string_append (buff, "|");
loop++;
continue;
}
break;
case '{':
if (!strutils_is_char_escaped (str, &(str[loop])))
{
g_string_append (buff, "(");
inside_group = TRUE;
loop++;
continue;
}
break;
case '}':
if (!strutils_is_char_escaped (str, &(str[loop])))
{
g_string_append (buff, ")");
inside_group = FALSE;
loop++;
continue;
}
break;
case '+':
case '.':
case '$':
case '(':
case ')':
case '^':
g_string_append_c (buff, '\\');
g_string_append_c (buff, str[loop]);
loop++;
continue;
}
g_string_append_c (buff, str[loop]);
loop++;
}
*len = buff->len;
return buff;
}
/* --------------------------------------------------------------------------------------------- */
static GString *
mc_search__translate_replace_glob_to_regex (gchar * str)
{
GString *buff = g_string_sized_new (32);
int cnt = '0';
gboolean escaped_mode = FALSE;
while (*str)
{
char c = *str++;
switch (c)
{
case '\\':
if (!escaped_mode)
{
escaped_mode = TRUE;
continue;
}
break;
case '*':
case '?':
if (!escaped_mode)
{
g_string_append_c (buff, '\\');
c = ++cnt;
continue;
}
break;
/* breaks copying: mc uses "\0" internally, it must not be changed */
/*case '\\': */
case '&':
g_string_append_c (buff, '\\');
break;
}
g_string_append_c (buff, c);
escaped_mode = FALSE;
}
return buff;
}
/*** public functions ****************************************************************************/
void
mc_search__cond_struct_new_init_glob (const char *charset, mc_search_t * lc_mc_search,
mc_search_cond_t * mc_search_cond)
{
GString *tmp =
mc_search__glob_translate_to_regex (mc_search_cond->str->str, &mc_search_cond->len);
g_string_free (mc_search_cond->str, TRUE);
if (lc_mc_search->is_entire_line)
{
g_string_prepend_c (tmp, '^');
g_string_append_c (tmp, '$');
}
mc_search_cond->str = tmp;
mc_search__cond_struct_new_init_regex (charset, lc_mc_search, mc_search_cond);
}
/* --------------------------------------------------------------------------------------------- */
gboolean
mc_search__run_glob (mc_search_t * lc_mc_search, const void *user_data,
gsize start_search, gsize end_search, gsize * found_len)
{
return mc_search__run_regex (lc_mc_search, user_data, start_search, end_search, found_len);
}
/* --------------------------------------------------------------------------------------------- */
GString *
mc_search_glob_prepare_replace_str (mc_search_t * lc_mc_search, GString * replace_str)
{
GString *repl = mc_search__translate_replace_glob_to_regex (replace_str->str);
GString *res = mc_search_regex_prepare_replace_str (lc_mc_search, repl);
g_string_free (repl, TRUE);
return res;
}
/* --------------------------------------------------------------------------------------------- */