2005-05-23 04:58:42 +04:00
|
|
|
/*
|
|
|
|
Open Tracker License
|
|
|
|
|
|
|
|
Terms and Conditions
|
|
|
|
|
|
|
|
Copyright (c) 1991-2000, Be Incorporated. All rights reserved.
|
|
|
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy of
|
|
|
|
this software and associated documentation files (the "Software"), to deal in
|
|
|
|
the Software without restriction, including without limitation the rights to
|
|
|
|
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
|
|
|
|
of the Software, and to permit persons to whom the Software is furnished to do
|
|
|
|
so, subject to the following conditions:
|
|
|
|
|
|
|
|
The above copyright notice and this permission notice applies to all licensees
|
|
|
|
and shall be included in all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF TITLE, MERCHANTABILITY,
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
BE INCORPORATED BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
|
|
|
|
AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF, OR IN CONNECTION
|
|
|
|
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
|
|
|
|
|
|
Except as contained in this notice, the name of Be Incorporated shall not be
|
|
|
|
used in advertising or otherwise to promote the sale, use or other dealings in
|
|
|
|
this Software without prior written authorization from Be Incorporated.
|
|
|
|
|
|
|
|
Tracker(TM), Be(R), BeOS(R), and BeIA(TM) are trademarks or registered trademarks
|
|
|
|
of Be Incorporated in the United States and other countries. Other brand product
|
|
|
|
names are registered trademarks or trademarks of their respective holders.
|
|
|
|
All rights reserved.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "TrackerString.h"
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
2014-08-08 01:12:54 +04:00
|
|
|
#include <strings.h>
|
2005-05-23 04:58:42 +04:00
|
|
|
|
2014-06-21 03:23:06 +04:00
|
|
|
|
|
|
|
// #pragma mark - TrackerString
|
|
|
|
|
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
// Default constructor: creates a TrackerString on top of a
// default-constructed BString.
TrackerString::TrackerString()
	:
	BString()
{
}
|
|
|
|
|
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
// Creates a TrackerString from the C string 'string'; the pointer is
// handed unchanged to the BString(const char*) constructor.
TrackerString::TrackerString(const char* string)
	: BString(string)
{
}
|
|
|
|
|
|
|
|
|
|
|
|
// Copy constructor: initializes the BString base from 'string'.
TrackerString::TrackerString(const TrackerString& string)
	: BString(string)
{
}
|
|
|
|
|
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
// Creates a TrackerString from 'string' and 'maxLength'; both arguments
// are forwarded unchanged to the BString(const char*, int32) constructor.
TrackerString::TrackerString(const char* string, int32 maxLength)
	: BString(string, maxLength)
{
}
|
|
|
|
|
|
|
|
|
|
|
|
// Destructor: TrackerString releases nothing itself, so the body is empty.
TrackerString::~TrackerString()
{
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::Matches(const char* string, bool caseSensitivity,
|
2005-05-23 04:58:42 +04:00
|
|
|
TrackerStringExpressionType expressionType) const
|
|
|
|
{
|
|
|
|
switch (expressionType) {
|
|
|
|
default:
|
|
|
|
case kNone:
|
|
|
|
return false;
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
case kStartsWith:
|
|
|
|
return StartsWith(string, caseSensitivity);
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
case kEndsWith:
|
|
|
|
return EndsWith(string, caseSensitivity);
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
case kContains:
|
|
|
|
return Contains(string, caseSensitivity);
|
|
|
|
|
|
|
|
case kGlobMatch:
|
|
|
|
return MatchesGlob(string, caseSensitivity);
|
|
|
|
|
|
|
|
case kRegexpMatch:
|
|
|
|
return MatchesRegExp(string, caseSensitivity);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::MatchesRegExp(const char* pattern, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
BString patternString(pattern);
|
|
|
|
BString textString(String());
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (caseSensitivity == false) {
|
|
|
|
patternString.ToLower();
|
|
|
|
textString.ToLower();
|
|
|
|
}
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
RegExp expression(patternString);
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (expression.InitCheck() != B_OK)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return expression.Matches(textString);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::MatchesGlob(const char* string, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
return StringMatchesPattern(String(), string, caseSensitivity);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::EndsWith(const char* string, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
// If "string" is longer than "this",
|
|
|
|
// we should simply return false
|
|
|
|
int32 position = Length() - (int32)strlen(string);
|
|
|
|
if (position < 0)
|
|
|
|
return false;
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (caseSensitivity)
|
|
|
|
return FindLast(string) == position;
|
|
|
|
else
|
|
|
|
return IFindLast(string) == position;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::StartsWith(const char* string, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
if (caseSensitivity)
|
|
|
|
return FindFirst(string) == 0;
|
2012-07-28 03:07:09 +04:00
|
|
|
else
|
2005-05-23 04:58:42 +04:00
|
|
|
return IFindFirst(string) == 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::Contains(const char* string, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
if (caseSensitivity)
|
|
|
|
return FindFirst(string) > -1;
|
|
|
|
else
|
|
|
|
return IFindFirst(string) > -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// MatchesBracketExpression() assumes 'pattern' to point to the
|
|
|
|
// character following the initial '[' in a bracket expression.
|
|
|
|
// The reason is that an encountered '[' will be taken literally.
|
|
|
|
// (Makes it possible to match a '[' with the expression '[[]').
|
|
|
|
bool
|
2012-07-28 22:00:24 +04:00
|
|
|
TrackerString::MatchesBracketExpression(const char* string,
|
|
|
|
const char* pattern, bool caseSensitivity) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
|
|
|
bool GlyphMatch = IsStartOfGlyph(string[0]);
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
char testChar = ConditionalToLower(string[0], caseSensitivity);
|
|
|
|
bool match = false;
|
|
|
|
|
|
|
|
bool inverse = *pattern == '^' || *pattern == '!';
|
|
|
|
// We allow both ^ and ! as a initial inverting character.
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (inverse)
|
2012-07-28 03:07:09 +04:00
|
|
|
pattern++;
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
while (!match && *pattern != ']' && *pattern != '\0') {
|
|
|
|
switch (*pattern) {
|
|
|
|
case '-':
|
2012-07-28 22:00:24 +04:00
|
|
|
{
|
|
|
|
char start = ConditionalToLower(*(pattern - 1),
|
|
|
|
caseSensitivity);
|
|
|
|
char stop = ConditionalToLower(*(pattern + 1),
|
|
|
|
caseSensitivity);
|
|
|
|
|
|
|
|
if (IsGlyph(start) || IsGlyph(stop))
|
|
|
|
return false;
|
|
|
|
// Not a valid range!
|
|
|
|
|
|
|
|
if ((islower(start) && islower(stop))
|
|
|
|
|| (isupper(start) && isupper(stop))
|
|
|
|
|| (isdigit(start) && isdigit(stop))) {
|
|
|
|
// Make sure 'start' and 'stop' are of the same type.
|
|
|
|
match = start <= testChar && testChar <= stop;
|
|
|
|
} else {
|
|
|
|
// If no valid range, we've got a syntax error.
|
|
|
|
return false;
|
2005-05-23 04:58:42 +04:00
|
|
|
}
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
break;
|
2012-07-28 22:00:24 +04:00
|
|
|
}
|
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
default:
|
|
|
|
if (GlyphMatch)
|
|
|
|
match = UTF8CharsAreEqual(string, pattern);
|
|
|
|
else
|
|
|
|
match = CharsAreEqual(testChar, *pattern, caseSensitivity);
|
|
|
|
break;
|
|
|
|
}
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (!match) {
|
|
|
|
pattern++;
|
|
|
|
if (IsInsideGlyph(pattern[0]))
|
|
|
|
pattern = MoveToEndOfGlyph(pattern);
|
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
}
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
// Consider an unmatched bracket a failure
|
|
|
|
// (i.e. when detecting a '\0' instead of a ']'.)
|
|
|
|
if (*pattern == '\0')
|
|
|
|
return false;
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
return (match ^ inverse) != 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 03:07:09 +04:00
|
|
|
TrackerString::StringMatchesPattern(const char* string, const char* pattern,
|
2005-05-23 04:58:42 +04:00
|
|
|
bool caseSensitivity) const
|
|
|
|
{
|
|
|
|
// One could do this dynamically, counting the number of *'s,
|
|
|
|
// but then you have to free them at every exit of this
|
|
|
|
// function, which is awkward and ugly.
|
|
|
|
const int32 kWildCardMaximum = 100;
|
2012-07-28 03:07:09 +04:00
|
|
|
const char* pStorage[kWildCardMaximum];
|
|
|
|
const char* sStorage[kWildCardMaximum];
|
2005-05-23 04:58:42 +04:00
|
|
|
|
|
|
|
int32 patternLevel = 0;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (string == NULL || pattern == NULL)
|
|
|
|
return false;
|
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
while (*pattern != '\0') {
|
2005-05-23 04:58:42 +04:00
|
|
|
switch (*pattern) {
|
|
|
|
case '?':
|
|
|
|
pattern++;
|
|
|
|
string++;
|
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
string = MoveToEndOfGlyph(string);
|
|
|
|
break;
|
2012-07-28 22:00:24 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
case '*':
|
2012-07-28 03:07:09 +04:00
|
|
|
{
|
|
|
|
// Collapse any ** and *? constructions:
|
|
|
|
while (*pattern == '*' || *pattern == '?') {
|
|
|
|
pattern++;
|
2016-07-02 12:04:01 +03:00
|
|
|
if (*pattern == '?' && *string != '\0') {
|
2012-07-28 03:07:09 +04:00
|
|
|
string++;
|
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
string = MoveToEndOfGlyph(string);
|
2005-05-23 04:58:42 +04:00
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
}
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
if (*pattern == '\0') {
|
|
|
|
// An ending * matches all strings.
|
|
|
|
return true;
|
|
|
|
}
|
2005-05-23 04:58:42 +04:00
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
bool match = false;
|
|
|
|
const char* pBefore = pattern - 1;
|
2005-05-23 04:58:42 +04:00
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
if (*pattern == '[') {
|
|
|
|
pattern++;
|
|
|
|
|
|
|
|
while (!match && *string != '\0') {
|
|
|
|
match = MatchesBracketExpression(string++, pattern,
|
|
|
|
caseSensitivity);
|
|
|
|
}
|
|
|
|
|
|
|
|
while (*pattern != ']' && *pattern != '\0') {
|
2005-05-23 04:58:42 +04:00
|
|
|
// Skip the rest of the bracket:
|
2012-07-28 03:07:09 +04:00
|
|
|
pattern++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (*pattern == '\0') {
|
2005-05-23 04:58:42 +04:00
|
|
|
// Failure if no closing bracket;
|
2012-07-28 03:07:09 +04:00
|
|
|
return false;
|
2005-05-23 04:58:42 +04:00
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
} else {
|
|
|
|
// No bracket, just one character:
|
|
|
|
while (!match && *string != '\0') {
|
|
|
|
if (IsGlyph(string[0]))
|
|
|
|
match = UTF8CharsAreEqual(string++, pattern);
|
|
|
|
else {
|
|
|
|
match = CharsAreEqual(*string++, *pattern,
|
|
|
|
caseSensitivity);
|
2005-05-23 04:58:42 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
|
|
|
|
if (!match)
|
|
|
|
return false;
|
|
|
|
else {
|
|
|
|
pStorage[patternLevel] = pBefore;
|
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
string = MoveToEndOfGlyph(string);
|
|
|
|
|
|
|
|
sStorage[patternLevel++] = string;
|
|
|
|
if (patternLevel > kWildCardMaximum)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
pattern++;
|
|
|
|
if (IsInsideGlyph(pattern[0]))
|
|
|
|
pattern = MoveToEndOfGlyph(pattern);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
case '[':
|
|
|
|
pattern++;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2012-07-28 22:00:24 +04:00
|
|
|
if (!MatchesBracketExpression(string, pattern,
|
|
|
|
caseSensitivity)) {
|
2005-05-23 04:58:42 +04:00
|
|
|
if (patternLevel > 0) {
|
|
|
|
pattern = pStorage[--patternLevel];
|
|
|
|
string = sStorage[patternLevel];
|
|
|
|
} else
|
|
|
|
return false;
|
2012-07-28 03:07:09 +04:00
|
|
|
} else {
|
2005-05-23 04:58:42 +04:00
|
|
|
// Skip the rest of the bracket:
|
|
|
|
while (*pattern != ']' && *pattern != '\0')
|
|
|
|
pattern++;
|
2013-01-02 14:11:56 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
// Failure if no closing bracket;
|
|
|
|
if (*pattern == '\0')
|
|
|
|
return false;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
string++;
|
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
string = MoveToEndOfGlyph(string);
|
|
|
|
pattern++;
|
|
|
|
}
|
|
|
|
break;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
default:
|
2012-07-28 03:07:09 +04:00
|
|
|
{
|
|
|
|
bool equal = false;
|
|
|
|
if (IsGlyph(string[0]))
|
|
|
|
equal = UTF8CharsAreEqual(string, pattern);
|
|
|
|
else
|
|
|
|
equal = CharsAreEqual(*string, *pattern, caseSensitivity);
|
|
|
|
|
|
|
|
if (equal) {
|
|
|
|
pattern++;
|
|
|
|
if (IsInsideGlyph(pattern[0]))
|
|
|
|
pattern = MoveToEndOfGlyph(pattern);
|
|
|
|
string++;
|
|
|
|
if (IsInsideGlyph(string[0]))
|
|
|
|
string = MoveToEndOfGlyph(string);
|
|
|
|
} else if (patternLevel > 0) {
|
|
|
|
pattern = pStorage[--patternLevel];
|
|
|
|
string = sStorage[patternLevel];
|
|
|
|
} else
|
|
|
|
return false;
|
|
|
|
break;
|
|
|
|
}
|
2005-05-23 04:58:42 +04:00
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (*pattern == '\0' && *string != '\0' && patternLevel > 0) {
|
|
|
|
pattern = pStorage[--patternLevel];
|
|
|
|
string = sStorage[patternLevel];
|
|
|
|
}
|
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
return *string == '\0' && *pattern == '\0';
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2012-07-28 22:00:24 +04:00
|
|
|
TrackerString::UTF8CharsAreEqual(const char* string1,
|
|
|
|
const char* string2) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
2012-07-28 03:07:09 +04:00
|
|
|
const char* s1 = string1;
|
|
|
|
const char* s2 = string2;
|
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
if (IsStartOfGlyph(*s1) && *s1 == *s2) {
|
|
|
|
s1++;
|
|
|
|
s2++;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
while (IsInsideGlyph(*s1) && *s1 == *s2) {
|
|
|
|
s1++;
|
|
|
|
s2++;
|
|
|
|
}
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2012-07-28 22:00:24 +04:00
|
|
|
return !IsInsideGlyph(*s1)
|
|
|
|
&& !IsInsideGlyph(*s2) && *(s1 - 1) == *(s2 - 1);
|
2005-05-23 04:58:42 +04:00
|
|
|
} else
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2012-07-28 03:07:09 +04:00
|
|
|
const char*
|
|
|
|
TrackerString::MoveToEndOfGlyph(const char* string) const
|
2005-05-23 04:58:42 +04:00
|
|
|
{
|
2012-07-28 03:07:09 +04:00
|
|
|
const char* ptr = string;
|
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
while (IsInsideGlyph(*ptr))
|
|
|
|
ptr++;
|
2012-07-28 03:07:09 +04:00
|
|
|
|
2005-05-23 04:58:42 +04:00
|
|
|
return ptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
TrackerString::IsGlyph(char ch) const
|
|
|
|
{
|
|
|
|
return (ch & 0x80) == 0x80;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
TrackerString::IsInsideGlyph(char ch) const
|
|
|
|
{
|
|
|
|
return (ch & 0xC0) == 0x80;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
TrackerString::IsStartOfGlyph(char ch) const
|
|
|
|
{
|
|
|
|
return (ch & 0xC0) == 0xC0;
|
|
|
|
}
|