// ContentSearchUtils.cpp
#include "config.h"
#if ENABLE(INSPECTOR)
#include "ContentSearchUtils.h"
#include "InspectorValues.h"
#include "RegularExpression.h"
#include <wtf/BumpPointerAllocator.h>
#include <yarr/Yarr.h>
using namespace std;
namespace WebCore {
namespace ContentSearchUtils {
namespace {
// Characters that createSearchRegexSource() prefixes with a backslash when it
// turns a plain-text query into regular-expression source.
const char regexSpecialCharacters[] = "[](){}+-*.,?\\^$|";
} // namespace
// Builds regular-expression source from |text|: every character that appears
// in regexSpecialCharacters is emitted with a preceding backslash, and every
// other character is copied through unchanged. Nothing is appended when |text|
// has length zero, so the result is then a default-constructed String.
static String createSearchRegexSource(const String& text)
{
    const String specialCharacters(regexSpecialCharacters);
    const UChar* source = text.characters();
    const unsigned sourceLength = text.length();

    String escaped;
    for (unsigned index = 0; index < sourceLength; ++index) {
        const bool needsEscaping = specialCharacters.find(source[index]) != notFound;
        if (needsEscaping)
            escaped.append("\\");
        escaped.append(source[index]);
    }
    return escaped;
}
// Splits |text| into lines at '\n' and returns one (line number, line content)
// pair for every line in which |regex| finds a match. Line numbers start at 0.
// The stored line content has its trailing "\r\n" or "\n" removed; a '\r' that
// is not followed by '\n' is not treated as a line break.
static Vector<pair<int, String> > getRegularExpressionMatchesByLines(const RegularExpression& regex, const String& text)
{
    Vector<pair<int, String> > matchingLines;
    if (text.isEmpty())
        return matchingLines;

    const unsigned textLength = text.length();
    int currentLineNumber = 0;
    for (unsigned lineStart = 0; lineStart < textLength; ++currentLineNumber) {
        // A line extends up to and including its '\n', or to the end of the
        // text when no further '\n' exists.
        size_t nextLineStart = text.find('\n', lineStart);
        nextLineStart = (nextLineStart == notFound) ? textLength : nextLineStart + 1;

        // Strip the line terminator before matching and before storing.
        String lineContent = text.substring(lineStart, nextLineStart - lineStart);
        if (lineContent.endsWith("\r\n"))
            lineContent = lineContent.left(lineContent.length() - 2);
        if (lineContent.endsWith('\n'))
            lineContent = lineContent.left(lineContent.length() - 1);

        // Only whether a match exists matters here; the length is discarded.
        int matchLength;
        if (regex.match(lineContent, 0, &matchLength) != -1)
            matchingLines.append(pair<int, String>(currentLineNumber, lineContent));

        lineStart = nextLineStart;
    }
    return matchingLines;
}
// Wraps a matching line (its number and its text) in a
// TypeBuilder::Page::SearchMatch object.
static PassRefPtr<TypeBuilder::Page::SearchMatch> buildObjectForSearchMatch(int lineNumber, String lineContent)
{
    RefPtr<TypeBuilder::Page::SearchMatch> searchMatch = TypeBuilder::Page::SearchMatch::create()
        .setLineNumber(lineNumber)
        .setLineContent(lineContent)
        .release();
    return searchMatch.release();
}
// Creates the RegularExpression used for a search.
//   query         - the search string.
//   caseSensitive - selects TextCaseSensitive when true, TextCaseInsensitive
//                   otherwise.
//   isRegex       - when true |query| is used verbatim as the regex source;
//                   when false it is first passed through
//                   createSearchRegexSource() so that special characters are
//                   backslash-escaped.
RegularExpression createSearchRegex(const String& query, bool caseSensitive, bool isRegex)
{
    String regexSource;
    if (isRegex)
        regexSource = query;
    else
        regexSource = createSearchRegexSource(query);

    if (caseSensitive)
        return RegularExpression(regexSource, TextCaseSensitive);
    return RegularExpression(regexSource, TextCaseInsensitive);
}
// Counts the non-empty matches of |regex| in |content|; returns 0 for empty
// content.
//
// After each match the search resumes one character past the START of that
// match (not past its end), so matches that overlap are each counted.
// Zero-length matches advance the search position but are not counted.
int countRegularExpressionMatches(const RegularExpression& regex, const String& content)
{
    if (content.isEmpty())
        return 0;

    const unsigned contentLength = content.length();
    int matchCount = 0;
    unsigned searchFrom = 0;
    int matchLength;
    for (;;) {
        const int matchPosition = regex.match(content, searchFrom, &matchLength);
        if (matchPosition == -1)
            break;
        // A match reported for a search that started at or beyond the end of
        // the content is ignored and ends the scan.
        if (searchFrom >= contentLength)
            break;
        if (matchLength > 0)
            ++matchCount;
        searchFrom = matchPosition + 1;
    }
    return matchCount;
}
// Searches |text| line by line for |query| and returns an array holding one
// SearchMatch (line number and line content) per matching line.
// |caseSensitive| and |isRegex| are forwarded to createSearchRegex() to build
// the regular expression that is applied to each line.
PassRefPtr<TypeBuilder::Array<TypeBuilder::Page::SearchMatch> > searchInTextByLines(const String& text, const String& query, const bool caseSensitive, const bool isRegex)
{
    typedef TypeBuilder::Array<TypeBuilder::Page::SearchMatch> SearchMatchArray;

    RegularExpression searchRegex = ContentSearchUtils::createSearchRegex(query, caseSensitive, isRegex);
    Vector<pair<int, String> > matchingLines = getRegularExpressionMatchesByLines(searchRegex, text);

    RefPtr<SearchMatchArray> searchMatches = SearchMatchArray::create();
    for (size_t i = 0; i < matchingLines.size(); ++i) {
        const pair<int, String>& lineMatch = matchingLines[i];
        searchMatches->addItem(buildObjectForSearchMatch(lineMatch.first, lineMatch.second));
    }
    return searchMatches;
}
// Extracts the value of a "//@ <name>=<value>" magic comment from |content|.
//
// The pattern built below requires "//@", exactly one space or tab, |name|,
// "=", optional spaces/tabs, then captures a (possibly empty) run of
// characters that are neither whitespace nor quote characters, followed by
// optional spaces/tabs and "$". |name| is inserted into the pattern as-is,
// without escaping.
//
// Returns the captured value, or a default-constructed String when the
// pattern does not match.
static String findMagicComment(const String& content, const String& name)
{
    String patternString = "//@[\040\t]" + name + "=[\040\t]*([^\\s\'\"]*)[\040\t]*$";
    const char* error = 0;
    // NOTE(review): the two boolean arguments are presumably ignoreCase=false
    // and multiline=true - confirm against the YarrPattern constructor.
    JSC::Yarr::YarrPattern pattern(JSC::UString(patternString.impl()), false, true, &error);
    ASSERT(!error);
    BumpPointerAllocator regexAllocator;
    OwnPtr<JSC::Yarr::BytecodePattern> bytecodePattern = JSC::Yarr::byteCompile(pattern, &regexAllocator);
    ASSERT(bytecodePattern);
    ASSERT(pattern.m_numSubpatterns == 1);
    // Output buffer for the interpreter: four offsets are reserved, and slots
    // 2 and 3 are read below as the start and end of the single capture group.
    Vector<int, 4> matches;
    matches.resize(4);
    unsigned result = JSC::Yarr::interpret(bytecodePattern.get(), JSC::UString(content.impl()), 0, reinterpret_cast<unsigned*>(matches.data()));
    if (result == JSC::Yarr::offsetNoMatch)
        return String();
    ASSERT(matches[2] > 0 && matches[3] > 0);
    return content.substring(matches[2], matches[3] - matches[2]);
}
// Returns the value that findMagicComment() extracts from |content| for the
// "sourceURL" magic comment.
String findSourceURL(const String& content)
{
    const String commentName("sourceURL");
    return findMagicComment(content, commentName);
}
// Returns the value that findMagicComment() extracts from |content| for the
// "sourceMappingURL" magic comment.
String findSourceMapURL(const String& content)
{
    const String commentName("sourceMappingURL");
    return findMagicComment(content, commentName);
}
} }
#endif // ENABLE(INSPECTOR)