X-Git-Url: https://git.saurik.com/apple/javascriptcore.git/blobdiff_plain/4be4e30906bcb8ee30b4d189205cb70bad6707ce..81345200c95645a1b0d2635520f96ad55dfde63f:/inspector/ContentSearchUtilities.cpp diff --git a/inspector/ContentSearchUtilities.cpp b/inspector/ContentSearchUtilities.cpp new file mode 100644 index 0000000..bcd691b --- /dev/null +++ b/inspector/ContentSearchUtilities.cpp @@ -0,0 +1,220 @@ +/* + * Copyright (C) 2011 Google Inc. All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions are + * met: + * + * 1. Redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer. + * + * 2. Redistributions in binary form must reproduce the above + * copyright notice, this list of conditions and the following disclaimer + * in the documentation and/or other materials provided with the + * distribution. + * + * THIS SOFTWARE IS PROVIDED BY GOOGLE INC. AND ITS CONTRIBUTORS + * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT + * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR + * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GOOGLE INC. + * OR ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, + * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT + * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + */ + +#include "config.h" +#include "ContentSearchUtilities.h" + +#if ENABLE(INSPECTOR) + +#include "InspectorJSTypeBuilders.h" +#include "InspectorValues.h" +#include "RegularExpression.h" +#include "Yarr.h" +#include +#include +#include + +using namespace JSC::Yarr; + +namespace Inspector { +namespace ContentSearchUtilities { + +static const char regexSpecialCharacters[] = "[](){}+-*.,?\\^$|"; + +static String createSearchRegexSource(const String& text) +{ + StringBuilder result; + + for (unsigned i = 0; i < text.length(); i++) { + UChar character = text[i]; + if (isASCII(character) && strchr(regexSpecialCharacters, character)) + result.append('\\'); + result.append(character); + } + + return result.toString(); +} + +static inline size_t sizetExtractor(const size_t* value) +{ + return *value; +} + +TextPosition textPositionFromOffset(size_t offset, const Vector& lineEndings) +{ + const size_t* foundNextStart = approximateBinarySearch(lineEndings, lineEndings.size(), offset, sizetExtractor); + size_t lineIndex = foundNextStart - &lineEndings.at(0); + if (offset >= *foundNextStart) + ++lineIndex; + size_t lineStartOffset = lineIndex > 0 ? lineEndings.at(lineIndex - 1) : 0; + size_t column = offset - lineStartOffset; + return TextPosition(OrdinalNumber::fromZeroBasedInt(lineIndex), OrdinalNumber::fromZeroBasedInt(column)); +} + +static Vector> getRegularExpressionMatchesByLines(const JSC::Yarr::RegularExpression& regex, const String& text) +{ + Vector> result; + if (text.isEmpty()) + return result; + + std::unique_ptr> endings(lineEndings(text)); + size_t size = endings->size(); + size_t start = 0; + + for (size_t lineNumber = 0; lineNumber < size; ++lineNumber) { + size_t nextStart = endings->at(lineNumber); + String line = text.substring(start, nextStart - start); + + int matchLength; + if (regex.match(line, 0, &matchLength) != -1) + result.append(std::pair(lineNumber, line)); + + start = nextStart; + } + + return result; +} + +std::unique_ptr> lineEndings(const String& text) +{ + auto result = std::make_unique>(); + + size_t start = 0; + while (start < text.length()) { + size_t nextStart = text.findNextLineStart(start); + if (nextStart == notFound) { + result->append(text.length()); + break; + } + + result->append(nextStart); + start = nextStart; + } + + result->append(text.length()); + + return result; +} + +static PassRefPtr buildObjectForSearchMatch(size_t lineNumber, const String& lineContent) +{ + return Inspector::TypeBuilder::GenericTypes::SearchMatch::create() + .setLineNumber(lineNumber) + .setLineContent(lineContent) + .release(); +} + +JSC::Yarr::RegularExpression createSearchRegex(const String& query, bool caseSensitive, bool isRegex) +{ + String regexSource = isRegex ? query : createSearchRegexSource(query); + return JSC::Yarr::RegularExpression(regexSource, caseSensitive ? TextCaseSensitive : TextCaseInsensitive); +} + +int countRegularExpressionMatches(const JSC::Yarr::RegularExpression& regex, const String& content) +{ + if (content.isEmpty()) + return 0; + + int result = 0; + int position; + unsigned start = 0; + int matchLength; + while ((position = regex.match(content, start, &matchLength)) != -1) { + if (start >= content.length()) + break; + if (matchLength > 0) + ++result; + start = position + 1; + } + return result; +} + +PassRefPtr> searchInTextByLines(const String& text, const String& query, const bool caseSensitive, const bool isRegex) +{ + RefPtr> result = Inspector::TypeBuilder::Array::create(); + + JSC::Yarr::RegularExpression regex = ContentSearchUtilities::createSearchRegex(query, caseSensitive, isRegex); + Vector> matches = getRegularExpressionMatchesByLines(regex, text); + + for (const auto& match : matches) + result->addItem(buildObjectForSearchMatch(match.first, match.second)); + + return result; +} + +static String scriptCommentPattern(const String& name) +{ + // "//# =" and deprecated "//@" + return "//[#@][\040\t]" + name + "=[\040\t]*([^\\s\'\"]*)[\040\t]*$"; +} + +static String stylesheetCommentPattern(const String& name) +{ + // "/*# = */" and deprecated "/*@" + return "/\\*[#@][\040\t]" + name + "=[\040\t]*([^\\s\'\"]*)[\040\t]*\\*/"; +} + +static String findMagicComment(const String& content, const String& patternString) +{ + const char* error = nullptr; + JSC::Yarr::YarrPattern pattern(patternString, false, true, &error); + ASSERT(!error); + BumpPointerAllocator regexAllocator; + OwnPtr bytecodePattern = JSC::Yarr::byteCompile(pattern, ®exAllocator); + ASSERT(bytecodePattern); + + ASSERT(pattern.m_numSubpatterns == 1); + Vector matches; + matches.resize(4); + unsigned result = JSC::Yarr::interpret(bytecodePattern.get(), content, 0, reinterpret_cast(matches.data())); + if (result == JSC::Yarr::offsetNoMatch) + return String(); + + ASSERT(matches[2] > 0 && matches[3] > 0); + return content.substring(matches[2], matches[3] - matches[2]); +} + +String findScriptSourceURL(const String& content) +{ + return findMagicComment(content, scriptCommentPattern(ASCIILiteral("sourceURL"))); +} + +String findScriptSourceMapURL(const String& content) +{ + return findMagicComment(content, scriptCommentPattern(ASCIILiteral("sourceMappingURL"))); +} + +String findStylesheetSourceMapURL(const String& content) +{ + return findMagicComment(content, stylesheetCommentPattern(ASCIILiteral("sourceMappingURL"))); +} + +} // namespace ContentSearchUtilities +} // namespace Inspector + +#endif // ENABLE(INSPECTOR)