/* * Copyright (C) 2011 Google Inc. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are * met: * * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above * copyright notice, this list of conditions and the following disclaimer * in the documentation and/or other materials provided with the * distribution. * * THIS SOFTWARE IS PROVIDED BY GOOGLE INC. AND ITS CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GOOGLE INC. * OR ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "config.h" #include "ContentSearchUtilities.h" #include "InspectorValues.h" #include "RegularExpression.h" #include "Yarr.h" #include "YarrInterpreter.h" #include #include #include using namespace JSC::Yarr; namespace Inspector { namespace ContentSearchUtilities { static const char regexSpecialCharacters[] = "[](){}+-*.,?\\^$|"; static String createSearchRegexSource(const String& text) { StringBuilder result; for (unsigned i = 0; i < text.length(); i++) { UChar character = text[i]; if (isASCII(character) && strchr(regexSpecialCharacters, character)) result.append('\\'); result.append(character); } return result.toString(); } static inline size_t sizetExtractor(const size_t* value) { return *value; } TextPosition textPositionFromOffset(size_t offset, const Vector& lineEndings) { const size_t* foundNextStart = approximateBinarySearch(lineEndings, lineEndings.size(), offset, sizetExtractor); size_t lineIndex = foundNextStart - &lineEndings.at(0); if (offset >= *foundNextStart) ++lineIndex; size_t lineStartOffset = lineIndex > 0 ? lineEndings.at(lineIndex - 1) : 0; size_t column = offset - lineStartOffset; return TextPosition(OrdinalNumber::fromZeroBasedInt(lineIndex), OrdinalNumber::fromZeroBasedInt(column)); } static Vector> getRegularExpressionMatchesByLines(const JSC::Yarr::RegularExpression& regex, const String& text) { Vector> result; if (text.isEmpty()) return result; std::unique_ptr> endings(lineEndings(text)); size_t size = endings->size(); size_t start = 0; for (size_t lineNumber = 0; lineNumber < size; ++lineNumber) { size_t nextStart = endings->at(lineNumber); String line = text.substring(start, nextStart - start); int matchLength; if (regex.match(line, 0, &matchLength) != -1) result.append(std::pair(lineNumber, line)); start = nextStart; } return result; } std::unique_ptr> lineEndings(const String& text) { auto result = std::make_unique>(); size_t start = 0; while (start < text.length()) { size_t nextStart = text.findNextLineStart(start); if (nextStart == notFound) { result->append(text.length()); break; } result->append(nextStart); start = nextStart; } result->append(text.length()); return result; } static Ref buildObjectForSearchMatch(size_t lineNumber, const String& lineContent) { return Inspector::Protocol::GenericTypes::SearchMatch::create() .setLineNumber(lineNumber) .setLineContent(lineContent) .release(); } JSC::Yarr::RegularExpression createSearchRegex(const String& query, bool caseSensitive, bool isRegex) { String regexSource = isRegex ? query : createSearchRegexSource(query); return JSC::Yarr::RegularExpression(regexSource, caseSensitive ? TextCaseSensitive : TextCaseInsensitive); } int countRegularExpressionMatches(const JSC::Yarr::RegularExpression& regex, const String& content) { if (content.isEmpty()) return 0; int result = 0; int position; unsigned start = 0; int matchLength; while ((position = regex.match(content, start, &matchLength)) != -1) { if (start >= content.length()) break; if (matchLength > 0) ++result; start = position + 1; } return result; } Ref> searchInTextByLines(const String& text, const String& query, const bool caseSensitive, const bool isRegex) { Ref> result = Inspector::Protocol::Array::create(); JSC::Yarr::RegularExpression regex = ContentSearchUtilities::createSearchRegex(query, caseSensitive, isRegex); Vector> matches = getRegularExpressionMatchesByLines(regex, text); for (const auto& match : matches) { Ref matchObject = buildObjectForSearchMatch(match.first, match.second); result->addItem(WTFMove(matchObject)); } return result; } static String stylesheetCommentPattern(const String& name) { // "/*# = */" and deprecated "/*@" return "/\\*[#@][\040\t]" + name + "=[\040\t]*([^\\s\'\"]*)[\040\t]*\\*/"; } static String findMagicComment(const String& content, const String& patternString) { ASSERT(!content.isNull()); const char* error = nullptr; JSC::Yarr::YarrPattern pattern(patternString, JSC::RegExpFlags::FlagMultiline, &error); ASSERT(!error); BumpPointerAllocator regexAllocator; auto bytecodePattern = JSC::Yarr::byteCompile(pattern, ®exAllocator); ASSERT(bytecodePattern); ASSERT(pattern.m_numSubpatterns == 1); Vector matches; matches.resize(4); unsigned result = JSC::Yarr::interpret(bytecodePattern.get(), content, 0, reinterpret_cast(matches.data())); if (result == JSC::Yarr::offsetNoMatch) return String(); ASSERT(matches[2] > 0 && matches[3] > 0); return content.substring(matches[2], matches[3] - matches[2]); } String findStylesheetSourceMapURL(const String& content) { return findMagicComment(content, stylesheetCommentPattern(ASCIILiteral("sourceMappingURL"))); } } // namespace ContentSearchUtilities } // namespace Inspector