mirror of
https://github.com/oven-sh/bun
synced 2026-02-18 14:51:52 +00:00
LLVM 21 has stricter warnings for character type conversions: - URLPatternParser: Change isValidNameCodepoint to accept char32_t since codePoints().begin() returns char32_t, not char16_t - EncodeURIComponent: Add explicit static_cast for char16_t to char32_t - highway_strings: Use FixedTag<uint8_t, 16> instead of ScalableTag for the preloaded vector array, since SVE types are sizeless and can't be stored in C++ arrays. Use ResizeBitCast to convert back to scalable vectors when comparing. Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
111 lines
3.9 KiB
C++
111 lines
3.9 KiB
C++
/*
|
|
* Copyright (C) 2024 Apple Inc. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS''
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
|
|
* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS
|
|
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
|
|
* THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
#include "URLPatternTokenizer.h"
|
|
#include <wtf/text/StringBuilder.h>
|
|
#include <wtf/text/WTFString.h>
|
|
|
|
namespace WebCore {
|
|
|
|
enum class EncodingCallbackType : uint8_t;
|
|
template<typename> class ExceptionOr;
|
|
|
|
namespace URLPatternUtilities {
|
|
|
|
struct Token;
|
|
enum class TokenType : uint8_t;
|
|
|
|
enum class PartType : uint8_t { FixedText,
|
|
Regexp,
|
|
SegmentWildcard,
|
|
FullWildcard };
|
|
enum class Modifier : uint8_t { None,
|
|
Optional,
|
|
ZeroOrMore,
|
|
OneOrMore };
|
|
enum class IsFirst : bool { No,
|
|
Yes };
|
|
|
|
struct Part {
|
|
PartType type;
|
|
String value;
|
|
Modifier modifier;
|
|
String name {};
|
|
String prefix {};
|
|
String suffix {};
|
|
};
|
|
|
|
struct URLPatternStringOptions {
|
|
String delimiterCodepoint {};
|
|
String prefixCodepoint {};
|
|
bool ignoreCase { false };
|
|
};
|
|
|
|
class URLPatternParser {
|
|
public:
|
|
URLPatternParser(EncodingCallbackType, String&& segmentWildcardRegexp);
|
|
ExceptionOr<void> performParse(const URLPatternStringOptions&);
|
|
|
|
void setTokenList(Vector<Token>&& tokenList) { m_tokenList = WTF::move(tokenList); }
|
|
static ExceptionOr<Vector<Part>> parse(StringView, const URLPatternStringOptions&, EncodingCallbackType);
|
|
|
|
private:
|
|
Token tryToConsumeToken(TokenType);
|
|
Token tryToConsumeRegexOrWildcardToken(const Token&);
|
|
Token tryToConsumeModifierToken();
|
|
|
|
String consumeText();
|
|
ExceptionOr<Token> consumeRequiredToken(TokenType);
|
|
|
|
ExceptionOr<void> maybeAddPartFromPendingFixedValue();
|
|
ExceptionOr<void> addPart(String&& prefix, const Token& nameToken, const Token& regexpOrWildcardToken, String&& suffix, const Token& modifierToken);
|
|
|
|
bool isDuplicateName(StringView) const;
|
|
|
|
Vector<Part> takePartList() { return std::exchange(m_partList, {}); }
|
|
|
|
Vector<Token> m_tokenList;
|
|
Vector<Part> m_partList;
|
|
EncodingCallbackType m_callbackType;
|
|
String m_segmentWildcardRegexp;
|
|
StringBuilder m_pendingFixedValue;
|
|
size_t m_index { 0 };
|
|
int m_nextNumericName { 0 };
|
|
};
|
|
|
|
// FIXME: Consider moving functions to somewhere generic, perhaps refactor Part to its own class.
|
|
String generateSegmentWildcardRegexp(const URLPatternStringOptions&);
|
|
String escapeRegexString(StringView);
|
|
ASCIILiteral convertModifierToString(Modifier);
|
|
std::pair<String, Vector<String>> generateRegexAndNameList(const Vector<Part>& partList, const URLPatternStringOptions&);
|
|
String generatePatternString(const Vector<Part>& partList, const URLPatternStringOptions&);
|
|
String escapePatternString(StringView input);
|
|
bool isValidNameCodepoint(char32_t codepoint, URLPatternUtilities::IsFirst);
|
|
|
|
} // namespace URLPatternUtilities
|
|
} // namespace WebCore
|