mirror of
https://github.com/LadybirdBrowser/ladybird.git
synced 2025-10-24 00:49:46 +00:00
For the web, we allow a wobbly UTF-16 encoding (i.e. lonely surrogates are permitted). Only in a few exceptional cases do we strictly require valid UTF-16. As such, our `validate(AllowLonelySurrogates::Yes)` calls will always succeed. It's a wasted effort to ever make such a check. This patch eliminates such invocations. The validation methods will now only check for strict UTF-16, and are only invoked when needed.
110 lines
4.4 KiB
C++
110 lines
4.4 KiB
C++
/*
|
|
* Copyright (c) 2022, LI YUBEI <leeight@gmail.com>
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
#include <AK/Optional.h>
|
|
#include <AK/Utf16String.h>
|
|
#include <LibJS/Forward.h>
|
|
|
|
namespace JS {
|
|
|
|
// https://github.com/tc39/proposal-regexp-legacy-features#regexp
|
|
// The %RegExp% intrinsic object, which is the builtin RegExp constructor, has the following additional internal slots:
|
|
// [[RegExpInput]]
|
|
// [[RegExpLastMatch]]
|
|
// [[RegExpLastParen]]
|
|
// [[RegExpLeftContext]]
|
|
// [[RegExpRightContext]]
|
|
// [[RegExpParen1]] ... [[RegExpParen9]]
|
|
class RegExpLegacyStaticProperties {
|
|
public:
|
|
Optional<Utf16String> const& input() const { return m_input; }
|
|
Optional<Utf16String> const& last_match() const
|
|
{
|
|
if (!m_last_match_string.has_value())
|
|
m_last_match_string = Utf16String::from_utf16(m_last_match);
|
|
return m_last_match_string;
|
|
}
|
|
Optional<Utf16String> const& last_paren() const { return m_last_paren; }
|
|
Optional<Utf16String> const& left_context() const
|
|
{
|
|
if (!m_left_context_string.has_value())
|
|
m_left_context_string = Utf16String::from_utf16(m_left_context);
|
|
return m_left_context_string;
|
|
}
|
|
Optional<Utf16String> const& right_context() const
|
|
{
|
|
if (!m_right_context_string.has_value())
|
|
m_right_context_string = Utf16String::from_utf16(m_right_context);
|
|
return m_right_context_string;
|
|
}
|
|
Optional<Utf16String> const& $1() const { return m_$1; }
|
|
Optional<Utf16String> const& $2() const { return m_$2; }
|
|
Optional<Utf16String> const& $3() const { return m_$3; }
|
|
Optional<Utf16String> const& $4() const { return m_$4; }
|
|
Optional<Utf16String> const& $5() const { return m_$5; }
|
|
Optional<Utf16String> const& $6() const { return m_$6; }
|
|
Optional<Utf16String> const& $7() const { return m_$7; }
|
|
Optional<Utf16String> const& $8() const { return m_$8; }
|
|
Optional<Utf16String> const& $9() const { return m_$9; }
|
|
|
|
void set_input(Utf16String input) { m_input = move(input); }
|
|
void set_last_match(Utf16View last_match)
|
|
{
|
|
m_last_match = last_match;
|
|
m_last_match_string = {};
|
|
}
|
|
void set_last_paren(Utf16String last_paren) { m_last_paren = move(last_paren); }
|
|
void set_left_context(Utf16View left_context)
|
|
{
|
|
m_left_context = left_context;
|
|
m_left_context_string = {};
|
|
}
|
|
void set_right_context(Utf16View right_context)
|
|
{
|
|
m_right_context = right_context;
|
|
m_right_context_string = {};
|
|
}
|
|
void set_$1(Utf16String value) { m_$1 = move(value); }
|
|
void set_$2(Utf16String value) { m_$2 = move(value); }
|
|
void set_$3(Utf16String value) { m_$3 = move(value); }
|
|
void set_$4(Utf16String value) { m_$4 = move(value); }
|
|
void set_$5(Utf16String value) { m_$5 = move(value); }
|
|
void set_$6(Utf16String value) { m_$6 = move(value); }
|
|
void set_$7(Utf16String value) { m_$7 = move(value); }
|
|
void set_$8(Utf16String value) { m_$8 = move(value); }
|
|
void set_$9(Utf16String value) { m_$9 = move(value); }
|
|
void invalidate();
|
|
|
|
private:
|
|
Optional<Utf16String> m_input;
|
|
Optional<Utf16String> m_last_paren;
|
|
Optional<Utf16String> m_$1;
|
|
Optional<Utf16String> m_$2;
|
|
Optional<Utf16String> m_$3;
|
|
Optional<Utf16String> m_$4;
|
|
Optional<Utf16String> m_$5;
|
|
Optional<Utf16String> m_$6;
|
|
Optional<Utf16String> m_$7;
|
|
Optional<Utf16String> m_$8;
|
|
Optional<Utf16String> m_$9;
|
|
|
|
// NOTE: These are views into m_input and we only turn them into full strings if/when needed.
|
|
Utf16View m_last_match;
|
|
Utf16View m_left_context;
|
|
Utf16View m_right_context;
|
|
mutable Optional<Utf16String> m_last_match_string;
|
|
mutable Optional<Utf16String> m_left_context_string;
|
|
mutable Optional<Utf16String> m_right_context_string;
|
|
};
|
|
|
|
ThrowCompletionOr<void> set_legacy_regexp_static_property(VM& vm, RegExpConstructor& constructor, Value this_value, void (RegExpLegacyStaticProperties::*property_setter)(Utf16String), Value value);
|
|
ThrowCompletionOr<Value> get_legacy_regexp_static_property(VM& vm, RegExpConstructor& constructor, Value this_value, Optional<Utf16String> const& (RegExpLegacyStaticProperties::*property_getter)() const);
|
|
void update_legacy_regexp_static_properties(RegExpConstructor& constructor, Utf16String const& string, size_t start_index, size_t end_index, Vector<Utf16String> const& captured_values);
|
|
void invalidate_legacy_regexp_static_properties(RegExpConstructor& constructor);
|
|
|
|
}
|