blob: e2de33df915bf8ef355873347532622f083a19b9 [file] [log] [blame]
// Copyright (c) 2022, the Dart project authors. Please see the AUTHORS file
// for details. All rights reserved. Use of this source code is governed by a
// BSD-style license that can be found in the LICENSE file.
part of dart._js_helper;
// TODO(joshualitt): This is a fork of the DDC RegExp class. In the longer term,
// with careful factoring we may be able to share this code.
// TODO(joshualitt): We should be able to build this library off of static
// interop.
/// Returns a string for a RegExp pattern that matches [string]. This is done by
/// escaping all RegExp metacharacters.
@pragma('wasm:import', 'dart2wasm.quoteStringForRegExp')
external String quoteStringForRegExp(String string);
class JSNativeMatch extends JSArray {
JSNativeMatch(WasmAnyRef ref) : super(ref);
static JSNativeMatch? box(WasmAnyRef? ref) =>
isDartNull(ref) ? null : JSNativeMatch(ref!);
String get input => jsStringToDartString(
getPropertyRaw(this.toAnyRef(), 'input'.toAnyRef())!);
int get index =>
toDartNumber(getPropertyRaw(this.toAnyRef(), 'index'.toAnyRef())!)
.floor();
JSObject? get groups =>
JSObject.box(getPropertyRaw(this.toAnyRef(), 'groups'.toAnyRef()));
}
class JSNativeRegExp extends JSValue {
JSNativeRegExp(WasmAnyRef ref) : super(ref);
JSNativeMatch? exec(String string) => JSNativeMatch.box(callMethodVarArgsRaw(
this.toAnyRef(), 'exec'.toAnyRef(), [string].toAnyRef()));
bool test(String string) => toDartBool(callMethodVarArgsRaw(
this.toAnyRef(), 'test'.toAnyRef(), [string].toAnyRef())!);
String get flags => jsStringToDartString(
getPropertyRaw(this.toAnyRef(), 'flags'.toAnyRef())!);
bool get multiline =>
toDartBool(getPropertyRaw(this.toAnyRef(), 'multiline'.toAnyRef())!);
bool get ignoreCase =>
toDartBool(getPropertyRaw(this.toAnyRef(), 'ignoreCase'.toAnyRef())!);
bool get unicode =>
toDartBool(getPropertyRaw(this.toAnyRef(), 'unicode'.toAnyRef())!);
bool get dotAll =>
toDartBool(getPropertyRaw(this.toAnyRef(), 'dotAll'.toAnyRef())!);
set lastIndex(int start) => setPropertyRaw(
this.toAnyRef(), 'lastIndex'.toAnyRef(), intToJSNumber(start));
}
class JSSyntaxRegExp implements RegExp {
final String pattern;
final JSNativeRegExp _nativeRegExp;
JSNativeRegExp? _nativeGlobalRegExp;
JSNativeRegExp? _nativeAnchoredRegExp;
String toString() => 'RegExp/$pattern/' + _nativeRegExp.flags;
JSSyntaxRegExp(String source,
{bool multiLine: false,
bool caseSensitive: true,
bool unicode: false,
bool dotAll: false})
: this.pattern = source,
this._nativeRegExp = makeNative(
source, multiLine, caseSensitive, unicode, dotAll, false);
JSNativeRegExp get _nativeGlobalVersion {
if (_nativeGlobalRegExp != null) return _nativeGlobalRegExp!;
return _nativeGlobalRegExp = makeNative(
pattern, isMultiLine, isCaseSensitive, isUnicode, isDotAll, true);
}
JSNativeRegExp get _nativeAnchoredVersion {
if (_nativeAnchoredRegExp != null) return _nativeAnchoredRegExp!;
// An "anchored version" of a regexp is created by adding "|()" to the
// source. This means that the regexp always matches at the first position
// that it tries, and you can see if the original regexp matched, or it
// was the added zero-width match that matched, by looking at the last
// capture. If it is a String, the match participated, otherwise it didn't.
return _nativeAnchoredRegExp = makeNative(
'$pattern|()', isMultiLine, isCaseSensitive, isUnicode, isDotAll, true);
}
bool get isMultiLine => _nativeRegExp.multiline;
bool get isCaseSensitive => _nativeRegExp.ignoreCase;
bool get isUnicode => _nativeRegExp.unicode;
bool get isDotAll => _nativeRegExp.dotAll;
static JSNativeRegExp makeNative(String source, bool multiLine,
bool caseSensitive, bool unicode, bool dotAll, bool global) {
String m = multiLine == true ? 'm' : '';
String i = caseSensitive == true ? '' : 'i';
String u = unicode ? 'u' : '';
String s = dotAll ? 's' : '';
String g = global ? 'g' : '';
String modifiers = '$m$i$u$s$g';
// The call to create the regexp is wrapped in a try catch so we can
// reformat the exception if need be.
WasmAnyRef result = safeCallConstructorVarArgsRaw(
getConstructorRaw('RegExp'), [source, modifiers].toAnyRef());
if (isJSRegExp(result)) return JSNativeRegExp(result);
// The returned value is the stringified JavaScript exception. Turn it into
// a Dart exception.
String errorMessage = jsStringToDartString(result);
throw new FormatException('Illegal RegExp pattern ($errorMessage)', source);
}
RegExpMatch? firstMatch(String string) {
JSNativeMatch? m = _nativeRegExp.exec(string);
if (m == null) return null;
return new _MatchImplementation(this, m);
}
bool hasMatch(String string) {
return _nativeRegExp.test(string);
}
String? stringMatch(String string) {
var match = firstMatch(string);
if (match != null) return match.group(0);
return null;
}
Iterable<RegExpMatch> allMatches(String string, [int start = 0]) {
if (start < 0 || start > string.length) {
throw new RangeError.range(start, 0, string.length);
}
return _AllMatchesIterable(this, string, start);
}
RegExpMatch? _execGlobal(String string, int start) {
JSNativeRegExp regexp = _nativeGlobalVersion;
regexp.lastIndex = start;
JSNativeMatch? match = regexp.exec(string);
if (match == null) return null;
return new _MatchImplementation(this, match);
}
RegExpMatch? _execAnchored(String string, int start) {
JSNativeRegExp regexp = _nativeAnchoredVersion;
regexp.lastIndex = start;
JSNativeMatch? match = regexp.exec(string);
if (match == null) return null;
// If the last capture group participated, the original regexp did not
// match at the start position.
if (match.pop() != null) return null;
return new _MatchImplementation(this, match);
}
RegExpMatch? matchAsPrefix(String string, [int start = 0]) {
if (start < 0 || start > string.length) {
throw new RangeError.range(start, 0, string.length);
}
return _execAnchored(string, start);
}
}
class _MatchImplementation implements RegExpMatch {
final Pattern pattern;
// Contains a JS RegExp match object.
// It is an Array of String values with extra 'index' and 'input' properties.
// If there were named capture groups, there will also be an extra 'groups'
// property containing an object with capture group names as keys and
// matched strings as values.
final JSNativeMatch _match;
_MatchImplementation(this.pattern, this._match);
String get input => _match.input;
int get start => _match.index;
int get end => (start + (_match[0].toString()).length);
String? group(int index) => _match[index]?.toString();
String? operator [](int index) => group(index);
int get groupCount => _match.length - 1;
List<String?> groups(List<int> groups) {
List<String?> out = [];
for (int i in groups) {
out.add(group(i));
}
return out;
}
String? namedGroup(String name) {
JSObject? groups = _match.groups;
if (groups != null) {
JSValue? result = groups[name];
if (result != null ||
hasPropertyRaw(groups.toAnyRef(), name.toAnyRef())) {
return result?.toString();
}
}
throw ArgumentError.value(name, "name", "Not a capture group name");
}
Iterable<String> get groupNames {
JSObject? groups = _match.groups;
if (groups != null) {
return JSArrayIterableAdapter<String>(objectKeys(groups));
}
return Iterable.empty();
}
}
class _AllMatchesIterable extends IterableBase<RegExpMatch> {
final JSSyntaxRegExp _re;
final String _string;
final int _start;
_AllMatchesIterable(this._re, this._string, this._start);
Iterator<RegExpMatch> get iterator =>
new _AllMatchesIterator(_re, _string, _start);
}
class _AllMatchesIterator implements Iterator<RegExpMatch> {
final JSSyntaxRegExp _regExp;
String? _string;
int _nextIndex;
RegExpMatch? _current;
_AllMatchesIterator(this._regExp, this._string, this._nextIndex);
RegExpMatch get current => _current as RegExpMatch;
static bool _isLeadSurrogate(int c) {
return c >= 0xd800 && c <= 0xdbff;
}
static bool _isTrailSurrogate(int c) {
return c >= 0xdc00 && c <= 0xdfff;
}
bool moveNext() {
var string = _string;
if (string == null) return false;
if (_nextIndex <= string.length) {
RegExpMatch? match = _regExp._execGlobal(string, _nextIndex);
if (match != null) {
_current = match;
int nextIndex = match.end;
if (match.start == nextIndex) {
// Zero-width match. Advance by one more, unless the regexp
// is in unicode mode and it would put us within a surrogate
// pair. In that case, advance past the code point as a whole.
if (_regExp.isUnicode &&
_nextIndex + 1 < string.length &&
_isLeadSurrogate(string.codeUnitAt(_nextIndex)) &&
_isTrailSurrogate(string.codeUnitAt(_nextIndex + 1))) {
nextIndex++;
}
nextIndex++;
}
_nextIndex = nextIndex;
return true;
}
}
_current = null;
_string = null; // Marks iteration as ended.
return false;
}
}