pkg/_fe_analyzer_shared/lib/src/scanner/token_impl.dart - sdk - Git at Google

 // Copyright (c) 2011, the Dart project authors.  Please see the AUTHORS file
 // for details. All rights reserved. Use of this source code is governed by a
 // BSD-style license that can be found in the LICENSE file.

 library _fe_analyzer_shared.scanner.token;

 import 'dart:typed_data' show Uint8List;

 import 'token.dart'
     show
         DocumentationCommentToken,
         SimpleToken,
         TokenType,
         CommentToken,
         StringToken,
         LanguageVersionToken;

 import 'token_constants.dart' show IDENTIFIER_TOKEN;

 import 'string_canonicalizer.dart';

 /**
  * A String-valued token. Represents identifiers, string literals,
  * number literals, comments, and error tokens, using the corresponding
  * precedence info.
  */
 class StringTokenImpl extends SimpleToken implements StringToken {
   /**
    * The length threshold above which substring tokens are computed lazily.
    *
    * For string tokens that are substrings of the program source, the actual
    * substring extraction is performed lazily. This is beneficial because
    * not all scanned code are actually used. For unused parts, the substrings
    * are never computed and allocated.
    */
   static const int LAZY_THRESHOLD = 4;

   late Object /* String | LazySubstring */ valueOrLazySubstring;

   /**
    * Creates a non-lazy string token. If [canonicalize] is true, the string
    * is canonicalized before the token is created.
    */
   StringTokenImpl.fromString(
     TokenType type,
     String value,
     int charOffset, {
     bool canonicalize = false,
     CommentToken? precedingComments,
   }) : valueOrLazySubstring = canonicalize ? canonicalizeString(value) : value,
        super(type, charOffset, precedingComments);

   /**
    * Creates a lazy string token. If [canonicalize] is true, the string
    * is canonicalized before the token is created.
    */
   StringTokenImpl.fromSubstring(
     TokenType type,
     String data,
     int start,
     int end,
     int charOffset, {
     bool canonicalize = false,
     CommentToken? precedingComments,
     bool allowLazy = true,
   }) : super(type, charOffset, precedingComments) {
     int length = end - start;
     if (!allowLazy || length <= LAZY_THRESHOLD) {
       valueOrLazySubstring =
           canonicalize
               ? canonicalizeSubString(data, start, end)
               : data.substring(start, end);
     } else {
       valueOrLazySubstring = new _LazySubstring(
         data,
         start,
         length,
         canonicalize,
       );
     }
   }

   /**
    * Creates a lazy string token. If [asciiOnly] is false, the byte array
    * is passed through a UTF-8 decoder.
    */
   StringTokenImpl.fromUtf8Bytes(
     TokenType type,
     Uint8List data,
     int start,
     int end,
     bool asciiOnly,
     int charOffset, {
     CommentToken? precedingComments,
     bool allowLazy = true,
   }) : super(type, charOffset, precedingComments) {
     int length = end - start;
     if (!allowLazy || length <= LAZY_THRESHOLD) {
       valueOrLazySubstring = canonicalizeUtf8SubString(
         data,
         start,
         end,
         asciiOnly,
       );
     } else {
       valueOrLazySubstring = new _LazySubstring(data, start, length, asciiOnly);
     }
   }

   @override
   String get lexeme => valueOrLazySubstring = valueOrLazySubstring.toString();

   @override
   bool get isIdentifier => kind == IDENTIFIER_TOKEN;

   @override
   String toString() => lexeme;

   @override
   String value() => lexeme;
 }

 class CommentTokenImpl extends StringTokenImpl implements CommentToken {
   @override
   SimpleToken? parent;

   /**
    * Creates a lazy comment token. If [canonicalize] is true, the string
    * is canonicalized before the token is created.
    */
   CommentTokenImpl.fromSubstring(
     super.type,
     super.data,
     super.start,
     super.end,
     super.charOffset, {
     super.canonicalize,
   }) : super.fromSubstring();

   /**
    * Creates a non-lazy comment token.
    */
   CommentTokenImpl.fromString(super.type, super.lexeme, super.charOffset)
     : super.fromString();

   /**
    * Creates a lazy string token. If [asciiOnly] is false, the byte array
    * is passed through a UTF-8 decoder.
    */
   CommentTokenImpl.fromUtf8Bytes(
     super.type,
     super.data,
     super.start,
     super.end,
     super.asciiOnly,
     super.charOffset,
   ) : super.fromUtf8Bytes();
 }

 class LanguageVersionTokenImpl extends CommentTokenImpl
     implements LanguageVersionToken {
   @override
   int major;

   @override
   int minor;

   LanguageVersionTokenImpl.from(String text, int offset, this.major, this.minor)
     : super.fromString(TokenType.SINGLE_LINE_COMMENT, text, offset);

   LanguageVersionTokenImpl.fromSubstring(
     String string,
     int start,
     int end,
     int tokenStart,
     this.major,
     this.minor, {
     bool canonicalize = false,
   }) : super.fromSubstring(
          TokenType.SINGLE_LINE_COMMENT,
          string,
          start,
          end,
          tokenStart,
          canonicalize: canonicalize,
        );

   LanguageVersionTokenImpl.fromUtf8Bytes(
     Uint8List bytes,
     int start,
     int end,
     int tokenStart,
     this.major,
     this.minor,
   ) : super.fromUtf8Bytes(
         TokenType.SINGLE_LINE_COMMENT,
         bytes,
         start,
         end,
         true,
         tokenStart,
       );
 }

 class DartDocToken extends CommentTokenImpl
     implements DocumentationCommentToken {
   /**
    * Creates a lazy comment token. If [canonicalize] is true, the string
    * is canonicalized before the token is created.
    */
   DartDocToken.fromSubstring(
     super.type,
     super.data,
     super.start,
     super.end,
     super.charOffset, {
     super.canonicalize,
   }) : super.fromSubstring();

   /**
    * Creates a lazy string token. If [asciiOnly] is false, the byte array
    * is passed through a UTF-8 decoder.
    */
   DartDocToken.fromUtf8Bytes(
     super.type,
     super.data,
     super.start,
     super.end,
     super.asciiOnly,
     super.charOffset,
   ) : super.fromUtf8Bytes();
 }

 /**
  * This class represents the necessary information to compute a substring
  * lazily. The substring can either originate from a string or from
  * a [:Uint8List:] of UTF-8 bytes.
  */
 abstract class _LazySubstring {
   /** The original data, either a string or a Uint8List */
   Object get data;

   int get start;
   int get length;

   /**
    * If this substring is based on a String, the [boolValue] indicates whether
    * the resulting substring should be canonicalized.
    *
    * For substrings based on a byte array, the [boolValue] is true if the
    * array only holds ASCII characters. The resulting substring will be
    * canonicalized after decoding.
    */
   bool get boolValue;

   _LazySubstring.internal();

   factory _LazySubstring(Object data, int start, int length, bool b) {
     // See comment on [CompactLazySubstring].
     if (start < 0x100000 && length < 0x200) {
       int fields = (start << 9);
       fields = fields | length;
       fields = fields << 1;
       if (b) fields |= 1;
       return new _CompactLazySubstring(data, fields);
     } else {
       return new _FullLazySubstring(data, start, length, b);
     }
   }

   String _resolve() {
     Object data = this.data;
     int start = this.start;
     int end = start + this.length;
     if (data is String) {
       final bool canonicalize = this.boolValue;
       return canonicalize
           ? canonicalizeSubString(data, start, end)
           : data.substring(start, end);
     } else {
       final Uint8List bytes = data as Uint8List;
       final bool isAscii = this.boolValue;
       return canonicalizeUtf8SubString(bytes, start, end, isAscii);
     }
   }

   @override
   String toString() => _resolve();
 }

 /**
  * This class encodes [start], [length] and [boolValue] in a single
  * 30 bit integer. It uses 20 bits for [start], which covers source files
  * of 1MB. [length] has 9 bits, which covers 512 characters.
  *
  * The file html_dart2js.dart is currently around 1MB.
  */
 class _CompactLazySubstring extends _LazySubstring {
   @override
   final Object data;
   final int fields;

   _CompactLazySubstring(this.data, this.fields) : super.internal();

   @override
   int get start => fields >> 10;
   @override
   int get length => (fields >> 1) & 0x1ff;
   @override
   bool get boolValue => (fields & 1) == 1;
 }

 class _FullLazySubstring extends _LazySubstring {
   @override
   final Object data;
   @override
   final int start;
   @override
   final int length;
   @override
   final bool boolValue;
   _FullLazySubstring(this.data, this.start, this.length, this.boolValue)
     : super.internal();
 }

 bool isUserDefinableOperator(String value) {
   return isBinaryOperator(value) ||
       isMinusOperator(value) ||
       isTernaryOperator(value) ||
       isUnaryOperator(value);
 }

 bool isUnaryOperator(String value) => identical(value, "~");

 bool isBinaryOperator(String value) {
   return identical(value, "==") ||
       identical(value, "[]") ||
       identical(value, "*") ||
       identical(value, "/") ||
       identical(value, "%") ||
       identical(value, "~/") ||
       identical(value, "+") ||
       identical(value, "<<") ||
       identical(value, ">>") ||
       identical(value, ">>>") ||
       identical(value, ">=") ||
       identical(value, ">") ||
       identical(value, "<=") ||
       identical(value, "<") ||
       identical(value, "&") ||
       identical(value, "^") ||
       identical(value, "|");
 }

 bool isTernaryOperator(String value) => identical(value, "[]=");

 bool isMinusOperator(String value) => identical(value, "-");
	// Copyright (c) 2011, the Dart project authors. Please see the AUTHORS file
	// for details. All rights reserved. Use of this source code is governed by a
	// BSD-style license that can be found in the LICENSE file.

	library _fe_analyzer_shared.scanner.token;

	import 'dart:typed_data' show Uint8List;

	import 'token.dart'
	show
	DocumentationCommentToken,
	SimpleToken,
	TokenType,
	CommentToken,
	StringToken,
	LanguageVersionToken;

	import 'token_constants.dart' show IDENTIFIER_TOKEN;

	import 'string_canonicalizer.dart';

	/**
	* A String-valued token. Represents identifiers, string literals,
	* number literals, comments, and error tokens, using the corresponding
	* precedence info.
	*/
	class StringTokenImpl extends SimpleToken implements StringToken {
	/**
	* The length threshold above which substring tokens are computed lazily.
	*
	* For string tokens that are substrings of the program source, the actual
	* substring extraction is performed lazily. This is beneficial because
	* not all scanned code are actually used. For unused parts, the substrings
	* are never computed and allocated.
	*/
	static const int LAZY_THRESHOLD = 4;

	late Object /* String \| LazySubstring */ valueOrLazySubstring;

	/**
	* Creates a non-lazy string token. If [canonicalize] is true, the string
	* is canonicalized before the token is created.
	*/
	StringTokenImpl.fromString(
	TokenType type,
	String value,
	int charOffset, {
	bool canonicalize = false,
	CommentToken? precedingComments,
	}) : valueOrLazySubstring = canonicalize ? canonicalizeString(value) : value,
	super(type, charOffset, precedingComments);

	/**
	* Creates a lazy string token. If [canonicalize] is true, the string
	* is canonicalized before the token is created.
	*/
	StringTokenImpl.fromSubstring(
	TokenType type,
	String data,
	int start,
	int end,
	int charOffset, {
	bool canonicalize = false,
	CommentToken? precedingComments,
	bool allowLazy = true,
	}) : super(type, charOffset, precedingComments) {
	int length = end - start;
	if (!allowLazy \|\| length <= LAZY_THRESHOLD) {
	valueOrLazySubstring =
	canonicalize
	? canonicalizeSubString(data, start, end)
	: data.substring(start, end);
	} else {
	valueOrLazySubstring = new _LazySubstring(
	data,
	start,
	length,
	canonicalize,
	);
	}
	}

	/**
	* Creates a lazy string token. If [asciiOnly] is false, the byte array
	* is passed through a UTF-8 decoder.
	*/
	StringTokenImpl.fromUtf8Bytes(
	TokenType type,
	Uint8List data,
	int start,
	int end,
	bool asciiOnly,
	int charOffset, {
	CommentToken? precedingComments,
	bool allowLazy = true,
	}) : super(type, charOffset, precedingComments) {
	int length = end - start;
	if (!allowLazy \|\| length <= LAZY_THRESHOLD) {
	valueOrLazySubstring = canonicalizeUtf8SubString(
	data,
	start,
	end,
	asciiOnly,
	);
	} else {
	valueOrLazySubstring = new _LazySubstring(data, start, length, asciiOnly);
	}
	}

	@override
	String get lexeme => valueOrLazySubstring = valueOrLazySubstring.toString();

	@override
	bool get isIdentifier => kind == IDENTIFIER_TOKEN;

	@override
	String toString() => lexeme;

	@override
	String value() => lexeme;
	}

	class CommentTokenImpl extends StringTokenImpl implements CommentToken {
	@override
	SimpleToken? parent;

	/**
	* Creates a lazy comment token. If [canonicalize] is true, the string
	* is canonicalized before the token is created.
	*/
	CommentTokenImpl.fromSubstring(
	super.type,
	super.data,
	super.start,
	super.end,
	super.charOffset, {
	super.canonicalize,
	}) : super.fromSubstring();

	/**
	* Creates a non-lazy comment token.
	*/
	CommentTokenImpl.fromString(super.type, super.lexeme, super.charOffset)
	: super.fromString();

	/**
	* Creates a lazy string token. If [asciiOnly] is false, the byte array
	* is passed through a UTF-8 decoder.
	*/
	CommentTokenImpl.fromUtf8Bytes(
	super.type,
	super.data,
	super.start,
	super.end,
	super.asciiOnly,
	super.charOffset,
	) : super.fromUtf8Bytes();
	}

	class LanguageVersionTokenImpl extends CommentTokenImpl
	implements LanguageVersionToken {
	@override
	int major;

	@override
	int minor;

	LanguageVersionTokenImpl.from(String text, int offset, this.major, this.minor)
	: super.fromString(TokenType.SINGLE_LINE_COMMENT, text, offset);

	LanguageVersionTokenImpl.fromSubstring(
	String string,
	int start,
	int end,
	int tokenStart,
	this.major,
	this.minor, {
	bool canonicalize = false,
	}) : super.fromSubstring(
	TokenType.SINGLE_LINE_COMMENT,
	string,
	start,
	end,
	tokenStart,
	canonicalize: canonicalize,
	);

	LanguageVersionTokenImpl.fromUtf8Bytes(
	Uint8List bytes,
	int start,
	int end,
	int tokenStart,
	this.major,
	this.minor,
	) : super.fromUtf8Bytes(
	TokenType.SINGLE_LINE_COMMENT,
	bytes,
	start,
	end,
	true,
	tokenStart,
	);
	}

	class DartDocToken extends CommentTokenImpl
	implements DocumentationCommentToken {
	/**
	* Creates a lazy comment token. If [canonicalize] is true, the string
	* is canonicalized before the token is created.
	*/
	DartDocToken.fromSubstring(
	super.type,
	super.data,
	super.start,
	super.end,
	super.charOffset, {
	super.canonicalize,
	}) : super.fromSubstring();

	/**
	* Creates a lazy string token. If [asciiOnly] is false, the byte array
	* is passed through a UTF-8 decoder.
	*/
	DartDocToken.fromUtf8Bytes(
	super.type,
	super.data,
	super.start,
	super.end,
	super.asciiOnly,
	super.charOffset,
	) : super.fromUtf8Bytes();
	}

	/**
	* This class represents the necessary information to compute a substring
	* lazily. The substring can either originate from a string or from
	* a [:Uint8List:] of UTF-8 bytes.
	*/
	abstract class _LazySubstring {
	/** The original data, either a string or a Uint8List */
	Object get data;

	int get start;
	int get length;

	/**
	* If this substring is based on a String, the [boolValue] indicates whether
	* the resulting substring should be canonicalized.
	*
	* For substrings based on a byte array, the [boolValue] is true if the
	* array only holds ASCII characters. The resulting substring will be
	* canonicalized after decoding.
	*/
	bool get boolValue;

	_LazySubstring.internal();

	factory _LazySubstring(Object data, int start, int length, bool b) {
	// See comment on [CompactLazySubstring].
	if (start < 0x100000 && length < 0x200) {
	int fields = (start << 9);
	fields = fields \| length;
	fields = fields << 1;
	if (b) fields \|= 1;
	return new _CompactLazySubstring(data, fields);
	} else {
	return new _FullLazySubstring(data, start, length, b);
	}
	}

	String _resolve() {
	Object data = this.data;
	int start = this.start;
	int end = start + this.length;
	if (data is String) {
	final bool canonicalize = this.boolValue;
	return canonicalize
	? canonicalizeSubString(data, start, end)
	: data.substring(start, end);
	} else {
	final Uint8List bytes = data as Uint8List;
	final bool isAscii = this.boolValue;
	return canonicalizeUtf8SubString(bytes, start, end, isAscii);
	}
	}

	@override
	String toString() => _resolve();
	}

	/**
	* This class encodes [start], [length] and [boolValue] in a single
	* 30 bit integer. It uses 20 bits for [start], which covers source files
	* of 1MB. [length] has 9 bits, which covers 512 characters.
	*
	* The file html_dart2js.dart is currently around 1MB.
	*/
	class _CompactLazySubstring extends _LazySubstring {
	@override
	final Object data;
	final int fields;

	_CompactLazySubstring(this.data, this.fields) : super.internal();

	@override
	int get start => fields >> 10;
	@override
	int get length => (fields >> 1) & 0x1ff;
	@override
	bool get boolValue => (fields & 1) == 1;
	}

	class _FullLazySubstring extends _LazySubstring {
	@override
	final Object data;
	@override
	final int start;
	@override
	final int length;
	@override
	final bool boolValue;
	_FullLazySubstring(this.data, this.start, this.length, this.boolValue)
	: super.internal();
	}

	bool isUserDefinableOperator(String value) {
	return isBinaryOperator(value) \|\|
	isMinusOperator(value) \|\|
	isTernaryOperator(value) \|\|
	isUnaryOperator(value);
	}

	bool isUnaryOperator(String value) => identical(value, "~");

	bool isBinaryOperator(String value) {
	return identical(value, "==") \|\|
	identical(value, "[]") \|\|
	identical(value, "*") \|\|
	identical(value, "/") \|\|
	identical(value, "%") \|\|
	identical(value, "~/") \|\|
	identical(value, "+") \|\|
	identical(value, "<<") \|\|
	identical(value, ">>") \|\|
	identical(value, ">>>") \|\|
	identical(value, ">=") \|\|
	identical(value, ">") \|\|
	identical(value, "<=") \|\|
	identical(value, "<") \|\|
	identical(value, "&") \|\|
	identical(value, "^") \|\|
	identical(value, "\|");
	}

	bool isTernaryOperator(String value) => identical(value, "[]=");

	bool isMinusOperator(String value) => identical(value, "-");