lib/src/block_syntaxes/table_syntax.dart - markdown.git - Git at Google

 // Copyright (c) 2022, the Dart project authors.  Please see the AUTHORS file
 // for details. All rights reserved. Use of this source code is governed by a
 // BSD-style license that can be found in the LICENSE file.

 import '../ast.dart';
 import '../block_parser.dart';
 import '../charcode.dart';
 import '../patterns.dart';
 import 'block_syntax.dart';

 /// Parses tables.
 class TableSyntax extends BlockSyntax {
   @override
   bool canEndBlock(BlockParser parser) => false;

   @override
   RegExp get pattern => dummyPattern;

   const TableSyntax();

   @override
   bool canParse(BlockParser parser) {
     // Note: matches *next* line, not the current one. We're looking for the
     // bar separating the head row from the body rows.
     return parser.matchesNext(tablePattern);
   }

   /// Parses a table into its three parts:
   ///
   /// * a head row of head cells (`<th>` cells)
   /// * a divider of hyphens and pipes (not rendered)
   /// * many body rows of body cells (`<td>` cells)
   @override
   Node? parse(BlockParser parser) {
     final alignments = _parseAlignments(parser.next!);
     final columnCount = alignments.length;
     final headRow = _parseRow(parser, alignments, 'th');
     if (headRow.children!.length != columnCount) {
       parser.retreat();
       return null;
     }
     final head = Element('thead', [headRow]);

     // Advance past the divider of hyphens.
     parser.advance();

     final rows = <Element>[];
     while (!parser.isDone && !BlockSyntax.isAtBlockEnd(parser)) {
       final row = _parseRow(parser, alignments, 'td');
       final children = row.children;
       if (children != null) {
         while (children.length < columnCount) {
           // Insert synthetic empty cells.
           children.add(Element('td', const []));
         }
         while (children.length > columnCount) {
           children.removeLast();
         }
       }
       while (row.children!.length > columnCount) {
         row.children!.removeLast();
       }
       rows.add(row);
     }
     if (rows.isEmpty) {
       return Element('table', [head]);
     } else {
       final body = Element('tbody', rows);

       return Element('table', [head, body]);
     }
   }

   List<String?> _parseAlignments(String line) {
     final columns = <String?>[];
     // Set the value to `true` when hitting a non whitespace character other
     // than the first pipe character.
     var started = false;
     var hitDash = false;
     String? alignment;

     for (var i = 0; i < line.length; i++) {
       final char = line.codeUnitAt(i);
       if (char == $space || char == $tab || (!started && char == $pipe)) {
         continue;
       }
       started = true;

       if (char == $colon) {
         if (hitDash) {
           alignment = alignment == 'left' ? 'center' : 'right';
         } else {
           alignment = 'left';
         }
       }

       if (char == $pipe) {
         columns.add(alignment);
         hitDash = false;
         alignment = null;
       } else {
         hitDash = true;
       }
     }

     if (hitDash) {
       columns.add(alignment);
     }

     return columns;
   }

   /// Parses a table row at the current line into a table row element, with
   /// parsed table cells.
   ///
   /// [alignments] is used to annotate an alignment on each cell, and
   /// [cellType] is used to declare either "td" or "th" cells.
   Element _parseRow(
     BlockParser parser,
     List<String?> alignments,
     String cellType,
   ) {
     final line = parser.current;
     final cells = <String>[];
     var index = _walkPastOpeningPipe(line);
     final cellBuffer = StringBuffer();

     while (true) {
       if (index >= line.length) {
         // This row ended without a trailing pipe, which is fine.
         cells.add(cellBuffer.toString().trimRight());
         cellBuffer.clear();
         break;
       }
       final ch = line.codeUnitAt(index);
       if (ch == $backslash) {
         if (index == line.length - 1) {
           // A table row ending in a backslash is not well-specified, but it
           // looks like GitHub just allows the character as part of the text of
           // the last cell.
           cellBuffer.writeCharCode(ch);
           cells.add(cellBuffer.toString().trimRight());
           cellBuffer.clear();
           break;
         }
         final escaped = line.codeUnitAt(index + 1);
         if (escaped == $pipe) {
           // GitHub Flavored Markdown has a strange bit here; the pipe is to be
           // escaped before any other inline processing. One consequence, for
           // example, is that "| `\|` |" should be parsed as a cell with a code
           // element with text "|", rather than "\|". Most parsers are not
           // compliant with this corner, but this is what is specified, and what
           // GitHub does in practice.
           cellBuffer.writeCharCode(escaped);
         } else {
           // The [InlineParser] will handle the escaping.
           cellBuffer.writeCharCode(ch);
           cellBuffer.writeCharCode(escaped);
         }
         index += 2;
       } else if (ch == $pipe) {
         cells.add(cellBuffer.toString().trimRight());
         cellBuffer.clear();
         // Walk forward past any whitespace which leads the next cell.
         index++;
         index = _walkPastWhitespace(line, index);
         if (index >= line.length) {
           // This row ended with a trailing pipe.
           break;
         }
       } else {
         cellBuffer.writeCharCode(ch);
         index++;
       }
     }
     parser.advance();
     final row = [
       for (final cell in cells) Element(cellType, [UnparsedContent(cell)])
     ];

     for (var i = 0; i < row.length && i < alignments.length; i++) {
       if (alignments[i] == null) continue;
       row[i].attributes['align'] = '${alignments[i]}';
     }

     return Element('tr', row);
   }

   /// Walks past whitespace in [line] starting at [index].
   ///
   /// Returns the index of the first non-whitespace character.
   int _walkPastWhitespace(String line, int index) {
     while (index < line.length) {
       final ch = line.codeUnitAt(index);
       if (ch != $space && ch != $tab) {
         break;
       }
       index++;
     }
     return index;
   }

   /// Walks past the opening pipe (and any whitespace that surrounds it) in
   /// [line].
   ///
   /// Returns the index of the first non-whitespace character after the pipe.
   /// If no opening pipe is found, this just returns the index of the first
   /// non-whitespace character.
   int _walkPastOpeningPipe(String line) {
     var index = 0;
     while (index < line.length) {
       final ch = line.codeUnitAt(index);
       if (ch == $pipe) {
         index++;
         index = _walkPastWhitespace(line, index);
       }
       if (ch != $space && ch != $tab) {
         // No leading pipe.
         break;
       }
       index++;
     }
     return index;
   }
 }
	// Copyright (c) 2022, the Dart project authors. Please see the AUTHORS file
	// for details. All rights reserved. Use of this source code is governed by a
	// BSD-style license that can be found in the LICENSE file.

	import '../ast.dart';
	import '../block_parser.dart';
	import '../charcode.dart';
	import '../patterns.dart';
	import 'block_syntax.dart';

	/// Parses tables.
	class TableSyntax extends BlockSyntax {
	@override
	bool canEndBlock(BlockParser parser) => false;

	@override
	RegExp get pattern => dummyPattern;

	const TableSyntax();

	@override
	bool canParse(BlockParser parser) {
	// Note: matches next line, not the current one. We're looking for the
	// bar separating the head row from the body rows.
	return parser.matchesNext(tablePattern);
	}

	/// Parses a table into its three parts:
	///
	/// * a head row of head cells (`<th>` cells)
	/// * a divider of hyphens and pipes (not rendered)
	/// * many body rows of body cells (`<td>` cells)
	@override
	Node? parse(BlockParser parser) {
	final alignments = _parseAlignments(parser.next!);
	final columnCount = alignments.length;
	final headRow = _parseRow(parser, alignments, 'th');
	if (headRow.children!.length != columnCount) {
	parser.retreat();
	return null;
	}
	final head = Element('thead', [headRow]);

	// Advance past the divider of hyphens.
	parser.advance();

	final rows = <Element>[];
	while (!parser.isDone && !BlockSyntax.isAtBlockEnd(parser)) {
	final row = _parseRow(parser, alignments, 'td');
	final children = row.children;
	if (children != null) {
	while (children.length < columnCount) {
	// Insert synthetic empty cells.
	children.add(Element('td', const []));
	}
	while (children.length > columnCount) {
	children.removeLast();
	}
	}
	while (row.children!.length > columnCount) {
	row.children!.removeLast();
	}
	rows.add(row);
	}
	if (rows.isEmpty) {
	return Element('table', [head]);
	} else {
	final body = Element('tbody', rows);

	return Element('table', [head, body]);
	}
	}

	List<String?> _parseAlignments(String line) {
	final columns = <String?>[];
	// Set the value to `true` when hitting a non whitespace character other
	// than the first pipe character.
	var started = false;
	var hitDash = false;
	String? alignment;

	for (var i = 0; i < line.length; i++) {
	final char = line.codeUnitAt(i);
	if (char == $space \|\| char == $tab \|\| (!started && char == $pipe)) {
	continue;
	}
	started = true;

	if (char == $colon) {
	if (hitDash) {
	alignment = alignment == 'left' ? 'center' : 'right';
	} else {
	alignment = 'left';
	}
	}

	if (char == $pipe) {
	columns.add(alignment);
	hitDash = false;
	alignment = null;
	} else {
	hitDash = true;
	}
	}

	if (hitDash) {
	columns.add(alignment);
	}

	return columns;
	}

	/// Parses a table row at the current line into a table row element, with
	/// parsed table cells.
	///
	/// [alignments] is used to annotate an alignment on each cell, and
	/// [cellType] is used to declare either "td" or "th" cells.
	Element _parseRow(
	BlockParser parser,
	List<String?> alignments,
	String cellType,
	) {
	final line = parser.current;
	final cells = <String>[];
	var index = _walkPastOpeningPipe(line);
	final cellBuffer = StringBuffer();

	while (true) {
	if (index >= line.length) {
	// This row ended without a trailing pipe, which is fine.
	cells.add(cellBuffer.toString().trimRight());
	cellBuffer.clear();
	break;
	}
	final ch = line.codeUnitAt(index);
	if (ch == $backslash) {
	if (index == line.length - 1) {
	// A table row ending in a backslash is not well-specified, but it
	// looks like GitHub just allows the character as part of the text of
	// the last cell.
	cellBuffer.writeCharCode(ch);
	cells.add(cellBuffer.toString().trimRight());
	cellBuffer.clear();
	break;
	}
	final escaped = line.codeUnitAt(index + 1);
	if (escaped == $pipe) {
	// GitHub Flavored Markdown has a strange bit here; the pipe is to be
	// escaped before any other inline processing. One consequence, for
	// example, is that "\| `\\|` \|" should be parsed as a cell with a code
	// element with text "\|", rather than "\\|". Most parsers are not
	// compliant with this corner, but this is what is specified, and what
	// GitHub does in practice.
	cellBuffer.writeCharCode(escaped);
	} else {
	// The [InlineParser] will handle the escaping.
	cellBuffer.writeCharCode(ch);
	cellBuffer.writeCharCode(escaped);
	}
	index += 2;
	} else if (ch == $pipe) {
	cells.add(cellBuffer.toString().trimRight());
	cellBuffer.clear();
	// Walk forward past any whitespace which leads the next cell.
	index++;
	index = _walkPastWhitespace(line, index);
	if (index >= line.length) {
	// This row ended with a trailing pipe.
	break;
	}
	} else {
	cellBuffer.writeCharCode(ch);
	index++;
	}
	}
	parser.advance();
	final row = [
	for (final cell in cells) Element(cellType, [UnparsedContent(cell)])
	];

	for (var i = 0; i < row.length && i < alignments.length; i++) {
	if (alignments[i] == null) continue;
	row[i].attributes['align'] = '${alignments[i]}';
	}

	return Element('tr', row);
	}

	/// Walks past whitespace in [line] starting at [index].
	///
	/// Returns the index of the first non-whitespace character.
	int _walkPastWhitespace(String line, int index) {
	while (index < line.length) {
	final ch = line.codeUnitAt(index);
	if (ch != $space && ch != $tab) {
	break;
	}
	index++;
	}
	return index;
	}

	/// Walks past the opening pipe (and any whitespace that surrounds it) in
	/// [line].
	///
	/// Returns the index of the first non-whitespace character after the pipe.
	/// If no opening pipe is found, this just returns the index of the first
	/// non-whitespace character.
	int _walkPastOpeningPipe(String line) {
	var index = 0;
	while (index < line.length) {
	final ch = line.codeUnitAt(index);
	if (ch == $pipe) {
	index++;
	index = _walkPastWhitespace(line, index);
	}
	if (ch != $space && ch != $tab) {
	// No leading pipe.
	break;
	}
	index++;
	}
	return index;
	}
	}