blob: c23665faa5a644c8a2331a288848401f441a7a4b [file] [log] [blame]
// Copyright (c) 2012, the Dart project authors. Please see the AUTHORS file
// for details. All rights reserved. Use of this source code is governed by a
// BSD-style license that can be found in the LICENSE file.
library utf.unicode_core_test;
import 'package:test/test.dart';
import 'package:utf/utf.dart';
import 'package:utf/src/util.dart';
import 'expect.dart' as expect;
void main() {
test('codepoints to utf16 codepoints', testCodepointsToUtf16CodeUnits);
test('utf16 bytes to codepoints', testUtf16bytesToCodepoints);
}
void testCodepointsToUtf16CodeUnits() {
// boundary conditions
expect.listEquals([], codepointsToUtf16CodeUnits([]), "no input");
expect.listEquals([0x0], codepointsToUtf16CodeUnits([0x0]), "0");
expect.listEquals(
[0xd800, 0xdc00], codepointsToUtf16CodeUnits([0x10000]), "10000");
expect.listEquals([0xffff], codepointsToUtf16CodeUnits([0xffff]), "ffff");
expect.listEquals(
[0xdbff, 0xdfff], codepointsToUtf16CodeUnits([0x10ffff]), "10ffff");
expect.listEquals([0xd7ff], codepointsToUtf16CodeUnits([0xd7ff]), "d7ff");
expect.listEquals([0xe000], codepointsToUtf16CodeUnits([0xe000]), "e000");
expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_CODEPOINT],
codepointsToUtf16CodeUnits([0xd800]), "d800");
expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_CODEPOINT],
codepointsToUtf16CodeUnits([0xdfff]), "dfff");
}
void testUtf16bytesToCodepoints() {
// boundary conditions: First possible values
expect.listEquals([], utf16CodeUnitsToCodepoints([]), "no input");
expect.listEquals([0x0], utf16CodeUnitsToCodepoints([0x0]), "0");
expect.listEquals(
[0x10000], utf16CodeUnitsToCodepoints([0xd800, 0xdc00]), "10000");
// boundary conditions: Last possible sequence of a certain length
expect.listEquals([0xffff], utf16CodeUnitsToCodepoints([0xffff]), "ffff");
expect.listEquals(
[0x10ffff], utf16CodeUnitsToCodepoints([0xdbff, 0xdfff]), "10ffff");
// other boundary conditions
expect.listEquals([0xd7ff], utf16CodeUnitsToCodepoints([0xd7ff]), "d7ff");
expect.listEquals([0xe000], utf16CodeUnitsToCodepoints([0xe000]), "e000");
// unexpected continuation bytes
expect.listEquals([0xfffd], utf16CodeUnitsToCodepoints([0xdc00]),
"dc00 first unexpected continuation byte");
expect.listEquals([0xfffd], utf16CodeUnitsToCodepoints([0xdfff]),
"dfff last unexpected continuation byte");
expect.listEquals([0xfffd], utf16CodeUnitsToCodepoints([0xdc00]),
"1 unexpected continuation bytes");
expect.listEquals(
[0xfffd, 0xfffd],
utf16CodeUnitsToCodepoints([0xdc00, 0xdc00]),
"2 unexpected continuation bytes");
expect.listEquals(
[0xfffd, 0xfffd, 0xfffd],
utf16CodeUnitsToCodepoints([0xdc00, 0xdc00, 0xdc00]),
"3 unexpected continuation bytes");
// incomplete sequences
expect.listEquals(
[0xfffd], utf16CodeUnitsToCodepoints([0xd800]), "d800 last byte missing");
expect.listEquals(
[0xfffd], utf16CodeUnitsToCodepoints([0xdbff]), "dbff last byte missing");
// concatenation of incomplete sequences
expect.listEquals(
[0xfffd, 0xfffd],
utf16CodeUnitsToCodepoints([0xd800, 0xdbff]),
"d800 dbff last byte missing");
// impossible bytes
expect.listEquals(
[0xfffd], utf16CodeUnitsToCodepoints([0x110000]), "110000 out of bounds");
// overlong sequences not possible in utf16 (nothing < x10000)
// illegal code positions d800-dfff not encodable (< x10000)
}