blob: be9ee86cc75697b6220144cfee9de511dd9918bb [file] [log] [blame]
// Copyright (c) 2012, the Dart project authors. Please see the AUTHORS file
// for details. All rights reserved. Use of this source code is governed by a
// BSD-style license that can be found in the LICENSE file.
part of dart.async;
abstract class _StringDecoder extends _StreamTransformer<List<int>, String> {
handleData(List<int> bytes, StreamSink<String> sink) {
var data = _carry;
data.addAll(bytes);
_carry = [];
var buffer = new StringBuffer();
int pos = 0;
while (pos < data.length) {
int currentPos = pos;
int getNext() {
if (pos < data.length) {
return data[pos++];
}
return -1;
}
_chars = [];
if (_processByte(data[pos++], getNext)) {
_chars.forEach(buffer.addCharCode);
} else {
_carry = data.getRange(currentPos, data.length - currentPos);
break;
}
}
sink.add(buffer.toString());
}
void handleDone(StreamSink<String> sink) {
if (!_carry.isEmpty) {
sink.signalError(new AsyncError(
new StateError("Unhandled tailing utf8 chars")));
}
sink.close();
}
bool _processByte(int byte, int getNext());
void addChar(int char) {
_chars.add(char);
}
List<int> _carry = [];
List<int> _chars;
}
/**
* StringTransformer class that decodes a utf8 encoded bytes.
*/
class Utf8DecoderTransformer extends _StringDecoder {
bool _processByte(int byte, int getNext()) {
int value = byte & 0xFF;
if ((value & 0x80) == 0x80) {
int additionalBytes;
if ((value & 0xe0) == 0xc0) { // 110xxxxx
value = value & 0x1F;
additionalBytes = 1;
} else if ((value & 0xf0) == 0xe0) { // 1110xxxx
value = value & 0x0F;
additionalBytes = 2;
} else { // 11110xxx
value = value & 0x07;
additionalBytes = 3;
}
for (int i = 0; i < additionalBytes; i++) {
int next = getNext();
if (next < 0) return false;
value = value << 6 | (next & 0x3F);
}
}
addChar(value);
return true;
}
}
abstract class _StringEncoder extends _StreamTransformer<String, List<int>> {
handleData(String string, StreamSink<List<int>> sink) {
sink.add(_processString(string));
}
List<int> _processString(String string);
}
/**
* StringTransformer class that utf8 encodes a string.
*/
class Utf8EncoderTransformer extends _StringEncoder {
List<int> _processString(String string) {
var bytes = [];
int pos = 0;
int length = string.length;
for (int i = 0; i < length; i++) {
int additionalBytes;
int charCode = string.charCodeAt(i);
if (charCode <= 0x007F) {
additionalBytes = 0;
bytes.add(charCode);
} else if (charCode <= 0x07FF) {
// 110xxxxx (xxxxx is top 5 bits).
bytes.add(((charCode >> 6) & 0x1F) | 0xC0);
additionalBytes = 1;
} else if (charCode <= 0xFFFF) {
// 1110xxxx (xxxx is top 4 bits)
bytes.add(((charCode >> 12) & 0x0F)| 0xE0);
additionalBytes = 2;
} else {
// 11110xxx (xxx is top 3 bits)
bytes.add(((charCode >> 18) & 0x07) | 0xF0);
additionalBytes = 3;
}
for (int i = additionalBytes; i > 0; i--) {
// 10xxxxxx (xxxxxx is next 6 bits from the top).
bytes.add(((charCode >> (6 * (i - 1))) & 0x3F) | 0x80);
}
pos += additionalBytes + 1;
}
return bytes;
}
}