dart-sdk/sdk/lib/convert/utf.dart

// Copyright (c) 2013, the Dart project authors.  Please see the AUTHORS file
// for details. All rights reserved. Use of this source code is governed by a
// BSD-style license that can be found in the LICENSE file.

// @dart = 2.6

part of dart.convert;

/// The Unicode Replacement character `U+FFFD` (<28>).
const int unicodeReplacementCharacterRune = 0xFFFD;

/// The Unicode Byte Order Marker (BOM) character `U+FEFF`.
const int unicodeBomCharacterRune = 0xFEFF;

/// An instance of the default implementation of the [Utf8Codec].
///
/// This instance provides a convenient access to the most common UTF-8
/// use cases.
///
/// Examples:
///
///     var encoded = utf8.encode("Îñţérñåţîöñåļîžåţîờñ");
///     var decoded = utf8.decode([0x62, 0x6c, 0xc3, 0xa5, 0x62, 0xc3, 0xa6,
///                                0x72, 0x67, 0x72, 0xc3, 0xb8, 0x64]);
const Utf8Codec utf8 = Utf8Codec();

/// A [Utf8Codec] encodes strings to utf-8 code units (bytes) and decodes
/// UTF-8 code units to strings.
class Utf8Codec extends Encoding {
  final bool _allowMalformed;

  /// Instantiates a new [Utf8Codec].
  ///
  /// The optional [allowMalformed] argument defines how [decoder] (and [decode])
  /// deal with invalid or unterminated character sequences.
  ///
  /// If it is `true` (and not overridden at the method invocation) [decode] and
  /// the [decoder] replace invalid (or unterminated) octet
  /// sequences with the Unicode Replacement character `U+FFFD` (<28>). Otherwise
  /// they throw a [FormatException].
  const Utf8Codec({bool allowMalformed = false})
      : _allowMalformed = allowMalformed;

  /// The name of this codec, "utf-8".
  String get name => "utf-8";

  /// Decodes the UTF-8 [codeUnits] (a list of unsigned 8-bit integers) to the
  /// corresponding string.
  ///
  /// If the [codeUnits] start with the encoding of a
  /// [unicodeBomCharacterRune], that character is discarded.
  ///
  /// If [allowMalformed] is `true` the decoder replaces invalid (or
  /// unterminated) character sequences with the Unicode Replacement character
  /// `U+FFFD` (<28>). Otherwise it throws a [FormatException].
  ///
  /// If [allowMalformed] is not given, it defaults to the `allowMalformed` that
  /// was used to instantiate `this`.
  String decode(List<int> codeUnits, {bool allowMalformed}) {
    allowMalformed ??= _allowMalformed;
    return Utf8Decoder(allowMalformed: allowMalformed).convert(codeUnits);
  }

  Utf8Encoder get encoder => const Utf8Encoder();
  Utf8Decoder get decoder {
    return Utf8Decoder(allowMalformed: _allowMalformed);
  }
}

/// A converter from strings to their UTF-8 code units (a list of unsigned
/// 8-bit integers).
class Utf8Encoder extends Converter<String, List<int>> {
  const Utf8Encoder();

  /// Encodes [string] as UTF-8 and returns the resulting bytes.
  ///
  /// If [start] and [end] are provided, only the substring
  /// `string.substring(start, end)` is converted.
  ///
  /// A lead surrogate that ends the converted range is encoded on its own
  /// as a three byte sequence.
  Uint8List convert(String string, [int start = 0, int end]) {
    end = RangeError.checkValidRange(start, end, string.length);
    if (end == start) return Uint8List(0);

    // Size the buffer for the worst case: a lone code unit takes at most
    // three bytes, and a surrogate pair takes four bytes for two code units.
    var worstCaseSize = (end - start) * 3;
    var encoder = _Utf8Encoder.withBufferSize(worstCaseSize);
    var stoppedAt = encoder._fillBuffer(string, start, end);
    assert(stoppedAt >= end - 1);
    if (stoppedAt != end) {
      // The fill loop leaves a trailing lead surrogate to its caller, so the
      // only code unit that can remain is a lead surrogate in last position.
      var trailingUnit = string.codeUnitAt(end - 1);
      assert(_isLeadSurrogate(trailingUnit));
      // Passing a non-surrogate as the next unit makes _writeSurrogate emit
      // the lead surrogate by itself.
      var paired = encoder._writeSurrogate(trailingUnit, 0);
      assert(!paired);
    }
    return encoder._buffer.sublist(0, encoder._bufferIndex);
  }

  /// Starts a chunked conversion.
  ///
  /// The converter works more efficiently if the given [sink] is a
  /// [ByteConversionSink]; any other sink is adapted with
  /// [ByteConversionSink.from].
  StringConversionSink startChunkedConversion(Sink<List<int>> sink) {
    ByteConversionSink byteSink;
    if (sink is ByteConversionSink) {
      byteSink = sink;
    } else {
      byteSink = ByteConversionSink.from(sink);
    }
    return _Utf8EncoderSink(byteSink);
  }

  // Overrides the base class's bind only to provide a more precise type.
  Stream<List<int>> bind(Stream<String> stream) {
    return super.bind(stream);
  }
}

/// Encodes strings into UTF-8 code units (unsigned 8-bit integers), writing
/// them into a fixed-size byte buffer.
// TODO(floitsch): make this class public.
class _Utf8Encoder {
  /// A lead surrogate held back between chunks, or 0 when there is none.
  int _carry = 0;

  /// Index in [_buffer] of the next byte to be written.
  int _bufferIndex = 0;

  /// Destination of the encoded bytes.
  final Uint8List _buffer;

  static const _DEFAULT_BYTE_BUFFER_SIZE = 1024;

  _Utf8Encoder() : this.withBufferSize(_DEFAULT_BYTE_BUFFER_SIZE);

  _Utf8Encoder.withBufferSize(int bufferSize)
      : _buffer = _createBuffer(bufferSize);

  /// Allow an implementation to pick the most efficient way of storing bytes.
  static Uint8List _createBuffer(int size) => Uint8List(size);

  /// Writes [leadingSurrogate] to [_buffer], merged with [nextCodeUnit] when
  /// the latter is a tail surrogate.
  ///
  /// Returns `true` if [nextCodeUnit] was consumed as the second half of a
  /// surrogate pair (four bytes written). Returns `false` if it was not a
  /// tail surrogate; in that case only the lead surrogate is written (three
  /// bytes) and [nextCodeUnit] has not been written.
  ///
  /// It is safe to pass 0 for [nextCodeUnit] to write just the lead
  /// surrogate. No bounds check is made here; callers ensure there is room.
  bool _writeSurrogate(int leadingSurrogate, int nextCodeUnit) {
    if (!_isTailSurrogate(nextCodeUnit)) {
      // TODO(floitsch): allow to throw on malformed strings.
      // An unpaired surrogate is encoded directly as a three byte sequence.
      // The result is invalid UTF-8, but the input was invalid UTF-16.
      _buffer[_bufferIndex++] = 0xE0 | (leadingSurrogate >> 12);
      _buffer[_bufferIndex++] = 0x80 | ((leadingSurrogate >> 6) & 0x3f);
      _buffer[_bufferIndex++] = 0x80 | (leadingSurrogate & 0x3f);
      return false;
    }

    var rune = _combineSurrogatePair(leadingSurrogate, nextCodeUnit);
    // A rune that takes two UTF-16 code units always takes four UTF-8 bytes.
    assert(rune > _THREE_BYTE_LIMIT);
    assert(rune <= _FOUR_BYTE_LIMIT);
    _buffer[_bufferIndex++] = 0xF0 | (rune >> 18);
    _buffer[_bufferIndex++] = 0x80 | ((rune >> 12) & 0x3f);
    _buffer[_bufferIndex++] = 0x80 | ((rune >> 6) & 0x3f);
    _buffer[_bufferIndex++] = 0x80 | (rune & 0x3f);
    return true;
  }

  /// Encodes code units of [str] from [start] towards [end] into [_buffer]
  /// until the range is exhausted or the next character no longer fits.
  ///
  /// A lead surrogate in the last position of the range is never encoded
  /// here; the caller is responsible for it.
  ///
  /// Returns the index of the first code unit that has not been encoded.
  int _fillBuffer(String str, int start, int end) {
    // Exclude a trailing lead surrogate from the range handled by the loop.
    var limit = end;
    if (start != end && _isLeadSurrogate(str.codeUnitAt(end - 1))) {
      limit = end - 1;
    }

    var capacity = _buffer.length;
    var position = start;
    while (position < limit) {
      var codeUnit = str.codeUnitAt(position);
      if (codeUnit <= _ONE_BYTE_LIMIT) {
        // ASCII has the same representation in UTF-8 and UTF-16.
        if (_bufferIndex >= capacity) break;
        _buffer[_bufferIndex++] = codeUnit;
      } else if (codeUnit <= _TWO_BYTE_LIMIT) {
        if (_bufferIndex + 1 >= capacity) break;
        _buffer[_bufferIndex++] = 0xC0 | (codeUnit >> 6);
        _buffer[_bufferIndex++] = 0x80 | (codeUnit & 0x3f);
      } else if (_isLeadSurrogate(codeUnit)) {
        // Reserve room for the four bytes of a combined pair.
        if (_bufferIndex + 3 >= capacity) break;
        // Reading the following code unit is safe: a lead surrogate in the
        // last position was excluded from the range above.
        var following = str.codeUnitAt(position + 1);
        var consumedFollowing = _writeSurrogate(codeUnit, following);
        if (consumedFollowing) position++;
      } else {
        assert(codeUnit <= _THREE_BYTE_LIMIT);
        if (_bufferIndex + 2 >= capacity) break;
        _buffer[_bufferIndex++] = 0xE0 | (codeUnit >> 12);
        _buffer[_bufferIndex++] = 0x80 | ((codeUnit >> 6) & 0x3f);
        _buffer[_bufferIndex++] = 0x80 | (codeUnit & 0x3f);
      }
      position++;
    }
    return position;
  }
}

/// This class encodes chunked strings to UTF-8 code units (unsigned 8-bit
/// integers).
///
/// Each slice is encoded into the inherited byte buffer and forwarded to
/// [_sink]. A lead surrogate at the very end of a slice may be held in
/// `_carry` so that it can be combined with the first code unit of the next
/// slice.
class _Utf8EncoderSink extends _Utf8Encoder with StringConversionSinkMixin {
  /// The sink that receives the encoded bytes.
  final ByteConversionSink _sink;

  _Utf8EncoderSink(this._sink);

  /// Flushes a pending lead surrogate, if any, and closes [_sink].
  void close() {
    if (_carry != 0) {
      // addSlice will call close again, but then the carry must be equal to 0.
      addSlice("", 0, 0, true);
      return;
    }
    _sink.close();
  }

  /// Encodes the code units of [str] from [start] to [end] and passes the
  /// bytes on to [_sink], one buffer-full at a time.
  ///
  /// If [isLast] is `true`, [close] is called once the slice has been
  /// forwarded.
  void addSlice(String str, int start, int end, bool isLast) {
    // Each call starts writing at the beginning of the buffer.
    _bufferIndex = 0;

    // An empty slice has nothing to encode unless it also ends the input.
    if (start == end && !isLast) {
      return;
    }

    if (_carry != 0) {
      // A lead surrogate was held back by an earlier call. Try to pair it
      // with the first code unit of this slice; 0 is used when the slice is
      // empty so that the surrogate is written on its own.
      var nextCodeUnit = 0;
      if (start != end) {
        nextCodeUnit = str.codeUnitAt(start);
      } else {
        assert(isLast);
      }
      var wasCombined = _writeSurrogate(_carry, nextCodeUnit);
      // Either we got a non-empty string, or we must not have been combined.
      assert(!wasCombined || start != end);
      if (wasCombined) start++;
      _carry = 0;
    }
    do {
      // Encode as much as fits; `start` advances to the first code unit that
      // was not encoded.
      start = _fillBuffer(str, start, end);
      var isLastSlice = isLast && (start == end);
      // _fillBuffer never encodes a lead surrogate in the last position of
      // the slice, so it is handled here.
      if (start == end - 1 && _isLeadSurrogate(str.codeUnitAt(start))) {
        if (isLast && _bufferIndex < _buffer.length - 3) {
          // There is still space for the last incomplete surrogate.
          // We use a non-surrogate as second argument. This way the
          // function will just add the surrogate-half to the buffer.
          var hasBeenCombined = _writeSurrogate(str.codeUnitAt(start), 0);
          assert(!hasBeenCombined);
        } else {
          // Otherwise store it in the carry. If isLast is true, then
          // close will flush the last carry.
          _carry = str.codeUnitAt(start);
        }
        start++;
      }
      // Hand the encoded bytes to the sink and reuse the buffer from the
      // start for the next round.
      _sink.addSlice(_buffer, 0, _bufferIndex, isLastSlice);
      _bufferIndex = 0;
    } while (start < end);
    if (isLast) close();
  }

  // TODO(floitsch): implement asUtf8Sink. Slightly complicated because it
  // needs to deal with malformed input.
}

/// This class converts UTF-8 code units (lists of unsigned 8-bit integers)
/// to a string.
class Utf8Decoder extends Converter<List<int>, String> {
  final bool _allowMalformed;

  /// Instantiates a new [Utf8Decoder].
  ///
  /// The optional [allowMalformed] argument defines how [convert] deals
  /// with invalid or unterminated character sequences.
  ///
  /// If it is `true` [convert] replaces invalid (or unterminated) character
  /// sequences with the Unicode Replacement character `U+FFFD` (<28>). Otherwise
  /// it throws a [FormatException].
  const Utf8Decoder({bool allowMalformed = false})
      : _allowMalformed = allowMalformed;

  /// Converts the UTF-8 [codeUnits] (a list of unsigned 8-bit integers) to the
  /// corresponding string.
  ///
  /// Uses the code units from [start] to, but no including, [end].
  /// If [end] is omitted, it defaults to `codeUnits.length`.
  ///
  /// If the [codeUnits] start with the encoding of a
  /// [unicodeBomCharacterRune], that character is discarded.
  String convert(List<int> codeUnits, [int start = 0, int end]) {
    // Allow the implementation to intercept and specialize based on the type
    // of codeUnits.
    var result = _convertIntercepted(_allowMalformed, codeUnits, start, end);
    if (result != null) {
      return result;
    }

    var length = codeUnits.length;
    end = RangeError.checkValidRange(start, end, length);

    // Fast case for ASCII strings avoids StringBuffer/_Utf8Decoder.
    int oneBytes = _scanOneByteCharacters(codeUnits, start, end);
    StringBuffer buffer;
    bool isFirstCharacter = true;
    if (oneBytes > 0) {
      var firstPart = String.fromCharCodes(codeUnits, start, start + oneBytes);
      start += oneBytes;
      if (start == end) {
        return firstPart;
      }
      buffer = StringBuffer(firstPart);
      isFirstCharacter = false;
    }

    buffer ??= StringBuffer();
    var decoder = _Utf8Decoder(buffer, _allowMalformed);
    decoder._isFirstCharacter = isFirstCharacter;
    decoder.convert(codeUnits, start, end);
    decoder.flush(codeUnits, end);
    return buffer.toString();
  }

  /// Starts a chunked conversion.
  ///
  /// The converter works more efficiently if the given [sink] is a
  /// [StringConversionSink].
  ByteConversionSink startChunkedConversion(Sink<String> sink) {
    StringConversionSink stringSink;
    if (sink is StringConversionSink) {
      stringSink = sink;
    } else {
      stringSink = StringConversionSink.from(sink);
    }
    return stringSink.asUtf8Sink(_allowMalformed);
  }

  // Override the base-classes bind, to provide a better type.
  Stream<String> bind(Stream<List<int>> stream) => super.bind(stream);

  external Converter<List<int>, T> fuse<T>(Converter<String, T> next);

  external static String _convertIntercepted(
      bool allowMalformed, List<int> codeUnits, int start, int end);
}

// UTF-8 constants: the largest value that fits in an encoding of one, two,
// three and four bytes respectively.
const int _ONE_BYTE_LIMIT = 0x7f; // 7 bits
const int _TWO_BYTE_LIMIT = 0x7ff; // 11 bits
const int _THREE_BYTE_LIMIT = 0xffff; // 16 bits
const int _FOUR_BYTE_LIMIT = 0x10ffff; // 21 bits, truncated to Unicode max.

// UTF-16 constants.
// The top six bits of a code unit tell lead and tail surrogates apart; the
// low ten bits carry the payload.
const int _SURROGATE_TAG_MASK = 0xFC00;
const int _SURROGATE_VALUE_MASK = 0x3FF;
const int _LEAD_SURROGATE_MIN = 0xD800;
const int _TAIL_SURROGATE_MIN = 0xDC00;

/// Whether [codeUnit] is a UTF-16 lead surrogate (`0xD800` to `0xDBFF`).
bool _isLeadSurrogate(int codeUnit) {
  var tag = codeUnit & _SURROGATE_TAG_MASK;
  return tag == _LEAD_SURROGATE_MIN;
}

/// Whether [codeUnit] is a UTF-16 tail surrogate (`0xDC00` to `0xDFFF`).
bool _isTailSurrogate(int codeUnit) {
  var tag = codeUnit & _SURROGATE_TAG_MASK;
  return tag == _TAIL_SURROGATE_MIN;
}

/// Combines the surrogate pair [lead] and [tail] into the code point it
/// represents.
int _combineSurrogatePair(int lead, int tail) {
  var highBits = (lead & _SURROGATE_VALUE_MASK) << 10;
  var lowBits = tail & _SURROGATE_VALUE_MASK;
  return (0x10000 + highBits) | lowBits;
}

/// Decodes UTF-8.
///
/// The decoder handles chunked input: the state of a multi-byte sequence
/// that is cut off at the end of one [convert] call is kept in fields and
/// picked up again by the next call. Decoded text is written to the
/// [StringSink] given to the constructor.
// TODO(floitsch): make this class public.
class _Utf8Decoder {
  /// Whether malformed input is replaced with
  /// [unicodeReplacementCharacterRune] instead of causing a
  /// [FormatException].
  final bool _allowMalformed;

  /// Receives the decoded characters.
  final StringSink _stringSink;

  /// Whether the next decoded character would be the first one; a BOM is
  /// only dropped while this is `true`.
  bool _isFirstCharacter = true;

  /// Bits accumulated so far for a multi-byte sequence that spans chunks.
  int _value = 0;

  /// Number of continuation bytes still missing from the pending sequence.
  int _expectedUnits = 0;

  /// Total number of continuation bytes of the pending sequence.
  int _extraUnits = 0;

  _Utf8Decoder(this._stringSink, this._allowMalformed);

  /// Whether a multi-byte sequence has been started but not yet completed.
  bool get hasPartialInput => _expectedUnits > 0;

  // Limits of one through four byte encodings.
  static const List<int> _LIMITS = <int>[
    _ONE_BYTE_LIMIT,
    _TWO_BYTE_LIMIT,
    _THREE_BYTE_LIMIT,
    _FOUR_BYTE_LIMIT
  ];

  /// Closes the decoder by flushing it without position information.
  void close() {
    flush();
  }

  /// Flushes this decoder as if closed.
  ///
  /// This method throws if the input was partial and the decoder was
  /// constructed with `allowMalformed` set to `false`. Otherwise a pending
  /// partial sequence is replaced by a single
  /// [unicodeReplacementCharacterRune] and the pending state is cleared.
  ///
  /// The [source] and [offset] of the current position may be provided,
  /// and are included in the exception if one is thrown.
  void flush([List<int> source, int offset]) {
    if (hasPartialInput) {
      if (!_allowMalformed) {
        throw FormatException(
            "Unfinished UTF-8 octet sequence", source, offset);
      }
      _stringSink.writeCharCode(unicodeReplacementCharacterRune);
      _value = 0;
      _expectedUnits = 0;
      _extraUnits = 0;
    }
  }

  /// Decodes [codeUnits] from [startIndex] up to, but not including,
  /// [endIndex] and writes the result to the string sink.
  ///
  /// A multi-byte sequence left unfinished by a previous call is continued
  /// first. A sequence that is still unfinished when [endIndex] is reached
  /// is stored for the next call or for [flush].
  ///
  /// Throws a [FormatException] on malformed input unless the decoder was
  /// created with `allowMalformed` set to `true`, in which case
  /// [unicodeReplacementCharacterRune] is written instead.
  void convert(List<int> codeUnits, int startIndex, int endIndex) {
    // Work on local copies of the pending state and clear the fields; they
    // are written back at the end only if a sequence is still unfinished.
    var value = _value;
    var expectedUnits = _expectedUnits;
    var extraUnits = _extraUnits;
    _value = 0;
    _expectedUnits = 0;
    _extraUnits = 0;

    var i = startIndex;
    loop:
    while (true) {
      // Phase 1: consume the continuation bytes of a started sequence.
      multibyte:
      if (expectedUnits > 0) {
        do {
          if (i == endIndex) {
            // Out of input in the middle of a sequence: keep the state.
            break loop;
          }
          var unit = codeUnits[i];
          if ((unit & 0xC0) != 0x80) {
            // Not a continuation byte (10xxxxxx). The sequence is abandoned
            // and `i` is not advanced, so the unit is examined again by the
            // scan loop below.
            expectedUnits = 0;
            if (!_allowMalformed) {
              throw FormatException(
                  "Bad UTF-8 encoding 0x${unit.toRadixString(16)}",
                  codeUnits,
                  i);
            }
            _isFirstCharacter = false;
            _stringSink.writeCharCode(unicodeReplacementCharacterRune);
            break multibyte;
          } else {
            // Append the six payload bits of the continuation byte.
            value = (value << 6) | (unit & 0x3f);
            expectedUnits--;
            i++;
          }
        } while (expectedUnits > 0);
        // The value must exceed the limit of the next shorter encoding.
        if (value <= _LIMITS[extraUnits - 1]) {
          // Overly long encoding. The value could be encoded with a shorter
          // encoding.
          if (!_allowMalformed) {
            throw FormatException(
                "Overlong encoding of 0x${value.toRadixString(16)}",
                codeUnits,
                i - extraUnits - 1);
          }
          expectedUnits = extraUnits = 0;
          value = unicodeReplacementCharacterRune;
        }
        if (value > _FOUR_BYTE_LIMIT) {
          if (!_allowMalformed) {
            throw FormatException(
                "Character outside valid Unicode range: "
                "0x${value.toRadixString(16)}",
                codeUnits,
                i - extraUnits - 1);
          }
          value = unicodeReplacementCharacterRune;
        }
        // A BOM is dropped only when it is the very first character.
        if (!_isFirstCharacter || value != unicodeBomCharacterRune) {
          _stringSink.writeCharCode(value);
        }
        _isFirstCharacter = false;
      }

      // Phase 2: scan for the next lead byte, copying ASCII runs in bulk.
      while (i < endIndex) {
        var oneBytes = _scanOneByteCharacters(codeUnits, i, endIndex);
        if (oneBytes > 0) {
          _isFirstCharacter = false;
          assert(i + oneBytes <= endIndex);
          _stringSink.write(String.fromCharCodes(codeUnits, i, i + oneBytes));

          i += oneBytes;
          if (i == endIndex) break;
        }
        var unit = codeUnits[i++];
        // TODO(floitsch): the way we test we could potentially allow
        // units that are too large, if they happen to have the
        // right bit-pattern. (Same is true for the multibyte loop above).
        // TODO(floitsch): optimize this loop. See:
        // https://codereview.chromium.org/22929022/diff/1/sdk/lib/convert/utf.dart?column_width=80
        if (unit < 0) {
          // TODO(floitsch): should this be unit <= 0 ?
          if (!_allowMalformed) {
            throw FormatException(
                "Negative UTF-8 code unit: -0x${(-unit).toRadixString(16)}",
                codeUnits,
                i - 1);
          }
          // NOTE(review): unlike the other replacement paths, this branch
          // leaves `_isFirstCharacter` untouched - confirm whether a BOM
          // that follows a negative unit is meant to be dropped.
          _stringSink.writeCharCode(unicodeReplacementCharacterRune);
        } else {
          assert(unit > _ONE_BYTE_LIMIT);
          // 110xxxxx: lead byte of a two byte sequence.
          if ((unit & 0xE0) == 0xC0) {
            value = unit & 0x1F;
            expectedUnits = extraUnits = 1;
            continue loop;
          }
          // 1110xxxx: lead byte of a three byte sequence.
          if ((unit & 0xF0) == 0xE0) {
            value = unit & 0x0F;
            expectedUnits = extraUnits = 2;
            continue loop;
          }
          // 11110xxx: lead byte of a four byte sequence.
          // 0xF5, 0xF6 ... 0xFF never appear in valid UTF-8 sequences.
          if ((unit & 0xF8) == 0xF0 && unit < 0xF5) {
            value = unit & 0x07;
            expectedUnits = extraUnits = 3;
            continue loop;
          }
          // Anything else cannot start a sequence.
          if (!_allowMalformed) {
            throw FormatException(
                "Bad UTF-8 encoding 0x${unit.toRadixString(16)}",
                codeUnits,
                i - 1);
          }
          value = unicodeReplacementCharacterRune;
          expectedUnits = extraUnits = 0;
          _isFirstCharacter = false;
          _stringSink.writeCharCode(value);
        }
      }
      break loop;
    }
    // Remember an unfinished sequence for the next chunk (or for flush).
    if (expectedUnits > 0) {
      _value = value;
      _expectedUnits = expectedUnits;
      _extraUnits = extraUnits;
    }
  }
}

// Returns the number of bytes in [units] starting at offset [from] which have
// the leftmost bit set to 0.
//
// Callers in this file treat the result as the length of a run of one-byte
// (ASCII) characters beginning at [from], and expect `from + result` not to
// exceed [endIndex].
//
// To increase performance of this critical method we have a special variant of
// it implemented in the VM's patch files, which is why we make it external.
external int _scanOneByteCharacters(List<int> units, int from, int endIndex);
-												First version of Codecs and Converters.

No chunked conversions, yet.

R=asiva@google.com, lrn@google.com

Review URL: https://codereview.chromium.org//19000006

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@24999 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-15 10:26:38 +00:00
+								// Copyright (c) 2013, the Dart project authors.  Please see the AUTHORS file
 								// for details. All rights reserved. Use of this source code is governed by a
 								// BSD-style license that can be found in the LICENSE file.
-												Add non-NNBD language version marker to all sdk (non-nnbd) files

This is practically a copy of the change in
https://dart-review.googlesource.com/c/sdk/+/118040 but applied to the non-nnbd
sdk.

Even though there is no intent to run the non-nnbd sdk with the non-nullable
experiment, we need to add this annotation because of how we
intend to gradually start testing NNBD. The libraries.json under
sdk_nnbd is allowed to point to libraries under the non-nnbd sdk in order to
temporarily build without errors until all patch files are migrated and all CFE
issues are addressed.

Change-Id: I53c1123a8d86c10695832a8a0ad35adb7b4d92fd
Reviewed-on: https://dart-review.googlesource.com/c/sdk/+/125181
Commit-Queue: Sigmund Cherem <sigmund@google.com>
Reviewed-by: Bob Nystrom <rnystrom@google.com>

											
										
										
											2019-11-15 00:22:47 +00:00
+								// @dart = 2.6
-												Revert "Use relative URIs for core library part-of statements."

This reverts commit 62bc61b367b14bfe3a265eaddcce0574e0059985.

R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2968413002 .

											
										
										
											2017-07-07 18:18:20 +00:00
+								part of dart.convert;
-												First version of Codecs and Converters.

No chunked conversions, yet.

R=asiva@google.com, lrn@google.com

Review URL: https://codereview.chromium.org//19000006

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@24999 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-15 10:26:38 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// The Unicode Replacement character `U+FFFD` (<28>).
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								const int unicodeReplacementCharacterRune = 0xFFFD;
-												Remove Encoding-enum from dart:io and add interface in dart:convert.

BUG= http://dartbug.com/6284
BUG= http://dartbug.com/7966
R=nweiz@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//22872012

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26632 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-26 10:37:25 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// The Unicode Byte Order Marker (BOM) character `U+FEFF`.
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								const int unicodeBomCharacterRune = 0xFEFF;
-												Fix UTF8 encoder for Unicode runes > 0xFFFF.

R=ajohnsen@google.com

Review URL: https://codereview.chromium.org//25463003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@28095 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-10-01 12:11:02 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// An instance of the default implementation of the [Utf8Codec].
 								///
 								/// This instance provides a convenient access to the most common UTF-8
 								/// use cases.
 								///
 								/// Examples:
 								///
 								///     var encoded = utf8.encode("Îñţérñåţîöñåļîžåţîờñ");
 								///     var decoded = utf8.decode([0x62, 0x6c, 0xc3, 0xa5, 0x62, 0xc3, 0xa6,
 								///                                0x72, 0x67, 0x72, 0xc3, 0xb8, 0x64]);
 								const Utf8Codec utf8 = Utf8Codec();
 								/// A [Utf8Codec] encodes strings to utf-8 code units (bytes) and decodes
 								/// UTF-8 code units to strings.
-												Remove Encoding-enum from dart:io and add interface in dart:convert.

BUG= http://dartbug.com/6284
BUG= http://dartbug.com/7966
R=nweiz@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//22872012

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26632 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-26 10:37:25 +00:00
+								class Utf8Codec extends Encoding {
-												Remove dart:codec and move classes into dart:convert.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19941002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25267 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-22 12:25:16 +00:00
+								  final bool _allowMalformed;
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Instantiates a new [Utf8Codec].
 								  ///
 								  /// The optional [allowMalformed] argument defines how [decoder] (and [decode])
 								  /// deal with invalid or unterminated character sequences.
 								  ///
 								  /// If it is `true` (and not overridden at the method invocation) [decode] and
 								  /// the [decoder] replace invalid (or unterminated) octet
 								  /// sequences with the Unicode Replacement character `U+FFFD` (<28>). Otherwise
 								  /// they throw a [FormatException].
 								  const Utf8Codec({bool allowMalformed = false})
-												Remove dart:codec and move classes into dart:convert.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19941002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25267 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-22 12:25:16 +00:00
+								      : _allowMalformed = allowMalformed;
-												Fix various Encoding documentation. Fixes #31827, #31828, #31829, #31830, #31831

1. Override documentation for Codec.decoder and Codec.encoder so that
   mysterious type parameters `T` and `S` don't appear in documentation, e.g.
   https://api.dartlang.org/stable/2.0.0/dart-convert/Encoding/decoder.html.
   This fixes the documentation for subclasses, including AsciiCodec,
   Latin1Codec, Utf8Codec, and SystemEncoding.
2. Fix typo in `const AsciiCodec()`.
3. Override documentation for AsciiCodec.name.
4. Override documentation for Latin1Codec.name.
5. Override documentation for Utf8Codec.name.
6. Document `const SystemEncoding()`.

Bug: https://github.com/dart-lang/sdk/issues/31827, https://github.com/dart-lang/sdk/issues/31828, https://github.com/dart-lang/sdk/issues/31829, https://github.com/dart-lang/sdk/issues/31830, https://github.com/dart-lang/sdk/issues/31831
Change-Id: I292e1cbafff991b55ab67dba684692b686f3b8de
Reviewed-on: https://dart-review.googlesource.com/c/82788
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>
Commit-Queue: Samuel Rawlins <srawlins@google.com>

											
										
										
											2018-11-03 14:59:18 +00:00
+								  /// The name of this codec, "utf-8".
-												Remove Encoding-enum from dart:io and add interface in dart:convert.

BUG= http://dartbug.com/6284
BUG= http://dartbug.com/7966
R=nweiz@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//22872012

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26632 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-26 10:37:25 +00:00
+								  String get name => "utf-8";
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Decodes the UTF-8 [codeUnits] (a list of unsigned 8-bit integers) to the
 								  /// corresponding string.
 								  ///
 								  /// If the [codeUnits] start with the encoding of a
 								  /// [unicodeBomCharacterRune], that character is discarded.
 								  ///
 								  /// If [allowMalformed] is `true` the decoder replaces invalid (or
 								  /// unterminated) character sequences with the Unicode Replacement character
 								  /// `U+FFFD` (<28>). Otherwise it throws a [FormatException].
 								  ///
 								  /// If [allowMalformed] is not given, it defaults to the `allowMalformed` that
 								  /// was used to instantiate `this`.
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								  String decode(List<int> codeUnits, {bool allowMalformed}) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    allowMalformed ??= _allowMalformed;
 								    return Utf8Decoder(allowMalformed: allowMalformed).convert(codeUnits);
-												Remove dart:codec and move classes into dart:convert.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19941002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25267 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-22 12:25:16 +00:00
+								  }
-												use const constructors of Utf8*

											
										
										
											2015-08-29 20:44:28 +00:00
+								  Utf8Encoder get encoder => const Utf8Encoder();
-												Make Utf8Decoder and Utf8Encoder's convert methods take start and end too.

BUG= http://dartbug.com/21652
R=floitsch@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//736583008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41844 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-20 11:23:51 +00:00
+								  Utf8Decoder get decoder {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    return Utf8Decoder(allowMalformed: _allowMalformed);
-												Remove dart:codec and move classes into dart:convert.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19941002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25267 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-22 12:25:16 +00:00
+								  }
 								}
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// This class converts strings to their UTF-8 code units (a list of
 								/// unsigned 8-bit integers).
-												Fix some strong mode issues in the core libraries.

R=vsm@google.com

Committed: https://github.com/dart-lang/sdk/commit/e5c091e048370a839919cb341fe68904b9e73207
Reverted: https://github.com/dart-lang/sdk/commit/a382f7845c034f3b97bb8532ad7247fad53494e1
Review-Url: https://codereview.chromium.org/2764943002 .

											
										
										
											2017-05-01 13:20:26 +00:00
+								class Utf8Encoder extends Converter<String, List<int>> {
-												Remove Encoding-enum from dart:io and add interface in dart:convert.

BUG= http://dartbug.com/6284
BUG= http://dartbug.com/7966
R=nweiz@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//22872012

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26632 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-26 10:37:25 +00:00
+								  const Utf8Encoder();
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Converts [string] to its UTF-8 code units (a list of
 								  /// unsigned 8-bit integers).
 								  ///
 								  /// If [start] and [end] are provided, only the substring
 								  /// `string.substring(start, end)` is converted.
-												Declare return types of Uint8List.

These methods all were returning Uint8List, yet they were only
declared to return List<int>. This forced callers to either defensively
wrap the return values in Uint8List, or to assume the contravariant
return value:

* Utf8Codec.encode()
* BytesBuilder.takeBytes()
* BytesBuilder.toBytes()
* File.readAsBytes()
* File.readAsBytesSync()
* RandomAccessFile.read()
* RandomAccessFile.readSync()
* Uint8List.sublist()

Since it's related, this change also updates the following sublist()
methods to declare that they return the a sublist of the same type as
the source list:

* Int8List
* Uint8ClampedList
* Int16List
* Uint16List
* Int32List
* Uint32List
* Int64List
* Uint64List
* Float32List
* Float64List
* Float32x4List
* Int32x4List
* Float64x2List

Bug: https://github.com/dart-lang/sdk/issues/36900
Bug: https://github.com/dart-lang/sdk/issues/31547
Bug: https://github.com/dart-lang/sdk/issues/27818
Bug: https://github.com/dart-lang/sdk/issues/35521
Change-Id: Ic3bc1db0d64de36fb68b1d8d98037eed1464f978
Reviewed-on: https://dart-review.googlesource.com/c/sdk/+/101742
Commit-Queue: Todd Volkert <tvolkert@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-06-20 06:43:44 +00:00
+								  Uint8List convert(String string, [int start = 0, int end]) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var stringLength = string.length;
 								    end = RangeError.checkValidRange(start, end, stringLength);
 								    var length = end - start;
 								    if (length == 0) return Uint8List(0);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								    // Create a new encoder with a length that is guaranteed to be big enough.
-												Make Utf8Decoder and Utf8Encoder's convert methods take start and end too.

BUG= http://dartbug.com/21652
R=floitsch@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//736583008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41844 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-20 11:23:51 +00:00
+								    // A single code unit uses at most 3 bytes, a surrogate pair at most 4.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var encoder = _Utf8Encoder.withBufferSize(length * 3);
 								    var endPosition = encoder._fillBuffer(string, start, end);
-												Make Utf8Decoder and Utf8Encoder's convert methods take start and end too.

BUG= http://dartbug.com/21652
R=floitsch@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//736583008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41844 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-20 11:23:51 +00:00
+								    assert(endPosition >= end - 1);
 								    if (endPosition != end) {
 								      // Encoding skipped the last code unit.
 								      // That can only happen if the last code unit is a lead surrogate.
 								      // Force encoding of the lead surrogate by itself.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var lastCodeUnit = string.codeUnitAt(end - 1);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								      assert(_isLeadSurrogate(lastCodeUnit));
 								      // We use a non-surrogate as `nextUnit` so that _writeSurrogate just
 								      // writes the lead-surrogate.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var wasCombined = encoder._writeSurrogate(lastCodeUnit, 0);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								      assert(!wasCombined);
 								    }
 								    return encoder._buffer.sublist(0, encoder._bufferIndex);
 								  }
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Starts a chunked conversion.
 								  ///
 								  /// The converter works more efficiently if the given [sink] is a
 								  /// [ByteConversionSink].
-												Introduce class Sink<T>.

The sink only has "add" and "close" methods. It is the supertype of both EventSink and ChunkedConversionSink.

Made startChunkedConversion take Sink as argument, but still return ChunkedConversionSink. The more specialized chunked conversion sinks are test for, just as they always were.

R=ajohnsen@google.com

Review URL: https://codereview.chromium.org//203603008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@34157 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-03-20 10:13:01 +00:00
+								  StringConversionSink startChunkedConversion(Sink<List<int>> sink) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    return _Utf8EncoderSink(
 								        sink is ByteConversionSink ? sink : ByteConversionSink.from(sink));
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								  }
-												Add transformer support to Converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//20374003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25517 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-26 10:35:42 +00:00
 								  // Override the base class's bind, to provide a better type.
 								  Stream<List<int>> bind(Stream<String> stream) => super.bind(stream);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								}
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// This class encodes Strings to UTF-8 code units (unsigned 8 bit integers).
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								// TODO(floitsch): make this class public.
 								class _Utf8Encoder {
 								  int _carry = 0;
 								  int _bufferIndex = 0;
-												Declare return types of Uint8List.

These methods all were returning Uint8List, yet they were only
declared to return List<int>. This forced callers to either defensively
wrap the return values in Uint8List, or to assume the contravariant
return value:

* Utf8Codec.encode()
* BytesBuilder.takeBytes()
* BytesBuilder.toBytes()
* File.readAsBytes()
* File.readAsBytesSync()
* RandomAccessFile.read()
* RandomAccessFile.readSync()
* Uint8List.sublist()

Since it's related, this change also updates the following sublist()
methods to declare that they return the a sublist of the same type as
the source list:

* Int8List
* Uint8ClampedList
* Int16List
* Uint16List
* Int32List
* Uint32List
* Int64List
* Uint64List
* Float32List
* Float64List
* Float32x4List
* Int32x4List
* Float64x2List

Bug: https://github.com/dart-lang/sdk/issues/36900
Bug: https://github.com/dart-lang/sdk/issues/31547
Bug: https://github.com/dart-lang/sdk/issues/27818
Bug: https://github.com/dart-lang/sdk/issues/35521
Change-Id: Ic3bc1db0d64de36fb68b1d8d98037eed1464f978
Reviewed-on: https://dart-review.googlesource.com/c/sdk/+/101742
Commit-Queue: Todd Volkert <tvolkert@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-06-20 06:43:44 +00:00
+								  final Uint8List _buffer;
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
 								  static const _DEFAULT_BYTE_BUFFER_SIZE = 1024;
 								  _Utf8Encoder() : this.withBufferSize(_DEFAULT_BYTE_BUFFER_SIZE);
 								  _Utf8Encoder.withBufferSize(int bufferSize)
-												Make _Utf8Encoder create its buffer through an external function.

This allows the VM to use a Uint8List, where dart2js still has to use a plain List (due to versions of IE not supporting typed data).

R=floitsch@google.com

Review URL: https://codereview.chromium.org//144473004

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@32193 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-01-31 13:11:25 +00:00
+								      : _buffer = _createBuffer(bufferSize);
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Allow an implementation to pick the most efficient way of storing bytes.
-												Declare return types of Uint8List.

These methods all were returning Uint8List, yet they were only
declared to return List<int>. This forced callers to either defensively
wrap the return values in Uint8List, or to assume the contravariant
return value:

* Utf8Codec.encode()
* BytesBuilder.takeBytes()
* BytesBuilder.toBytes()
* File.readAsBytes()
* File.readAsBytesSync()
* RandomAccessFile.read()
* RandomAccessFile.readSync()
* Uint8List.sublist()

Since it's related, this change also updates the following sublist()
methods to declare that they return the a sublist of the same type as
the source list:

* Int8List
* Uint8ClampedList
* Int16List
* Uint16List
* Int32List
* Uint32List
* Int64List
* Uint64List
* Float32List
* Float64List
* Float32x4List
* Int32x4List
* Float64x2List

Bug: https://github.com/dart-lang/sdk/issues/36900
Bug: https://github.com/dart-lang/sdk/issues/31547
Bug: https://github.com/dart-lang/sdk/issues/27818
Bug: https://github.com/dart-lang/sdk/issues/35521
Change-Id: Ic3bc1db0d64de36fb68b1d8d98037eed1464f978
Reviewed-on: https://dart-review.googlesource.com/c/sdk/+/101742
Commit-Queue: Todd Volkert <tvolkert@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-06-20 06:43:44 +00:00
+								  static Uint8List _createBuffer(int size) => Uint8List(size);
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
 								  /// Tries to combine the given [leadingSurrogate] with the [nextCodeUnit] and
 								  /// writes it to [_buffer].
 								  ///
 								  /// Returns true if the [nextCodeUnit] was combined with the
 								  /// [leadingSurrogate]. If it wasn't then nextCodeUnit was not a trailing
 								  /// surrogate and has not been written yet.
 								  ///
 								  /// It is safe to pass 0 for [nextCodeUnit] in which case only the leading
 								  /// surrogate is written.
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								  bool _writeSurrogate(int leadingSurrogate, int nextCodeUnit) {
 								    if (_isTailSurrogate(nextCodeUnit)) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var rune = _combineSurrogatePair(leadingSurrogate, nextCodeUnit);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								      // If the rune is encoded with 2 code-units then it must be encoded
 								      // with 4 bytes in UTF-8.
 								      assert(rune > _THREE_BYTE_LIMIT);
 								      assert(rune <= _FOUR_BYTE_LIMIT);
 								      _buffer[_bufferIndex++] = 0xF0 | (rune >> 18);
 								      _buffer[_bufferIndex++] = 0x80 | ((rune >> 12) & 0x3f);
 								      _buffer[_bufferIndex++] = 0x80 | ((rune >> 6) & 0x3f);
 								      _buffer[_bufferIndex++] = 0x80 | (rune & 0x3f);
 								      return true;
 								    } else {
 								      // TODO(floitsch): allow to throw on malformed strings.
 								      // Encode the half-surrogate directly into UTF-8. This yields
 								      // invalid UTF-8, but we started out with invalid UTF-16.
 								      // Surrogates are always encoded in 3 bytes in UTF-8.
 								      _buffer[_bufferIndex++] = 0xE0 | (leadingSurrogate >> 12);
 								      _buffer[_bufferIndex++] = 0x80 | ((leadingSurrogate >> 6) & 0x3f);
 								      _buffer[_bufferIndex++] = 0x80 | (leadingSurrogate & 0x3f);
 								      return false;
 								    }
 								  }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Fills the [_buffer] with as many characters as possible.
 								  ///
 								  /// Does not encode any trailing lead-surrogate. This must be done by the
 								  /// caller.
 								  ///
 								  /// Returns the position in the string. The returned index points to the
 								  /// first code unit that hasn't been encoded.
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								  int _fillBuffer(String str, int start, int end) {
 								    if (start != end && _isLeadSurrogate(str.codeUnitAt(end - 1))) {
 								      // Don't handle a trailing lead-surrogate in this loop. The caller has
 								      // to deal with those.
 								      end--;
 								    }
 								    int stringIndex;
 								    for (stringIndex = start; stringIndex < end; stringIndex++) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var codeUnit = str.codeUnitAt(stringIndex);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								      // ASCII has the same representation in UTF-8 and UTF-16.
-												Fix off-by-one error in UTF-8 encoding.

R=lrn@google.com

Review URL: https://codereview.chromium.org//22854028

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26355 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-20 14:03:35 +00:00
+								      if (codeUnit <= _ONE_BYTE_LIMIT) {
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								        if (_bufferIndex >= _buffer.length) break;
 								        _buffer[_bufferIndex++] = codeUnit;
 								      } else if (_isLeadSurrogate(codeUnit)) {
 								        if (_bufferIndex + 3 >= _buffer.length) break;
 								        // Note that it is safe to read the next code unit. We decremented
 								        // [end] above when the last valid code unit was a leading surrogate.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								        var nextCodeUnit = str.codeUnitAt(stringIndex + 1);
 								        var wasCombined = _writeSurrogate(codeUnit, nextCodeUnit);
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								        if (wasCombined) stringIndex++;
 								      } else {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								        var rune = codeUnit;
-												Add UTF-8 encoder.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19593010

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25342 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-23 14:41:21 +00:00
+								        if (rune <= _TWO_BYTE_LIMIT) {
 								          if (_bufferIndex + 1 >= _buffer.length) break;
 								          _buffer[_bufferIndex++] = 0xC0 | (rune >> 6);
 								          _buffer[_bufferIndex++] = 0x80 | (rune & 0x3f);
 								        } else {
 								          assert(rune <= _THREE_BYTE_LIMIT);
 								          if (_bufferIndex + 2 >= _buffer.length) break;
 								          _buffer[_bufferIndex++] = 0xE0 | (rune >> 12);
 								          _buffer[_bufferIndex++] = 0x80 | ((rune >> 6) & 0x3f);
 								          _buffer[_bufferIndex++] = 0x80 | (rune & 0x3f);
 								        }
 								      }
 								    }
 								    return stringIndex;
 								  }
-												First version of Codecs and Converters.

No chunked conversions, yet.

R=asiva@google.com, lrn@google.com

Review URL: https://codereview.chromium.org//19000006

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@24999 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-15 10:26:38 +00:00
+								}
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// This class encodes chunked strings to UTF-8 code units (unsigned 8-bit
 								/// integers).
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								class _Utf8EncoderSink extends _Utf8Encoder with StringConversionSinkMixin {
 								  final ByteConversionSink _sink;
 								  _Utf8EncoderSink(this._sink);
 								  /// Closes this sink, first flushing any lead surrogate held in [_carry].
 								  void close() {
 								    if (_carry == 0) {
 								      _sink.close();
 								    } else {
 								      // Route the pending surrogate through addSlice: with isLast set it
 								      // writes the carry, resets it to 0 and then calls close again.
 								      addSlice("", 0, 0, true);
 								    }
 								  }
 								  void addSlice(String str, int start, int end, bool isLast) {
 								    _bufferIndex = 0;
 								    if (start == end && !isLast) {
 								      return;
 								    }
 								    if (_carry != 0) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var nextCodeUnit = 0;
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								      if (start != end) {
 								        nextCodeUnit = str.codeUnitAt(start);
 								      } else {
 								        assert(isLast);
 								      }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var wasCombined = _writeSurrogate(_carry, nextCodeUnit);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								      // Either we got a non-empty string, or we must not have been combined.
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								      assert(!wasCombined || start != end);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								      if (wasCombined) start++;
 								      _carry = 0;
 								    }
 								    do {
 								      start = _fillBuffer(str, start, end);
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      var isLastSlice = isLast && (start == end);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								      if (start == end - 1 && _isLeadSurrogate(str.codeUnitAt(start))) {
 								        if (isLast && _bufferIndex < _buffer.length - 3) {
 								          // There is still space for the last incomplete surrogate.
 								          // We use a non-surrogate as second argument. This way the
 								          // function will just add the surrogate-half to the buffer.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								          var hasBeenCombined = _writeSurrogate(str.codeUnitAt(start), 0);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								          assert(!hasBeenCombined);
 								        } else {
 								          // Otherwise store it in the carry. If isLast is true, then
 								          // close will flush the last carry.
 								          _carry = str.codeUnitAt(start);
 								        }
 								        start++;
 								      }
 								      _sink.addSlice(_buffer, 0, _bufferIndex, isLastSlice);
 								      _bufferIndex = 0;
 								    } while (start < end);
 								    if (isLast) close();
 								  }
 								  // TODO(floitsch): implement asUtf8Sink. Slightly complicated because it
 								  // needs to deal with malformed input.
 								}
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// This class converts UTF-8 code units (lists of unsigned 8-bit integers)
 								/// to a string.
-												Fix some strong mode issues in the core libraries.

R=vsm@google.com

Committed: https://github.com/dart-lang/sdk/commit/e5c091e048370a839919cb341fe68904b9e73207
Reverted: https://github.com/dart-lang/sdk/commit/a382f7845c034f3b97bb8532ad7247fad53494e1
Review-Url: https://codereview.chromium.org/2764943002 .

											
										
										
											2017-05-01 13:20:26 +00:00
+								class Utf8Decoder extends Converter<List<int>, String> {
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								  final bool _allowMalformed;
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Instantiates a new [Utf8Decoder].
 								  ///
 								  /// The optional [allowMalformed] argument defines how [convert] deals
 								  /// with invalid or unterminated character sequences.
 								  ///
 								  /// If it is `true` [convert] replaces invalid (or unterminated) character
 								  /// sequences with the Unicode Replacement character `U+FFFD` (<28>). Otherwise
 								  /// it throws a [FormatException].
 								  const Utf8Decoder({bool allowMalformed = false})
 								      : _allowMalformed = allowMalformed;
 								  /// Converts the UTF-8 [codeUnits] (a list of unsigned 8-bit integers) to the
 								  /// corresponding string.
 								  ///
 								  /// Uses the code units from [start] to, but not including, [end].
 								  /// If [end] is omitted, it defaults to `codeUnits.length`.
 								  ///
 								  /// If the [codeUnits] start with the encoding of a
 								  /// [unicodeBomCharacterRune], that character is discarded.
-												Make Utf8Decoder and Utf8Encoder's convert methods take start and end too.

BUG= http://dartbug.com/21652
R=floitsch@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//736583008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41844 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-20 11:23:51 +00:00
+								  String convert(List<int> codeUnits, [int start = 0, int end]) {
-												- Allow implementations to hook into the Utf8Decoder.convert method.

R=srdjan@google.com

Review URL: https://codereview.chromium.org//791323003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@43033 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2015-01-21 01:29:14 +00:00
+								    // Allow the implementation to intercept and specialize based on the type
 								    // of codeUnits.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var result = _convertIntercepted(_allowMalformed, codeUnits, start, end);
-												- Allow implementations to hook into the Utf8Decoder.convert method.

R=srdjan@google.com

Review URL: https://codereview.chromium.org//791323003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@43033 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2015-01-21 01:29:14 +00:00
+								    if (result != null) {
-												fix Utf8Decoder hook.

dart2js can infer a non-null String result type with this fix.

TBR=floitsch@google.com

Review URL: https://codereview.chromium.org/1449273002 .

											
										
										
											2015-11-17 02:29:44 +00:00
+								      return result;
-												- Allow implementations to hook into the Utf8Decoder.convert method.

R=srdjan@google.com

Review URL: https://codereview.chromium.org//791323003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@43033 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2015-01-21 01:29:14 +00:00
+								    }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var length = codeUnits.length;
 								    end = RangeError.checkValidRange(start, end, length);
-												Add fast case for ASCII in Utf8Decoder, it significantly increases decoding speed

Issue https://github.com/dart-lang/sdk/issues/31954

Change-Id: I525157d1c91276d35f6678a9066ac72900cc11ed
Reviewed-on: https://dart-review.googlesource.com/c/93434
Commit-Queue: Martin Kustermann <kustermann@google.com>
Reviewed-by: Sigurd Meldgaard <sigurdm@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-02-20 17:19:14 +00:00
 								    // Fast case for ASCII strings avoids StringBuffer/_Utf8Decoder.
 								    int oneBytes = _scanOneByteCharacters(codeUnits, start, end);
 								    StringBuffer buffer;
 								    bool isFirstCharacter = true;
 								    if (oneBytes > 0) {
 								      var firstPart = String.fromCharCodes(codeUnits, start, start + oneBytes);
 								      start += oneBytes;
 								      if (start == end) {
 								        return firstPart;
 								      }
 								      buffer = StringBuffer(firstPart);
 								      isFirstCharacter = false;
 								    }
 								    buffer ??= StringBuffer();
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var decoder = _Utf8Decoder(buffer, _allowMalformed);
-												Add fast case for ASCII in Utf8Decoder, it significantly increases decoding speed

Issue https://github.com/dart-lang/sdk/issues/31954

Change-Id: I525157d1c91276d35f6678a9066ac72900cc11ed
Reviewed-on: https://dart-review.googlesource.com/c/93434
Commit-Queue: Martin Kustermann <kustermann@google.com>
Reviewed-by: Sigurd Meldgaard <sigurdm@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-02-20 17:19:14 +00:00
+								    decoder._isFirstCharacter = isFirstCharacter;
-												Make Utf8Decoder and Utf8Encoder's convert methods take start and end too.

BUG= http://dartbug.com/21652
R=floitsch@google.com, sgjesse@google.com

Review URL: https://codereview.chromium.org//736583008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41844 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-20 11:23:51 +00:00
+								    decoder.convert(codeUnits, start, end);
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								    decoder.flush(codeUnits, end);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								    return buffer.toString();
 								  }
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Starts a chunked conversion.
 								  ///
 								  /// The converter works more efficiently if the given [sink] is a
 								  /// [StringConversionSink].
-												Introduce class Sink<T>.

The sink only has "add" and "close" methods. It is the supertype of both EventSink and ChunkedConversionSink.

Made startChunkedConversion take Sink as argument, but still return ChunkedConversionSink. The more specialized chunked conversion sinks are test for, just as they always were.

R=ajohnsen@google.com

Review URL: https://codereview.chromium.org//203603008

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@34157 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-03-20 10:13:01 +00:00
+								  ByteConversionSink startChunkedConversion(Sink<String> sink) {
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								    StringConversionSink stringSink;
 								    if (sink is StringConversionSink) {
 								      stringSink = sink;
 								    } else {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								      stringSink = StringConversionSink.from(sink);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								    }
 								    return stringSink.asUtf8Sink(_allowMalformed);
 								  }
-												Add transformer support to Converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//20374003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25517 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-26 10:35:42 +00:00
 								  // Overridden only to narrow the declared return type to
 								  // `Stream<String>`; the actual work is delegated to the base class.
 								  Stream<String> bind(Stream<List<int>> stream) {
 								    return super.bind(stream);
 								  }
-												Make JSON.fuse(UTF8) be more efficient by not creating intermediate string.

Adds JsonUtf8Encoder class that can be used directly, or through jsonEncoder.fuse(utf8Encoder) or jsonEncoder.startChunkedConversion(_Utf8EncoderSink).

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//689043002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@41479 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-11-04 10:25:41 +00:00
-												Make core libraries use generic method syntax.

Removes comment syntax where possible for the following platform libraries:
* async
* collection
* convert
* core
* internal
* io
* math

The HTML related libraries are not changed. The templates used to build them
must be changed as well.

R=floitsch@google.com

Committed: https://github.com/dart-lang/sdk/commit/68818315b5cc6c63fea0e10e90f515f6083ec095
Committed: https://github.com/dart-lang/sdk/commit/3f74b8d82edca8c342c43306714e68ddf84548e1
Review-Url: https://codereview.chromium.org/2529393002 .

											
										
										
											2017-01-03 11:05:40 +00:00
+								  external Converter<List<int>, T> fuse<T>(Converter<String, T> next);
-												- Allow implementations to hook into the Utf8Decoder.convert method.

R=srdjan@google.com

Review URL: https://codereview.chromium.org//791323003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@43033 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2015-01-21 01:29:14 +00:00
 								  // Implementation-provided hook that may decode [codeUnits] itself,
 								  // specializing on the type of the list.
 								  //
 								  // [convert] calls this first and returns the result directly when it is
 								  // not `null`; a `null` result makes [convert] fall back to its own
 								  // decoding path.
 								  external static String _convertIntercepted(
 								      bool allowMalformed, List<int> codeUnits, int start, int end);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								}
 								// UTF-8 constants.
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								const int _ONE_BYTE_LIMIT = 0x7f; // 7 bits
 								const int _TWO_BYTE_LIMIT = 0x7ff; // 11 bits
 								const int _THREE_BYTE_LIMIT = 0xffff; // 16 bits
 								const int _FOUR_BYTE_LIMIT = 0x10ffff; // 21 bits, truncated to Unicode max.
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
 								// UTF-16 constants.
 								// Selects the top six bits of a 16-bit code unit; these bits tell lead and
 								// tail surrogates apart from each other and from other code units.
 								const int _SURROGATE_TAG_MASK = 0xFC00;
 								// Selects the low ten bits of a surrogate, i.e. its payload.
 								const int _SURROGATE_VALUE_MASK = 0x3FF;
 								// Value of the tag bits for a lead surrogate.
 								const int _LEAD_SURROGATE_MIN = 0xD800;
 								// Value of the tag bits for a tail surrogate.
 								const int _TAIL_SURROGATE_MIN = 0xDC00;
 								/// Whether [codeUnit] is a UTF-16 lead surrogate.
 								///
 								/// Only the bits selected by [_SURROGATE_TAG_MASK] are compared against
 								/// [_LEAD_SURROGATE_MIN]; the remaining bits are ignored.
 								bool _isLeadSurrogate(int codeUnit) {
 								  var tagBits = codeUnit & _SURROGATE_TAG_MASK;
 								  return tagBits == _LEAD_SURROGATE_MIN;
 								}
 								/// Whether [codeUnit] is a UTF-16 tail surrogate.
 								///
 								/// Only the bits selected by [_SURROGATE_TAG_MASK] are compared against
 								/// [_TAIL_SURROGATE_MIN]; the remaining bits are ignored.
 								bool _isTailSurrogate(int codeUnit) {
 								  var tagBits = codeUnit & _SURROGATE_TAG_MASK;
 								  return tagBits == _TAIL_SURROGATE_MIN;
 								}
 								int _combineSurrogatePair(int lead, int tail) =>
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								    0x10000 + ((lead & _SURROGATE_VALUE_MASK) << 10) |
 								    (tail & _SURROGATE_VALUE_MASK);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								/// Decodes UTF-8.
 								///
 								/// The decoder handles chunked input.
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								// TODO(floitsch): make this class public.
 								class _Utf8Decoder {
 								  final bool _allowMalformed;
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								  final StringSink _stringSink;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								  bool _isFirstCharacter = true;
 								  int _value = 0;
 								  int _expectedUnits = 0;
 								  int _extraUnits = 0;
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								  _Utf8Decoder(this._stringSink, this._allowMalformed);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
 								  /// Whether a multi-byte sequence has been started but not completed,
 								  /// that is, whether further code units are still expected.
 								  bool get hasPartialInput {
 								    return _expectedUnits > 0;
 								  }
 								  // Limits of one through four byte encodings.
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  static const List<int> _LIMITS = <int>[
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								    _ONE_BYTE_LIMIT,
 								    _TWO_BYTE_LIMIT,
 								    _THREE_BYTE_LIMIT,
 								    _FOUR_BYTE_LIMIT
 								  ];
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								  void close() {
 								    flush();
 								  }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								  /// Flushes this decoder as if closed.
 								  ///
 								  /// This method throws if the input was partial and the decoder was
 								  /// constructed with `allowMalformed` set to `false`.
 								  ///
 								  /// The [source] and [offset] of the current position may be provided,
 								  /// and are included in the exception if one is thrown.
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								  void flush([List<int> source, int offset]) {
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								    if (hasPartialInput) {
 								      if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								        throw FormatException(
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								            "Unfinished UTF-8 octet sequence", source, offset);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								      }
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								      _stringSink.writeCharCode(unicodeReplacementCharacterRune);
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								      _value = 0;
 								      _expectedUnits = 0;
 								      _extraUnits = 0;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								    }
 								  }
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								  void convert(List<int> codeUnits, int startIndex, int endIndex) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var value = _value;
 								    var expectedUnits = _expectedUnits;
 								    var extraUnits = _extraUnits;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								    _value = 0;
 								    _expectedUnits = 0;
 								    _extraUnits = 0;
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								    var i = startIndex;
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								    loop:
 								    while (true) {
 								      multibyte:
 								      if (expectedUnits > 0) {
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        do {
 								          if (i == endIndex) {
 								            break loop;
 								          }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								          var unit = codeUnits[i];
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          if ((unit & 0xC0) != 0x80) {
 								            expectedUnits = 0;
 								            if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								              throw FormatException(
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								                  "Bad UTF-8 encoding 0x${unit.toRadixString(16)}",
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								                  codeUnits,
 								                  i);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								            }
 								            _isFirstCharacter = false;
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								            _stringSink.writeCharCode(unicodeReplacementCharacterRune);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								            break multibyte;
 								          } else {
 								            value = (value << 6) | (unit & 0x3f);
 								            expectedUnits--;
 								            i++;
 								          }
 								        } while (expectedUnits > 0);
 								        if (value <= _LIMITS[extraUnits - 1]) {
 								          // Overly long encoding. The value could be encoded with a shorter
 								          // encoding.
 								          if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								            throw FormatException(
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								                "Overlong encoding of 0x${value.toRadixString(16)}",
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								                codeUnits,
 								                i - extraUnits - 1);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          }
 								          expectedUnits = extraUnits = 0;
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								          value = unicodeReplacementCharacterRune;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        }
 								        if (value > _FOUR_BYTE_LIMIT) {
 								          if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								            throw FormatException(
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								                "Character outside valid Unicode range: "
 								                "0x${value.toRadixString(16)}",
 								                codeUnits,
 								                i - extraUnits - 1);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          }
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								          value = unicodeReplacementCharacterRune;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        }
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								        if (!_isFirstCharacter || value != unicodeBomCharacterRune) {
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								          _stringSink.writeCharCode(value);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        }
 								        _isFirstCharacter = false;
 								      }
 								      while (i < endIndex) {
-												Reland "[VM] Inline ClassID.getID() eagerly, extend pattern matching logic to recognize it, use it to special case ascii decoding"

This change extends/fixes the existing "pattern recognition" which tries
to recognize the pattern

  v2 <- LoadClassIdInstr(v1)
  BranchIf v2 == IntegerConstant(cid)

Furthermore we start inlining the recognized `ClassID.getID` method very
early in the pipeline.  This allows the VM to recognize the above
pattern and insert redefinitions before the actual inlining pass.

Furthermore we special-case two very hot methods in utf8 decoding by
manually having two loops, one of which is guarded by a class-id check
against the _Uint8ArrayView class, which is most common.  (In the future
we would like to unify the typed data layouts so we no longer need to
use `ClassId.getID`, thereby also allowing non core library code to use
this).

This improves dart-aot by
  * 31%+ for a protobuf decoding benchmark we care about

Issue https://github.com/dart-lang/sdk/issues/31954

Change-Id: I7181bbf096aabe303634fd3b2bff9cc96d69719c
Reviewed-on: https://dart-review.googlesource.com/c/85443
Reviewed-by: Vyacheslav Egorov <vegorov@google.com>
Commit-Queue: Martin Kustermann <kustermann@google.com>

											
										
										
											2018-11-28 10:43:32 +00:00
+								        var oneBytes = _scanOneByteCharacters(codeUnits, i, endIndex);
-												Improve utf8 decoding of single-char bytes, by isolating the loop.

BUG=
R=fschneider@google.com

Review URL: https://codereview.chromium.org//435553002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@38776 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-07-31 12:23:11 +00:00
+								        if (oneBytes > 0) {
 								          _isFirstCharacter = false;
-												Add fast case for ASCII in Utf8Decoder, it significantly increases decoding speed

Issue https://github.com/dart-lang/sdk/issues/31954

Change-Id: I525157d1c91276d35f6678a9066ac72900cc11ed
Reviewed-on: https://dart-review.googlesource.com/c/93434
Commit-Queue: Martin Kustermann <kustermann@google.com>
Reviewed-by: Sigurd Meldgaard <sigurdm@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2019-02-20 17:19:14 +00:00
+								          assert(i + oneBytes <= endIndex);
 								          _stringSink.write(String.fromCharCodes(codeUnits, i, i + oneBytes));
-												Improve utf8 decoding of single-char bytes, by isolating the loop.

BUG=
R=fschneider@google.com

Review URL: https://codereview.chromium.org//435553002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@38776 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-07-31 12:23:11 +00:00
+								          i += oneBytes;
 								          if (i == endIndex) break;
 								        }
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								        var unit = codeUnits[i++];
-												Treat negative utf8-units the same way as other broken encodings.

R=lrn@google.com

Review URL: https://codereview.chromium.org//22929022

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26528 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-22 15:40:41 +00:00
+								        // TODO(floitsch): the way we test we could potentially allow
 								        // units that are too large, if they happen to have the
 								        // right bit-pattern. (Same is true for the multibyte loop above).
 								        // TODO(floitsch): optimize this loop. See:
 								        // https://codereview.chromium.org/22929022/diff/1/sdk/lib/convert/utf.dart?column_width=80
 								        if (unit < 0) {
 								          // TODO(floitsch): should this be unit <= 0 ?
 								          if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								            throw FormatException(
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								                "Negative UTF-8 code unit: -0x${(-unit).toRadixString(16)}",
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								                codeUnits,
 								                i - 1);
-												Treat negative utf8-units the same way as other broken encodings.

R=lrn@google.com

Review URL: https://codereview.chromium.org//22929022

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@26528 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-08-22 15:40:41 +00:00
+								          }
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								          _stringSink.writeCharCode(unicodeReplacementCharacterRune);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        } else {
-												Improve utf8 decoding of single-char bytes, by isolating the loop.

BUG=
R=fschneider@google.com

Review URL: https://codereview.chromium.org//435553002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@38776 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2014-07-31 12:23:11 +00:00
+								          assert(unit > _ONE_BYTE_LIMIT);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          if ((unit & 0xE0) == 0xC0) {
 								            value = unit & 0x1F;
 								            expectedUnits = extraUnits = 1;
 								            continue loop;
 								          }
 								          if ((unit & 0xF0) == 0xE0) {
 								            value = unit & 0x0F;
 								            expectedUnits = extraUnits = 2;
 								            continue loop;
 								          }
 								          // 0xF5, 0xF6 ... 0xFF never appear in valid UTF-8 sequences.
 								          if ((unit & 0xF8) == 0xF0 && unit < 0xF5) {
 								            value = unit & 0x07;
 								            expectedUnits = extraUnits = 3;
 								            continue loop;
 								          }
 								          if (!_allowMalformed) {
-												cleanup dart:convert

Fixed a number of standard lints

Change-Id: I36e535c6dc91f3c7407c66a8089c38e0463bee83
Reviewed-on: https://dart-review.googlesource.com/c/81700
Auto-Submit: Kevin Moore <kevmoo@google.com>
Commit-Queue: Kevin Moore <kevmoo@google.com>
Reviewed-by: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2018-10-26 23:05:24 +00:00
+								            throw FormatException(
-												Add offset to UTF8-decode format exceptions.

Fixes issue #28293

BUG= http://dartbug.com/28293
R=floitsch@google.com

Review-Url: https://codereview.chromium.org/2619793002 .

											
										
										
											2017-01-23 13:18:40 +00:00
+								                "Bad UTF-8 encoding 0x${unit.toRadixString(16)}",
-												Format all dart: library files

BUG=
R=floitsch@google.com, sra@google.com

Review-Url: https://codereview.chromium.org/2754013002 .

											
										
										
											2017-03-16 17:22:19 +00:00
+								                codeUnits,
 								                i - 1);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          }
-												Change some constant declarations to lowerCase.

Retain the old values.

Reapply of https://dart-review.googlesource.com/c/sdk/+/20680 with fixes
for VM method fingerprints.

Change-Id: Ie14e7ccc3194d5561983348e6b6752728913ff4d
Reviewed-on: https://dart-review.googlesource.com/20664
Reviewed-by: Erik Ernst <eernst@google.com>
Commit-Queue: Lasse R.H. Nielsen <lrn@google.com>

											
										
										
											2017-11-14 12:59:14 +00:00
+								          value = unicodeReplacementCharacterRune;
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								          expectedUnits = extraUnits = 0;
 								          _isFirstCharacter = false;
-												Add chunked conversion to converters.

R=sgjesse@google.com

Review URL: https://codereview.chromium.org//19883003

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25466 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-25 13:26:09 +00:00
+								          _stringSink.writeCharCode(value);
-												Replace old utf8 decoder with new one.

R=lrn@google.com

Review URL: https://codereview.chromium.org//19187002

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@25089 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-17 11:35:12 +00:00
+								        }
 								      }
 								      break loop;
 								    }
 								    if (expectedUnits > 0) {
 								      _value = value;
 								      _expectedUnits = expectedUnits;
 								      _extraUnits = extraUnits;
 								    }
 								  }
-												First version of Codecs and Converters.

No chunked conversions, yet.

R=asiva@google.com, lrn@google.com

Review URL: https://codereview.chromium.org//19000006

git-svn-id: https://dart.googlecode.com/svn/branches/bleeding_edge/dart@24999 260f80e4-7a28-3924-810f-c04153c831b5

											
										
										
											2013-07-15 10:26:38 +00:00
+								}
-												Reland "[VM] Inline ClassID.getID() eagerly, extend pattern matching logic to recognize it, use it to special case ascii decoding"

This change extends/fixes the existing "pattern recognition" which tries
to recognize the pattern

  v2 <- LoadClassIdInstr(v1)
  BranchIf v2 == IntegerConstant(cid)

Furthermore we start inlining the recognized `ClassID.getID` method very
early in the pipeline.  This allows the VM to recognize the above
pattern and insert redefinitions before the actual inlining pass.

Furthermore we special-case two very hot methods in utf8 decoding by
manually having two loops, one of which is guarded by a class-id check
against the _Uint8ArrayView class, which is most common.  (In the future
we would like to unify the typed data layouts so we no longer need to
use `ClassId.getID`, thereby also allowing non core library code to use
this).

This improves dart-aot by
  * 31%+ for a protobuf decoding benchmark we care about

Issue https://github.com/dart-lang/sdk/issues/31954

Change-Id: I7181bbf096aabe303634fd3b2bff9cc96d69719c
Reviewed-on: https://dart-review.googlesource.com/c/85443
Reviewed-by: Vyacheslav Egorov <vegorov@google.com>
Commit-Queue: Martin Kustermann <kustermann@google.com>

											
										
										
											2018-11-28 10:43:32 +00:00
 								// Returns the number of bytes in [units] starting at offset [from] which have
 								// the leftmost bit set to 0.
 								//
 								// The decoder loop in this file passes the exclusive end of the range being
 								// converted as [endIndex] and asserts that `from + result <= endIndex`.
 								// When the result is greater than zero, the caller writes
 								// `units[from .. from + result)` to its sink as one string and advances by
 								// that amount; when it is zero, the caller inspects the unit at [from]
 								// itself (negative unit or lead byte of a multi-byte sequence).
 								//
 								// NOTE(review): presumably only the leading run of such bytes is counted
 								// and scanning stops at the first other unit or at [endIndex]; the
 								// implementation is not visible here -- confirm against the patch files.
 								//
 								// To increase performance of this critical method we have a special variant of
 								// it implemented in the VM's patch files, which is why we make it external.
 								external int _scanOneByteCharacters(List<int> units, int from, int endIndex);