|  | /* | 
|  | * Copyright (C) 2013 Google Inc. All rights reserved. | 
|  | * | 
|  | * Redistribution and use in source and binary forms, with or without | 
|  | * modification, are permitted provided that the following conditions are | 
|  | * met: | 
|  | * | 
|  | *     * Redistributions of source code must retain the above copyright | 
|  | * notice, this list of conditions and the following disclaimer. | 
|  | *     * Redistributions in binary form must reproduce the above | 
|  | * copyright notice, this list of conditions and the following disclaimer | 
|  | * in the documentation and/or other materials provided with the | 
|  | * distribution. | 
|  | *     * Neither the name of Google Inc. nor the names of its | 
|  | * contributors may be used to endorse or promote products derived from | 
|  | * this software without specific prior written permission. | 
|  | * | 
|  | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | 
|  | * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | 
|  | * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | 
|  | * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | 
|  | * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | 
|  | * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | 
|  | * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | 
|  | * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | 
|  | * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 
|  | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
|  | * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
|  | */ | 
|  |  | 
|  | #include "third_party/blink/renderer/modules/encoding/text_decoder.h" | 
|  |  | 
|  | #include "third_party/blink/renderer/bindings/core/v8/v8_union_arraybuffer_arraybufferview.h" | 
|  | #include "third_party/blink/renderer/core/typed_arrays/dom_array_buffer.h" | 
|  | #include "third_party/blink/renderer/core/typed_arrays/dom_array_buffer_view.h" | 
|  | #include "third_party/blink/renderer/modules/encoding/encoding.h" | 
|  | #include "third_party/blink/renderer/platform/bindings/exception_state.h" | 
|  | #include "third_party/blink/renderer/platform/wtf/text/string_view.h" | 
|  | #include "third_party/blink/renderer/platform/wtf/text/text_encoding_registry.h" | 
|  |  | 
|  | namespace blink { | 
|  |  | 
|  | TextDecoder* TextDecoder::Create(const String& label, | 
|  | const TextDecoderOptions* options, | 
|  | ExceptionState& exception_state) { | 
|  | WTF::TextEncoding encoding( | 
|  | label.StripWhiteSpace(&encoding::IsASCIIWhiteSpace)); | 
|  | // The replacement encoding is not valid, but the Encoding API also | 
|  | // rejects aliases of the replacement encoding. | 
|  | if (!encoding.IsValid() || | 
|  | WTF::EqualIgnoringASCIICase(encoding.GetName(), "replacement")) { | 
|  | exception_state.ThrowRangeError("The encoding label provided ('" + label + | 
|  | "') is invalid."); | 
|  | return nullptr; | 
|  | } | 
|  |  | 
|  | return MakeGarbageCollected<TextDecoder>(encoding, options->fatal(), | 
|  | options->ignoreBOM()); | 
|  | } | 
|  |  | 
|  | TextDecoder::TextDecoder(const WTF::TextEncoding& encoding, | 
|  | bool fatal, | 
|  | bool ignore_bom) | 
|  | : encoding_(encoding), | 
|  | fatal_(fatal), | 
|  | ignore_bom_(ignore_bom), | 
|  | bom_seen_(false) {} | 
|  |  | 
|  | TextDecoder::~TextDecoder() = default; | 
|  |  | 
|  | String TextDecoder::encoding() const { | 
|  | String name = String(encoding_.GetName()).DeprecatedLower(); | 
|  | // Where possible, encoding aliases should be handled by changes to Chromium's | 
|  | // ICU or Blink's WTF.  The same codec is used, but WTF maintains a different | 
|  | // name/identity for these. | 
|  | if (name == "iso-8859-1" || name == "us-ascii") | 
|  | return "windows-1252"; | 
|  | return name; | 
|  | } | 
|  |  | 
|  | #if defined(USE_BLINK_V8_BINDING_NEW_IDL_UNION) | 
|  | String TextDecoder::decode(const V8BufferSource* input, | 
|  | const TextDecodeOptions* options, | 
|  | ExceptionState& exception_state) { | 
|  | DCHECK(options); | 
|  | // In case of `input` == IDL "missing" special value, default to (nullptr, 0). | 
|  | void* start = nullptr; | 
|  | size_t length = 0; | 
|  | if (input) { | 
|  | switch (input->GetContentType()) { | 
|  | case V8BufferSource::ContentType::kArrayBuffer: | 
|  | start = input->GetAsArrayBuffer()->Data(); | 
|  | length = input->GetAsArrayBuffer()->ByteLength(); | 
|  | break; | 
|  | case V8BufferSource::ContentType::kArrayBufferView: | 
|  | start = input->GetAsArrayBufferView()->BaseAddress(); | 
|  | length = input->GetAsArrayBufferView()->byteLength(); | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (length > std::numeric_limits<uint32_t>::max()) { | 
|  | exception_state.ThrowRangeError( | 
|  | "Buffer size exceeds maximum heap object size."); | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | return decode(static_cast<const char*>(start), static_cast<uint32_t>(length), | 
|  | options, exception_state); | 
|  | } | 
|  | #else   // defined(USE_BLINK_V8_BINDING_NEW_IDL_UNION) | 
|  | String TextDecoder::decode(const BufferSource& input, | 
|  | const TextDecodeOptions* options, | 
|  | ExceptionState& exception_state) { | 
|  | DCHECK(options); | 
|  | // In case of `input` == IDL "missing" special value, default to (nullptr, 0). | 
|  | void* start = nullptr; | 
|  | size_t length = 0; | 
|  | if (input.IsArrayBufferView()) { | 
|  | start = input.GetAsArrayBufferView()->BaseAddress(); | 
|  | length = input.GetAsArrayBufferView()->byteLength(); | 
|  | } else if (input.IsArrayBuffer()) { | 
|  | start = input.GetAsArrayBuffer()->Data(); | 
|  | length = input.GetAsArrayBuffer()->ByteLength(); | 
|  | } | 
|  |  | 
|  | if (length > std::numeric_limits<uint32_t>::max()) { | 
|  | exception_state.ThrowRangeError( | 
|  | "Buffer size exceeds maximum heap object size."); | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | return decode(static_cast<const char*>(start), static_cast<uint32_t>(length), | 
|  | options, exception_state); | 
|  | } | 
|  | #endif  // defined(USE_BLINK_V8_BINDING_NEW_IDL_UNION) | 
|  |  | 
|  | String TextDecoder::decode(const char* start, | 
|  | uint32_t length, | 
|  | const TextDecodeOptions* options, | 
|  | ExceptionState& exception_state) { | 
|  | DCHECK(options); | 
|  | if (!do_not_flush_) { | 
|  | if (!codec_) { | 
|  | // In the spec, a new decoder is created unconditionally here, but that | 
|  | // requires an extra allocation. Since the TextCodec would be flushed | 
|  | // here by the previous call if `!do_not_flush` (sorry about the double | 
|  | // negatives), then we don't need a new TextCodec to match the spec | 
|  | // behavior. | 
|  | // https://encoding.spec.whatwg.org/#dom-textdecoder-decode | 
|  | codec_ = NewTextCodec(encoding_); | 
|  | } | 
|  | bom_seen_ = false; | 
|  | } | 
|  |  | 
|  | DCHECK(codec_); | 
|  | do_not_flush_ = options->stream(); | 
|  | WTF::FlushBehavior flush = do_not_flush_ ? WTF::FlushBehavior::kDoNotFlush | 
|  | : WTF::FlushBehavior::kDataEOF; | 
|  |  | 
|  | bool saw_error = false; | 
|  | String s = codec_->Decode(start, length, flush, fatal_, saw_error); | 
|  |  | 
|  | if (fatal_ && saw_error) { | 
|  | if (!do_not_flush_) { | 
|  | // If flushing, the error should not persist. | 
|  | codec_.reset(); | 
|  | } | 
|  | exception_state.ThrowTypeError("The encoded data was not valid."); | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | if (!ignore_bom_ && !bom_seen_ && !s.IsEmpty()) { | 
|  | bom_seen_ = true; | 
|  | String name(encoding_.GetName()); | 
|  | if ((name == "UTF-8" || name == "UTF-16LE" || name == "UTF-16BE") && | 
|  | s[0] == 0xFEFF) | 
|  | s.Remove(0); | 
|  | } | 
|  |  | 
|  | return s; | 
|  | } | 
|  |  | 
|  | String TextDecoder::decode(ExceptionState& exception_state) { | 
|  | TextDecodeOptions* options = TextDecodeOptions::Create(); | 
|  | return decode(nullptr, 0, options, exception_state); | 
|  | } | 
|  |  | 
|  | }  // namespace blink |