| // Copyright 2018 The Chromium Authors |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "third_party/blink/renderer/modules/encoding/text_decoder_stream.h" |
| |
| #include <limits> |
| #include <memory> |
| #include <utility> |
| |
| #include "third_party/blink/renderer/bindings/core/v8/script_promise.h" |
| #include "third_party/blink/renderer/bindings/core/v8/script_value.h" |
| #include "third_party/blink/renderer/bindings/core/v8/to_v8_traits.h" |
| #include "third_party/blink/renderer/bindings/core/v8/v8_binding_for_core.h" |
| #include "third_party/blink/renderer/bindings/core/v8/v8_typedefs.h" |
| #include "third_party/blink/renderer/bindings/core/v8/v8_union_arraybuffer_arraybufferview.h" |
| #include "third_party/blink/renderer/bindings/modules/v8/v8_text_decoder_options.h" |
| #include "third_party/blink/renderer/core/streams/transform_stream_default_controller.h" |
| #include "third_party/blink/renderer/core/streams/transform_stream_transformer.h" |
| #include "third_party/blink/renderer/core/typed_arrays/dom_array_piece.h" |
| #include "third_party/blink/renderer/core/typed_arrays/dom_typed_array.h" |
| #include "third_party/blink/renderer/modules/encoding/encoding.h" |
| #include "third_party/blink/renderer/platform/bindings/exception_messages.h" |
| #include "third_party/blink/renderer/platform/bindings/exception_state.h" |
| #include "third_party/blink/renderer/platform/wtf/text/string_view.h" |
| #include "third_party/blink/renderer/platform/wtf/text/text_codec.h" |
| #include "third_party/blink/renderer/platform/wtf/text/text_encoding.h" |
| #include "third_party/blink/renderer/platform/wtf/text/text_encoding_registry.h" |
| |
| namespace blink { |
| |
| // Transformer plugged into the TransformStream owned by TextDecoderStream. |
| // It decodes incoming buffer-source chunks with a WTF::TextCodec and enqueues |
| // each non-empty decoded string on the stream controller. |
| class TextDecoderStream::Transformer final : public TransformStreamTransformer { |
|  public: |
|   // Creates the codec for `encoding` via NewTextCodec() and records the |
|   // `fatal` / `ignore_bom` options, which are consulted on every decode. |
|   explicit Transformer(ScriptState* script_state, |
|                        WTF::TextEncoding encoding, |
|                        bool fatal, |
|                        bool ignore_bom) |
|       : decoder_(NewTextCodec(encoding)), |
|         script_state_(script_state), |
|         fatal_(fatal), |
|         ignore_bom_(ignore_bom), |
|         encoding_has_bom_removal_(EncodingHasBomRemoval(encoding)) {} |
| |
|   Transformer(const Transformer&) = delete; |
|   Transformer& operator=(const Transformer&) = delete; |
| |
|   // Implements the type conversion part of the "decode and enqueue a chunk" |
|   // algorithm: converts `chunk` to a buffer source, then hands its bytes to |
|   // DecodeAndEnqueue() without flushing the codec. |
|   // Returns an empty ScriptPromise if the conversion throws or if the chunk is |
|   // too large (a RangeError is thrown on `exception_state` in that case). |
|   ScriptPromise Transform(v8::Local<v8::Value> chunk, |
|                           TransformStreamDefaultController* controller, |
|                           ExceptionState& exception_state) override { |
|     auto* buffer_source = V8BufferSource::Create(script_state_->GetIsolate(), |
|                                                  chunk, exception_state); |
|     if (exception_state.HadException()) |
|       return ScriptPromise(); |
| |
|     // This implements the "get a copy of the bytes held by the buffer source" |
|     // algorithm (https://webidl.spec.whatwg.org/#dfn-get-buffer-source-copy). |
|     DOMArrayPiece array_piece(buffer_source); |
|     // DecodeAndEnqueue() takes a 32-bit length, so reject anything larger |
|     // instead of silently truncating in the cast below. |
|     if (array_piece.ByteLength() > std::numeric_limits<uint32_t>::max()) { |
|       exception_state.ThrowRangeError( |
|           "Buffer size exceeds maximum heap object size."); |
|       return ScriptPromise(); |
|     } |
|     DecodeAndEnqueue(static_cast<char*>(array_piece.Data()), |
|                      static_cast<uint32_t>(array_piece.ByteLength()), |
|                      WTF::FlushBehavior::kDoNotFlush, controller, |
|                      exception_state); |
|     return ScriptPromise::CastUndefined(script_state_.Get()); |
|   } |
| |
|   // Implements the "flush and enqueue" algorithm: signals end-of-data to the |
|   // codec with an empty input so any pending output is decoded and enqueued. |
|   ScriptPromise Flush(TransformStreamDefaultController* controller, |
|                       ExceptionState& exception_state) override { |
|     DecodeAndEnqueue(nullptr, 0u, WTF::FlushBehavior::kDataEOF, controller, |
|                      exception_state); |
| |
|     return ScriptPromise::CastUndefined(script_state_.Get()); |
|   } |
| |
|   ScriptState* GetScriptState() override { return script_state_.Get(); } |
| |
|   void Trace(Visitor* visitor) const override { |
|     visitor->Trace(script_state_); |
|     TransformStreamTransformer::Trace(visitor); |
|   } |
| |
|  private: |
|   // Implements the second part of "decode and enqueue a chunk" as well as the |
|   // "flush and enqueue" algorithm. |
|   // Decodes `length` bytes starting at `start` using `flush` behavior. Throws |
|   // a TypeError when in fatal mode and the codec reported an error. Otherwise |
|   // enqueues the decoded string on `controller`, unless it is empty (either |
|   // before or after BOM removal). |
|   void DecodeAndEnqueue(const char* start, |
|                         uint32_t length, |
|                         WTF::FlushBehavior flush, |
|                         TransformStreamDefaultController* controller, |
|                         ExceptionState& exception_state) { |
|     const UChar kBOM = 0xFEFF; |
| |
|     bool saw_error = false; |
|     String output_chunk = |
|         decoder_->Decode(start, length, flush, fatal_, saw_error); |
| |
|     if (fatal_ && saw_error) { |
|       exception_state.ThrowTypeError("The encoded data was not valid."); |
|       return; |
|     } |
| |
|     if (output_chunk.empty()) |
|       return; |
| |
|     // Only the first non-empty decoded chunk is inspected for a BOM; after |
|     // that `bom_seen_` stays true and later chunks pass through untouched. |
|     if (!ignore_bom_ && !bom_seen_) { |
|       bom_seen_ = true; |
|       if (encoding_has_bom_removal_ && output_chunk[0] == kBOM) { |
|         output_chunk.Remove(0); |
|         if (output_chunk.empty()) |
|           return; |
|       } |
|     } |
| |
|     controller->enqueue( |
|         script_state_, |
|         ScriptValue(script_state_->GetIsolate(), |
|                     V8String(script_state_->GetIsolate(), output_chunk)), |
|         exception_state); |
|   } |
| |
|   // Returns true when the name of `encoding` is one of "UTF-8", "UTF-16LE" or |
|   // "UTF-16BE", the only encodings for which a leading BOM is stripped here. |
|   static bool EncodingHasBomRemoval(const WTF::TextEncoding& encoding) { |
|     String name(encoding.GetName()); |
|     return name == "UTF-8" || name == "UTF-16LE" || name == "UTF-16BE"; |
|   } |
| |
|   std::unique_ptr<WTF::TextCodec> decoder_; |
|   // There is no danger of ScriptState leaking across worlds because a |
|   // TextDecoderStream can only be accessed from the world that created it. |
|   Member<ScriptState> script_state_; |
|   const bool fatal_; |
|   const bool ignore_bom_; |
|   const bool encoding_has_bom_removal_; |
|   // Set once the first non-empty decoded chunk has been checked for a BOM. |
|   // Explicitly initialized: it is read in DecodeAndEnqueue() before any write |
|   // and the constructor does not set it. |
|   bool bom_seen_ = false; |
| }; |
| |
| // Factory for TextDecoderStream. Resolves `label` (with ASCII whitespace |
| // stripped) to an encoding and returns a new stream for it. Throws a |
| // RangeError on `exception_state` and returns nullptr when the label does not |
| // name a usable encoding. |
| TextDecoderStream* TextDecoderStream::Create(ScriptState* script_state, |
|                                              const String& label, |
|                                              const TextDecoderOptions* options, |
|                                              ExceptionState& exception_state) { |
|   const String trimmed_label = |
|       label.StripWhiteSpace(&encoding::IsASCIIWhiteSpace); |
|   WTF::TextEncoding encoding(trimmed_label); |
| |
|   // An invalid encoding is rejected outright. The Encoding API additionally |
|   // rejects the replacement encoding and its aliases, so a valid encoding |
|   // whose name is "replacement" is treated as unusable too. |
|   const bool is_usable = |
|       encoding.IsValid() && |
|       !WTF::EqualIgnoringASCIICase(encoding.GetName(), "replacement"); |
|   if (is_usable) { |
|     return MakeGarbageCollected<TextDecoderStream>(script_state, encoding, |
|                                                    options, exception_state); |
|   } |
| |
|   // The message quotes the label exactly as the caller supplied it. |
|   exception_state.ThrowRangeError("The encoding label provided ('" + label + |
|                                   "') is invalid."); |
|   return nullptr; |
| } |
| |
| // Defaulted destructor, defined out of line in this file; no explicit |
| // cleanup is written here. |
| TextDecoderStream::~TextDecoderStream() = default; |
| |
| // Returns the name of the stream's encoding, converted to ASCII lowercase. |
| String TextDecoderStream::encoding() const { |
|   const String canonical_name(encoding_.GetName()); |
|   return canonical_name.LowerASCII(); |
| } |
| |
| // Returns the readable side of the wrapped transform stream. |
| ReadableStream* TextDecoderStream::readable() const { |
|   ReadableStream* const readable_side = transform_->Readable(); |
|   return readable_side; |
| } |
| |
| // Returns the writable side of the wrapped transform stream. |
| WritableStream* TextDecoderStream::writable() const { |
|   WritableStream* const writable_side = transform_->Writable(); |
|   return writable_side; |
| } |
| |
| // Reports `transform_` to `visitor`, then delegates to the ScriptWrappable |
| // base class so its own traced members are visited as well. |
| void TextDecoderStream::Trace(Visitor* visitor) const { |
| visitor->Trace(transform_); |
| ScriptWrappable::Trace(visitor); |
| } |
| |
| // Builds the wrapped transform stream around a newly allocated Transformer |
| // configured with `encoding` and the `fatal` / `ignoreBOM` values read from |
| // `options`, then records the encoding and both option values on this object. |
| // Errors from TransformStream::Create() are reported through |
| // `exception_state`. |
| // NOTE(review): `options` is dereferenced without a null check; presumably |
| // the bindings layer always passes a dictionary -- confirm against callers. |
| TextDecoderStream::TextDecoderStream(ScriptState* script_state, |
| const WTF::TextEncoding& encoding, |
| const TextDecoderOptions* options, |
| ExceptionState& exception_state) |
| : transform_(TransformStream::Create( |
| script_state, |
| MakeGarbageCollected<Transformer>(script_state, |
| encoding, |
| options->fatal(), |
| options->ignoreBOM()), |
| exception_state)), |
| encoding_(encoding), |
| fatal_(options->fatal()), |
| ignore_bom_(options->ignoreBOM()) {} |
| |
| } // namespace blink |