blob: 77212bc311c10b07f10a81654bc1663392675cab [file] [log] [blame]
/*
* Copyright (C) 2010 Google, Inc. All Rights Reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "third_party/blink/renderer/core/html/parser/html_view_source_parser.h"
#include <memory>
#include "third_party/blink/renderer/core/dom/dom_implementation.h"
#include "third_party/blink/renderer/core/html/parser/html_parser_idioms.h"
#include "third_party/blink/renderer/core/html/parser/html_parser_options.h"
#include "third_party/blink/renderer/core/html/parser/html_token.h"
#include "third_party/blink/renderer/core/html/parser/xss_auditor_delegate.h"
namespace blink {
HTMLViewSourceParser::HTMLViewSourceParser(HTMLViewSourceDocument& document,
const String& mime_type)
: DecodedDataDocumentParser(document),
tokenizer_(HTMLTokenizer::Create(HTMLParserOptions(&document))) {
if (mime_type != "text/html" && !DOMImplementation::IsXMLMIMEType(mime_type))
tokenizer_->SetState(HTMLTokenizer::kPLAINTEXTState);
}
void HTMLViewSourceParser::PumpTokenizer() {
xss_auditor_.Init(GetDocument(), nullptr);
while (true) {
source_tracker_.Start(input_.Current(), tokenizer_.get(), token_);
if (!tokenizer_->NextToken(input_.Current(), token_))
return;
source_tracker_.end(input_.Current(), tokenizer_.get(), token_);
std::unique_ptr<XSSInfo> xss_info =
xss_auditor_.FilterToken(FilterTokenRequest(
token_, source_tracker_, tokenizer_->ShouldAllowCDATA()));
HTMLViewSourceDocument::SourceAnnotation annotation =
xss_info ? HTMLViewSourceDocument::kAnnotateSourceAsXSS
: HTMLViewSourceDocument::kAnnotateSourceAsSafe;
GetDocument()->AddSource(source_tracker_.SourceForToken(token_), token_,
annotation);
// FIXME: The tokenizer should do this work for us.
if (token_.GetType() == HTMLToken::kStartTag)
tokenizer_->UpdateStateFor(
AttemptStaticStringCreation(token_.GetName(), kLikely8Bit));
token_.Clear();
}
}
void HTMLViewSourceParser::Append(const String& input) {
input_.AppendToEnd(input);
PumpTokenizer();
}
void HTMLViewSourceParser::Finish() {
Flush();
if (!input_.HaveSeenEndOfFile())
input_.MarkEndOfFile();
if (!IsDetached()) {
PumpTokenizer();
GetDocument()->FinishedParsing();
}
}
} // namespace blink