blob: 7ceaabe6d582fc797f5350d51b1ba5743c7f734d [file] [log] [blame]
/*
* Copyright (C) 2010 Google, Inc. All Rights Reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "config.h"
#include "core/dom/DecodedDataDocumentParser.h"
#include "bindings/v8/ExceptionStatePlaceholder.h"
#include "core/dom/Document.h"
#include "core/dom/Element.h"
#include "core/loader/TextResourceDecoder.h"
#include "wtf/text/TextEncodingRegistry.h"
namespace WebCore {
namespace {
class TitleEncodingFixer {
public:
explicit TitleEncodingFixer(Document* document)
: m_document(document)
, m_firstEncoding(document->decoder()->encoding())
{
}
// It's possible for the encoding of the document to change while we're decoding
// data. That can only occur while we're processing the <head> portion of the
// document. There isn't much user-visible content in the <head>, but there is
// the <title> element. This function detects that situation and re-decodes the
// document's title so that the user doesn't see an incorrectly decoded title
// in the title bar.
inline void fixTitleEncodingIfNeeded()
{
if (m_firstEncoding == m_document->decoder()->encoding())
return; // In the common case, the encoding doesn't change and there isn't any work to do.
fixTitleEncoding();
}
private:
void fixTitleEncoding();
Document* m_document;
WTF::TextEncoding m_firstEncoding;
};
void TitleEncodingFixer::fixTitleEncoding()
{
RefPtr<Element> titleElement = m_document->titleElement();
if (!titleElement
|| titleElement->firstElementChild()
|| m_firstEncoding != Latin1Encoding()
|| !titleElement->textContent().containsOnlyLatin1())
return; // Either we don't have a title yet or something bizzare as happened and we give up.
CString originalBytes = titleElement->textContent().latin1();
OwnPtr<TextCodec> codec = newTextCodec(m_document->decoder()->encoding());
String correctlyDecodedTitle = codec->decode(originalBytes.data(), originalBytes.length(), true);
titleElement->setTextContent(correctlyDecodedTitle, IGNORE_EXCEPTION);
}
}
DecodedDataDocumentParser::DecodedDataDocumentParser(Document* document)
: DocumentParser(document)
{
}
size_t DecodedDataDocumentParser::appendBytes(const char* data, size_t length)
{
if (!length)
return 0;
TitleEncodingFixer encodingFixer(document());
String decoded = document()->decoder()->decode(data, length);
encodingFixer.fixTitleEncodingIfNeeded();
if (decoded.isEmpty())
return 0;
size_t consumedChars = decoded.length();
append(decoded.releaseImpl());
return consumedChars;
}
size_t DecodedDataDocumentParser::flush()
{
// null decoder indicates there is no data received.
// We have nothing to do in that case.
TextResourceDecoder* decoder = document()->decoder();
if (!decoder)
return 0;
String remainingData = decoder->flush();
if (remainingData.isEmpty())
return 0;
size_t consumedChars = remainingData.length();
append(remainingData.releaseImpl());
return consumedChars;
}
};