|  | /* | 
|  | * Copyright (C) 2012-2020 Apple Inc. All rights reserved. | 
|  | * | 
|  | * Redistribution and use in source and binary forms, with or without | 
|  | * modification, are permitted provided that the following conditions | 
|  | * are met: | 
|  | * 1. Redistributions of source code must retain the above copyright | 
|  | *    notice, this list of conditions and the following disclaimer. | 
|  | * 2. Redistributions in binary form must reproduce the above copyright | 
|  | *    notice, this list of conditions and the following disclaimer in the | 
|  | *    documentation and/or other materials provided with the distribution. | 
|  | * | 
|  | * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY | 
|  | * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
|  | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR | 
|  | * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL APPLE INC. OR | 
|  | * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | 
|  | * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | 
|  | * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | 
|  | * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY | 
|  | * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 
|  | * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
|  | * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
|  | */ | 
|  |  | 
|  | #include "config.h" | 
|  | #include "CodeBlockHash.h" | 
|  |  | 
|  | #include "SourceCode.h" | 
|  | #include <wtf/SHA1.h> | 
|  | #include <wtf/SixCharacterHash.h> | 
|  |  | 
|  | namespace JSC { | 
|  |  | 
|  | CodeBlockHash::CodeBlockHash(const char* string) | 
|  | : m_hash(sixCharacterHashStringToInteger(string)) | 
|  | { | 
|  | } | 
|  |  | 
|  | CodeBlockHash::CodeBlockHash(const SourceCode& sourceCode, CodeSpecializationKind kind) | 
|  | : m_hash(0) | 
|  | { | 
|  | SHA1 sha1; | 
|  |  | 
|  | // The maxSourceCodeLengthToHash is a heuristic to avoid crashing fuzzers | 
|  | // due to resource exhaustion. This is OK to do because: | 
|  | // 1. CodeBlockHash is not a critical hash. | 
|  | // 2. In practice, reasonable source code are not 500 MB or more long. | 
|  | // 3. And if they are that long, then we are still diversifying the hash on | 
|  | //    their length. But if they do collide, it's OK. | 
|  | // The only invariant here is that we should always produce the same hash | 
|  | // for the same source string. The algorithm below achieves that. | 
|  | ASSERT(sourceCode.length() >= 0); | 
|  | constexpr unsigned maxSourceCodeLengthToHash = 500 * MB; | 
|  | if (static_cast<unsigned>(sourceCode.length()) < maxSourceCodeLengthToHash) | 
|  | sha1.addBytes(sourceCode.toUTF8()); | 
|  | else { | 
|  | // Just hash with the length and samples of the source string instead. | 
|  | StringView str = sourceCode.provider()->source(); | 
|  | unsigned index = 0; | 
|  | unsigned oldIndex = 0; | 
|  | unsigned length = str.length(); | 
|  | unsigned step = (length >> 10) + 1; | 
|  |  | 
|  | sha1.addBytes(bitwise_cast<uint8_t*>(&length), sizeof(length)); | 
|  | do { | 
|  | UChar character = str[index]; | 
|  | sha1.addBytes(bitwise_cast<uint8_t*>(&character), sizeof(character)); | 
|  | oldIndex = index; | 
|  | index += step; | 
|  | } while (index > oldIndex && index < length); | 
|  | } | 
|  |  | 
|  | SHA1::Digest digest; | 
|  | sha1.computeHash(digest); | 
|  | m_hash = digest[0] | (digest[1] << 8) | (digest[2] << 16) | (digest[3] << 24); | 
|  |  | 
|  | if (m_hash == 0 || m_hash == 1) | 
|  | m_hash += 0x2d5a93d0; // Ensures a non-zero hash, and gets us #Azero0 for CodeForCall and #Azero1 for CodeForConstruct. | 
|  | static_assert(static_cast<unsigned>(CodeForCall) == 0); | 
|  | static_assert(static_cast<unsigned>(CodeForConstruct) == 1); | 
|  | m_hash ^= static_cast<unsigned>(kind); | 
|  | ASSERT(m_hash); | 
|  | } | 
|  |  | 
|  | void CodeBlockHash::dump(PrintStream& out) const | 
|  | { | 
|  | std::array<char, 7> buffer = integerToSixCharacterHashString(m_hash); | 
|  |  | 
|  | #if ASSERT_ENABLED | 
|  | CodeBlockHash recompute(buffer.data()); | 
|  | ASSERT(recompute == *this); | 
|  | #endif // ASSERT_ENABLED | 
|  |  | 
|  | out.print(buffer.data()); | 
|  | } | 
|  |  | 
|  | } // namespace JSC | 
|  |  |