|  | /* | 
|  | * Copyright (C) 2015 Andy VanWagoner (andy@vanwagoner.family) | 
|  | * Copyright (C) 2015 Sukolsak Sakshuwong (sukolsak@gmail.com) | 
|  | * Copyright (C) 2016 Apple Inc. All rights reserved. | 
|  | * | 
|  | * Redistribution and use in source and binary forms, with or without | 
|  | * modification, are permitted provided that the following conditions | 
|  | * are met: | 
|  | * 1. Redistributions of source code must retain the above copyright | 
|  | *    notice, this list of conditions and the following disclaimer. | 
|  | * 2. Redistributions in binary form must reproduce the above copyright | 
|  | *    notice, this list of conditions and the following disclaimer in the | 
|  | *    documentation and/or other materials provided with the distribution. | 
|  | * | 
|  | * THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS'' | 
|  | * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, | 
|  | * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR | 
|  | * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS | 
|  | * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | 
|  | * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | 
|  | * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | 
|  | * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | 
|  | * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | 
|  | * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF | 
|  | * THE POSSIBILITY OF SUCH DAMAGE. | 
|  | */ | 
|  |  | 
|  | #include "config.h" | 
|  | #include "IntlObject.h" | 
|  |  | 
|  | #if ENABLE(INTL) | 
|  |  | 
|  | #include "Error.h" | 
|  | #include "FunctionPrototype.h" | 
|  | #include "IntlCollator.h" | 
|  | #include "IntlCollatorConstructor.h" | 
|  | #include "IntlCollatorPrototype.h" | 
|  | #include "IntlDateTimeFormat.h" | 
|  | #include "IntlDateTimeFormatConstructor.h" | 
|  | #include "IntlDateTimeFormatPrototype.h" | 
|  | #include "IntlNumberFormat.h" | 
|  | #include "IntlNumberFormatConstructor.h" | 
|  | #include "IntlNumberFormatPrototype.h" | 
|  | #include "IntlPluralRules.h" | 
|  | #include "IntlPluralRulesConstructor.h" | 
|  | #include "IntlPluralRulesPrototype.h" | 
|  | #include "JSCInlines.h" | 
|  | #include "JSCJSValueInlines.h" | 
|  | #include "Lookup.h" | 
|  | #include "ObjectPrototype.h" | 
|  | #include "Options.h" | 
|  | #include <unicode/uloc.h> | 
|  | #include <unicode/unumsys.h> | 
|  | #include <wtf/Assertions.h> | 
|  | #include <wtf/Language.h> | 
|  | #include <wtf/NeverDestroyed.h> | 
|  | #include <wtf/text/StringBuilder.h> | 
|  |  | 
|  | namespace JSC { | 
|  |  | 
|  | STATIC_ASSERT_IS_TRIVIALLY_DESTRUCTIBLE(IntlObject); | 
|  |  | 
|  | static EncodedJSValue JSC_HOST_CALL intlObjectFuncGetCanonicalLocales(ExecState*); | 
|  |  | 
|  | } | 
|  |  | 
|  | namespace JSC { | 
|  |  | 
|  | struct MatcherResult { | 
|  | String locale; | 
|  | String extension; | 
|  | size_t extensionIndex; | 
|  | }; | 
|  |  | 
|  | const ClassInfo IntlObject::s_info = { "Object", &Base::s_info, nullptr, nullptr, CREATE_METHOD_TABLE(IntlObject) }; | 
|  |  | 
|  | IntlObject::IntlObject(VM& vm, Structure* structure) | 
|  | : JSNonFinalObject(vm, structure) | 
|  | { | 
|  | } | 
|  |  | 
|  | IntlObject* IntlObject::create(VM& vm, JSGlobalObject* globalObject, Structure* structure) | 
|  | { | 
|  | IntlObject* object = new (NotNull, allocateCell<IntlObject>(vm.heap)) IntlObject(vm, structure); | 
|  | object->finishCreation(vm, globalObject); | 
|  | return object; | 
|  | } | 
|  |  | 
|  | void IntlObject::finishCreation(VM& vm, JSGlobalObject* globalObject) | 
|  | { | 
|  | Base::finishCreation(vm); | 
|  | ASSERT(inherits(vm, info())); | 
|  |  | 
|  | // Set up Collator. | 
|  | IntlCollatorPrototype* collatorPrototype = IntlCollatorPrototype::create(vm, globalObject, IntlCollatorPrototype::createStructure(vm, globalObject, globalObject->objectPrototype())); | 
|  | Structure* collatorStructure = IntlCollator::createStructure(vm, globalObject, collatorPrototype); | 
|  | IntlCollatorConstructor* collatorConstructor = IntlCollatorConstructor::create(vm, IntlCollatorConstructor::createStructure(vm, globalObject, globalObject->functionPrototype()), collatorPrototype, collatorStructure); | 
|  |  | 
|  | // Set up NumberFormat. | 
|  | IntlNumberFormatPrototype* numberFormatPrototype = IntlNumberFormatPrototype::create(vm, globalObject, IntlNumberFormatPrototype::createStructure(vm, globalObject, globalObject->objectPrototype())); | 
|  | Structure* numberFormatStructure = IntlNumberFormat::createStructure(vm, globalObject, numberFormatPrototype); | 
|  | IntlNumberFormatConstructor* numberFormatConstructor = IntlNumberFormatConstructor::create(vm, IntlNumberFormatConstructor::createStructure(vm, globalObject, globalObject->functionPrototype()), numberFormatPrototype, numberFormatStructure); | 
|  |  | 
|  | // Set up DateTimeFormat. | 
|  | IntlDateTimeFormatPrototype* dateTimeFormatPrototype = IntlDateTimeFormatPrototype::create(vm, globalObject, IntlDateTimeFormatPrototype::createStructure(vm, globalObject, globalObject->objectPrototype())); | 
|  | Structure* dateTimeFormatStructure = IntlDateTimeFormat::createStructure(vm, globalObject, dateTimeFormatPrototype); | 
|  | IntlDateTimeFormatConstructor* dateTimeFormatConstructor = IntlDateTimeFormatConstructor::create(vm, IntlDateTimeFormatConstructor::createStructure(vm, globalObject, globalObject->functionPrototype()), dateTimeFormatPrototype, dateTimeFormatStructure); | 
|  |  | 
|  | // Set up PluralRules. | 
|  | IntlPluralRulesPrototype* pluralRulesPrototype = IntlPluralRulesPrototype::create(vm, globalObject, IntlPluralRulesPrototype::createStructure(vm, globalObject, globalObject->objectPrototype())); | 
|  | Structure* pluralRulesStructure = IntlPluralRules::createStructure(vm, globalObject, pluralRulesPrototype); | 
|  | IntlPluralRulesConstructor* pluralRulesConstructor = IntlPluralRulesConstructor::create(vm, IntlPluralRulesConstructor::createStructure(vm, globalObject, globalObject->functionPrototype()), pluralRulesPrototype, pluralRulesStructure); | 
|  |  | 
|  | // Constructor Properties of the Intl Object | 
|  | // https://tc39.github.io/ecma402/#sec-constructor-properties-of-the-intl-object | 
|  | putDirectWithoutTransition(vm, vm.propertyNames->Collator, collatorConstructor, static_cast<unsigned>(PropertyAttribute::DontEnum)); | 
|  | putDirectWithoutTransition(vm, vm.propertyNames->NumberFormat, numberFormatConstructor, static_cast<unsigned>(PropertyAttribute::DontEnum)); | 
|  | putDirectWithoutTransition(vm, vm.propertyNames->DateTimeFormat, dateTimeFormatConstructor, static_cast<unsigned>(PropertyAttribute::DontEnum)); | 
|  | if (Options::useIntlPluralRules()) | 
|  | putDirectWithoutTransition(vm, vm.propertyNames->PluralRules, pluralRulesConstructor, static_cast<unsigned>(PropertyAttribute::DontEnum)); | 
|  |  | 
|  | // Function Properties of the Intl Object | 
|  | // https://tc39.github.io/ecma402/#sec-function-properties-of-the-intl-object | 
|  | putDirectNativeFunction(vm, globalObject, Identifier::fromString(&vm, "getCanonicalLocales"), 1, intlObjectFuncGetCanonicalLocales, NoIntrinsic, static_cast<unsigned>(PropertyAttribute::DontEnum)); | 
|  | } | 
|  |  | 
|  | Structure* IntlObject::createStructure(VM& vm, JSGlobalObject* globalObject, JSValue prototype) | 
|  | { | 
|  | return Structure::create(vm, globalObject, prototype, TypeInfo(ObjectType, StructureFlags), info()); | 
|  | } | 
|  |  | 
|  | void convertICULocaleToBCP47LanguageTag(String& locale) | 
|  | { | 
|  | locale.replace('_', '-'); | 
|  | } | 
|  |  | 
|  | bool intlBooleanOption(ExecState& state, JSValue options, PropertyName property, bool& usesFallback) | 
|  | { | 
|  | // GetOption (options, property, type="boolean", values, fallback) | 
|  | // https://tc39.github.io/ecma402/#sec-getoption | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | JSObject* opts = options.toObject(&state); | 
|  | RETURN_IF_EXCEPTION(scope, false); | 
|  |  | 
|  | JSValue value = opts->get(&state, property); | 
|  | RETURN_IF_EXCEPTION(scope, false); | 
|  |  | 
|  | if (!value.isUndefined()) { | 
|  | bool booleanValue = value.toBoolean(&state); | 
|  | usesFallback = false; | 
|  | return booleanValue; | 
|  | } | 
|  |  | 
|  | // Because fallback can be undefined, we let the caller handle it instead. | 
|  | usesFallback = true; | 
|  | return false; | 
|  | } | 
|  |  | 
|  | String intlStringOption(ExecState& state, JSValue options, PropertyName property, std::initializer_list<const char*> values, const char* notFound, const char* fallback) | 
|  | { | 
|  | // GetOption (options, property, type="string", values, fallback) | 
|  | // https://tc39.github.io/ecma402/#sec-getoption | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | JSObject* opts = options.toObject(&state); | 
|  | RETURN_IF_EXCEPTION(scope, String()); | 
|  |  | 
|  | JSValue value = opts->get(&state, property); | 
|  | RETURN_IF_EXCEPTION(scope, String()); | 
|  |  | 
|  | if (!value.isUndefined()) { | 
|  | String stringValue = value.toWTFString(&state); | 
|  | RETURN_IF_EXCEPTION(scope, String()); | 
|  |  | 
|  | if (values.size() && std::find(values.begin(), values.end(), stringValue) == values.end()) { | 
|  | throwException(&state, scope, createRangeError(&state, notFound)); | 
|  | return { }; | 
|  | } | 
|  | return stringValue; | 
|  | } | 
|  |  | 
|  | return fallback; | 
|  | } | 
|  |  | 
|  | unsigned intlNumberOption(ExecState& state, JSValue options, PropertyName property, unsigned minimum, unsigned maximum, unsigned fallback) | 
|  | { | 
|  | // GetNumberOption (options, property, minimum, maximum, fallback) | 
|  | // https://tc39.github.io/ecma402/#sec-getnumberoption | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | JSObject* opts = options.toObject(&state); | 
|  | RETURN_IF_EXCEPTION(scope, 0); | 
|  |  | 
|  | JSValue value = opts->get(&state, property); | 
|  | RETURN_IF_EXCEPTION(scope, 0); | 
|  |  | 
|  | if (!value.isUndefined()) { | 
|  | double doubleValue = value.toNumber(&state); | 
|  | RETURN_IF_EXCEPTION(scope, 0); | 
|  |  | 
|  | if (!(doubleValue >= minimum && doubleValue <= maximum)) { | 
|  | throwException(&state, scope, createRangeError(&state, *property.publicName() + " is out of range")); | 
|  | return 0; | 
|  | } | 
|  | return static_cast<unsigned>(doubleValue); | 
|  | } | 
|  | return fallback; | 
|  | } | 
|  |  | 
|  | static String privateUseLangTag(const Vector<String>& parts, size_t startIndex) | 
|  | { | 
|  | size_t numParts = parts.size(); | 
|  | size_t currentIndex = startIndex; | 
|  |  | 
|  | // Check for privateuse. | 
|  | // privateuse = "x" 1*("-" (1*8alphanum)) | 
|  | StringBuilder privateuse; | 
|  | while (currentIndex < numParts) { | 
|  | const String& singleton = parts[currentIndex]; | 
|  | unsigned singletonLength = singleton.length(); | 
|  | bool isValid = (singletonLength == 1 && (singleton == "x" || singleton == "X")); | 
|  | if (!isValid) | 
|  | break; | 
|  |  | 
|  | if (currentIndex != startIndex) | 
|  | privateuse.append('-'); | 
|  |  | 
|  | ++currentIndex; | 
|  | unsigned numExtParts = 0; | 
|  | privateuse.append('x'); | 
|  | while (currentIndex < numParts) { | 
|  | const String& extPart = parts[currentIndex]; | 
|  | unsigned extPartLength = extPart.length(); | 
|  |  | 
|  | bool isValid = (extPartLength >= 1 && extPartLength <= 8 && extPart.isAllSpecialCharacters<isASCIIAlphanumeric>()); | 
|  | if (!isValid) | 
|  | break; | 
|  |  | 
|  | ++currentIndex; | 
|  | ++numExtParts; | 
|  | privateuse.append('-'); | 
|  | privateuse.append(extPart.convertToASCIILowercase()); | 
|  | } | 
|  |  | 
|  | // Requires at least one production. | 
|  | if (!numExtParts) | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | // Leftovers makes it invalid. | 
|  | if (currentIndex < numParts) | 
|  | return String(); | 
|  |  | 
|  | return privateuse.toString(); | 
|  | } | 
|  |  | 
|  | static String canonicalLangTag(const Vector<String>& parts) | 
|  | { | 
|  | ASSERT(!parts.isEmpty()); | 
|  |  | 
|  | // Follows the grammar at https://www.rfc-editor.org/rfc/bcp/bcp47.txt | 
|  | // langtag = language ["-" script] ["-" region] *("-" variant) *("-" extension) ["-" privateuse] | 
|  |  | 
|  | size_t numParts = parts.size(); | 
|  | // Check for language. | 
|  | // language = 2*3ALPHA ["-" extlang] / 4ALPHA / 5*8ALPHA | 
|  | size_t currentIndex = 0; | 
|  | const String& language = parts[currentIndex]; | 
|  | unsigned languageLength = language.length(); | 
|  | bool canHaveExtlang = languageLength >= 2 && languageLength <= 3; | 
|  | bool isValidLanguage = languageLength >= 2 && languageLength <= 8 && language.isAllSpecialCharacters<isASCIIAlpha>(); | 
|  | if (!isValidLanguage) | 
|  | return String(); | 
|  |  | 
|  | ++currentIndex; | 
|  | StringBuilder canonical; | 
|  | canonical.append(language.convertToASCIILowercase()); | 
|  |  | 
|  | // Check for extlang. | 
|  | // extlang = 3ALPHA *2("-" 3ALPHA) | 
|  | if (canHaveExtlang) { | 
|  | for (unsigned times = 0; times < 3 && currentIndex < numParts; ++times) { | 
|  | const String& extlang = parts[currentIndex]; | 
|  | unsigned extlangLength = extlang.length(); | 
|  | if (extlangLength == 3 && extlang.isAllSpecialCharacters<isASCIIAlpha>()) { | 
|  | ++currentIndex; | 
|  | canonical.append('-'); | 
|  | canonical.append(extlang.convertToASCIILowercase()); | 
|  | } else | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Check for script. | 
|  | // script = 4ALPHA | 
|  | if (currentIndex < numParts) { | 
|  | const String& script = parts[currentIndex]; | 
|  | unsigned scriptLength = script.length(); | 
|  | if (scriptLength == 4 && script.isAllSpecialCharacters<isASCIIAlpha>()) { | 
|  | ++currentIndex; | 
|  | canonical.append('-'); | 
|  | canonical.append(toASCIIUpper(script[0])); | 
|  | canonical.append(script.substring(1, 3).convertToASCIILowercase()); | 
|  | } | 
|  | } | 
|  |  | 
|  | // Check for region. | 
|  | // region = 2ALPHA / 3DIGIT | 
|  | if (currentIndex < numParts) { | 
|  | const String& region = parts[currentIndex]; | 
|  | unsigned regionLength = region.length(); | 
|  | bool isValidRegion = ( | 
|  | (regionLength == 2 && region.isAllSpecialCharacters<isASCIIAlpha>()) | 
|  | || (regionLength == 3 && region.isAllSpecialCharacters<isASCIIDigit>()) | 
|  | ); | 
|  | if (isValidRegion) { | 
|  | ++currentIndex; | 
|  | canonical.append('-'); | 
|  | canonical.append(region.convertToASCIIUppercase()); | 
|  | } | 
|  | } | 
|  |  | 
|  | // Check for variant. | 
|  | // variant = 5*8alphanum / (DIGIT 3alphanum) | 
|  | HashSet<String> subtags; | 
|  | while (currentIndex < numParts) { | 
|  | const String& variant = parts[currentIndex]; | 
|  | unsigned variantLength = variant.length(); | 
|  | bool isValidVariant = ( | 
|  | (variantLength >= 5 && variantLength <= 8 && variant.isAllSpecialCharacters<isASCIIAlphanumeric>()) | 
|  | || (variantLength == 4 && isASCIIDigit(variant[0]) && variant.substring(1, 3).isAllSpecialCharacters<isASCIIAlphanumeric>()) | 
|  | ); | 
|  | if (!isValidVariant) | 
|  | break; | 
|  |  | 
|  | // Cannot include duplicate subtags (case insensitive). | 
|  | String lowerVariant = variant.convertToASCIILowercase(); | 
|  | if (!subtags.add(lowerVariant).isNewEntry) | 
|  | return String(); | 
|  |  | 
|  | ++currentIndex; | 
|  |  | 
|  | // Reordering variant subtags is not required in the spec. | 
|  | canonical.append('-'); | 
|  | canonical.append(lowerVariant); | 
|  | } | 
|  |  | 
|  | // Check for extension. | 
|  | // extension = singleton 1*("-" (2*8alphanum)) | 
|  | // singleton = alphanum except x or X | 
|  | subtags.clear(); | 
|  | Vector<String> extensions; | 
|  | while (currentIndex < numParts) { | 
|  | const String& possibleSingleton = parts[currentIndex]; | 
|  | unsigned singletonLength = possibleSingleton.length(); | 
|  | bool isValidSingleton = (singletonLength == 1 && possibleSingleton != "x" && possibleSingleton != "X" && isASCIIAlphanumeric(possibleSingleton[0])); | 
|  | if (!isValidSingleton) | 
|  | break; | 
|  |  | 
|  | // Cannot include duplicate singleton (case insensitive). | 
|  | String singleton = possibleSingleton.convertToASCIILowercase(); | 
|  | if (!subtags.add(singleton).isNewEntry) | 
|  | return String(); | 
|  |  | 
|  | ++currentIndex; | 
|  | int numExtParts = 0; | 
|  | StringBuilder extension; | 
|  | extension.append(singleton); | 
|  | while (currentIndex < numParts) { | 
|  | const String& extPart = parts[currentIndex]; | 
|  | unsigned extPartLength = extPart.length(); | 
|  |  | 
|  | bool isValid = (extPartLength >= 2 && extPartLength <= 8 && extPart.isAllSpecialCharacters<isASCIIAlphanumeric>()); | 
|  | if (!isValid) | 
|  | break; | 
|  |  | 
|  | ++currentIndex; | 
|  | ++numExtParts; | 
|  | extension.append('-'); | 
|  | extension.append(extPart.convertToASCIILowercase()); | 
|  | } | 
|  |  | 
|  | // Requires at least one production. | 
|  | if (!numExtParts) | 
|  | return String(); | 
|  |  | 
|  | extensions.append(extension.toString()); | 
|  | } | 
|  |  | 
|  | // Add extensions to canonical sorted by singleton. | 
|  | std::sort( | 
|  | extensions.begin(), | 
|  | extensions.end(), | 
|  | [] (const String& a, const String& b) -> bool { | 
|  | return a[0] < b[0]; | 
|  | } | 
|  | ); | 
|  | size_t numExtenstions = extensions.size(); | 
|  | for (size_t i = 0; i < numExtenstions; ++i) { | 
|  | canonical.append('-'); | 
|  | canonical.append(extensions[i]); | 
|  | } | 
|  |  | 
|  | // Check for privateuse. | 
|  | if (currentIndex < numParts) { | 
|  | String privateuse = privateUseLangTag(parts, currentIndex); | 
|  | if (privateuse.isNull()) | 
|  | return String(); | 
|  | canonical.append('-'); | 
|  | canonical.append(privateuse); | 
|  | } | 
|  |  | 
|  | // FIXME: Replace subtags with their preferred values. | 
|  |  | 
|  | return canonical.toString(); | 
|  | } | 
|  |  | 
|  | static String grandfatheredLangTag(const String& locale) | 
|  | { | 
|  | // grandfathered = irregular / regular | 
|  | // FIXME: convert to a compile time hash table if this is causing performance issues. | 
|  | HashMap<String, String> tagMap = { | 
|  | // Irregular. | 
|  | { ASCIILiteral("en-gb-oed"), ASCIILiteral("en-GB-oed") }, | 
|  | { ASCIILiteral("i-ami"), ASCIILiteral("ami") }, | 
|  | { ASCIILiteral("i-bnn"), ASCIILiteral("bnn") }, | 
|  | { ASCIILiteral("i-default"), ASCIILiteral("i-default") }, | 
|  | { ASCIILiteral("i-enochian"), ASCIILiteral("i-enochian") }, | 
|  | { ASCIILiteral("i-hak"), ASCIILiteral("hak") }, | 
|  | { ASCIILiteral("i-klingon"), ASCIILiteral("tlh") }, | 
|  | { ASCIILiteral("i-lux"), ASCIILiteral("lb") }, | 
|  | { ASCIILiteral("i-mingo"), ASCIILiteral("i-mingo") }, | 
|  | { ASCIILiteral("i-navajo"), ASCIILiteral("nv") }, | 
|  | { ASCIILiteral("i-pwn"), ASCIILiteral("pwn") }, | 
|  | { ASCIILiteral("i-tao"), ASCIILiteral("tao") }, | 
|  | { ASCIILiteral("i-tay"), ASCIILiteral("tay") }, | 
|  | { ASCIILiteral("i-tsu"), ASCIILiteral("tsu") }, | 
|  | { ASCIILiteral("sgn-be-fr"), ASCIILiteral("sfb") }, | 
|  | { ASCIILiteral("sgn-be-nl"), ASCIILiteral("vgt") }, | 
|  | { ASCIILiteral("sgn-ch-de"), ASCIILiteral("sgg") }, | 
|  | // Regular. | 
|  | { ASCIILiteral("art-lojban"), ASCIILiteral("jbo") }, | 
|  | { ASCIILiteral("cel-gaulish"), ASCIILiteral("cel-gaulish") }, | 
|  | { ASCIILiteral("no-bok"), ASCIILiteral("nb") }, | 
|  | { ASCIILiteral("no-nyn"), ASCIILiteral("nn") }, | 
|  | { ASCIILiteral("zh-guoyu"), ASCIILiteral("cmn") }, | 
|  | { ASCIILiteral("zh-hakka"), ASCIILiteral("hak") }, | 
|  | { ASCIILiteral("zh-min"), ASCIILiteral("zh-min") }, | 
|  | { ASCIILiteral("zh-min-nan"), ASCIILiteral("nan") }, | 
|  | { ASCIILiteral("zh-xiang"), ASCIILiteral("hsn") } | 
|  | }; | 
|  |  | 
|  | return tagMap.get(locale.convertToASCIILowercase()); | 
|  | } | 
|  |  | 
|  | static String canonicalizeLanguageTag(const String& locale) | 
|  | { | 
|  | // IsStructurallyValidLanguageTag (locale) | 
|  | // CanonicalizeLanguageTag (locale) | 
|  | // These are done one after another in CanonicalizeLocaleList, so they are combined here to reduce duplication. | 
|  | // https://www.rfc-editor.org/rfc/bcp/bcp47.txt | 
|  |  | 
|  | // Language-Tag = langtag / privateuse / grandfathered | 
|  | String grandfather = grandfatheredLangTag(locale); | 
|  | if (!grandfather.isNull()) | 
|  | return grandfather; | 
|  |  | 
|  | // FIXME: Replace redundant tags [RFC4647]. | 
|  |  | 
|  | Vector<String> parts; | 
|  | locale.split('-', true, parts); | 
|  | if (!parts.isEmpty()) { | 
|  | String langtag = canonicalLangTag(parts); | 
|  | if (!langtag.isNull()) | 
|  | return langtag; | 
|  |  | 
|  | String privateuse = privateUseLangTag(parts, 0); | 
|  | if (!privateuse.isNull()) | 
|  | return privateuse; | 
|  | } | 
|  |  | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | Vector<String> canonicalizeLocaleList(ExecState& state, JSValue locales) | 
|  | { | 
|  | // CanonicalizeLocaleList (locales) | 
|  | // https://tc39.github.io/ecma402/#sec-canonicalizelocalelist | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | JSGlobalObject* globalObject = state.jsCallee()->globalObject(); | 
|  | Vector<String> seen; | 
|  |  | 
|  | if (locales.isUndefined()) | 
|  | return seen; | 
|  |  | 
|  | JSObject* localesObject; | 
|  | if (locales.isString()) { | 
|  | JSArray* localesArray = JSArray::tryCreate(vm, globalObject->arrayStructureForIndexingTypeDuringAllocation(ArrayWithContiguous)); | 
|  | if (!localesArray) { | 
|  | throwOutOfMemoryError(&state, scope); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  | } | 
|  | localesArray->push(&state, locales); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | localesObject = localesArray; | 
|  | } else { | 
|  | localesObject = locales.toObject(&state); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  | } | 
|  |  | 
|  | // 6. Let len be ToLength(Get(O, "length")). | 
|  | JSValue lengthProperty = localesObject->get(&state, vm.propertyNames->length); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | double length = lengthProperty.toLength(&state); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | HashSet<String> seenSet; | 
|  | for (double k = 0; k < length; ++k) { | 
|  | bool kPresent = localesObject->hasProperty(&state, k); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | if (kPresent) { | 
|  | JSValue kValue = localesObject->get(&state, k); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | if (!kValue.isString() && !kValue.isObject()) { | 
|  | throwTypeError(&state, scope, ASCIILiteral("locale value must be a string or object")); | 
|  | return Vector<String>(); | 
|  | } | 
|  |  | 
|  | JSString* tag = kValue.toString(&state); | 
|  | RETURN_IF_EXCEPTION(scope, Vector<String>()); | 
|  |  | 
|  | String canonicalizedTag = canonicalizeLanguageTag(tag->value(&state)); | 
|  | if (canonicalizedTag.isNull()) { | 
|  | throwException(&state, scope, createRangeError(&state, String::format("invalid language tag: %s", tag->value(&state).utf8().data()))); | 
|  | return Vector<String>(); | 
|  | } | 
|  |  | 
|  | if (seenSet.add(canonicalizedTag).isNewEntry) | 
|  | seen.append(canonicalizedTag); | 
|  | } | 
|  | } | 
|  |  | 
|  | return seen; | 
|  | } | 
|  |  | 
|  | String bestAvailableLocale(const HashSet<String>& availableLocales, const String& locale) | 
|  | { | 
|  | // BestAvailableLocale (availableLocales, locale) | 
|  | // https://tc39.github.io/ecma402/#sec-bestavailablelocale | 
|  |  | 
|  | String candidate = locale; | 
|  | while (!candidate.isEmpty()) { | 
|  | if (availableLocales.contains(candidate)) | 
|  | return candidate; | 
|  |  | 
|  | size_t pos = candidate.reverseFind('-'); | 
|  | if (pos == notFound) | 
|  | return String(); | 
|  |  | 
|  | if (pos >= 2 && candidate[pos - 2] == '-') | 
|  | pos -= 2; | 
|  |  | 
|  | candidate = candidate.substring(0, pos); | 
|  | } | 
|  |  | 
|  | return String(); | 
|  | } | 
|  |  | 
|  | String defaultLocale(ExecState& state) | 
|  | { | 
|  | // DefaultLocale () | 
|  | // https://tc39.github.io/ecma402/#sec-defaultlocale | 
|  |  | 
|  | // WebCore's global objects will have their own ideas of how to determine the language. It may | 
|  | // be determined by WebCore-specific logic like some WK settings. Usually this will return the | 
|  | // same thing as userPreferredLanguages()[0]. | 
|  | if (auto defaultLanguage = state.jsCallee()->globalObject()->globalObjectMethodTable()->defaultLanguage) { | 
|  | String locale = defaultLanguage(); | 
|  | if (!locale.isEmpty()) | 
|  | return canonicalizeLanguageTag(locale); | 
|  | } | 
|  |  | 
|  | Vector<String> languages = userPreferredLanguages(); | 
|  | if (!languages.isEmpty() && !languages[0].isEmpty()) | 
|  | return canonicalizeLanguageTag(languages[0]); | 
|  |  | 
|  | // If all else fails, ask ICU. It will probably say something bogus like en_us even if the user | 
|  | // has configured some other language, but being wrong is better than crashing. | 
|  | String locale = uloc_getDefault(); | 
|  | convertICULocaleToBCP47LanguageTag(locale); | 
|  | return locale; | 
|  | } | 
|  |  | 
|  | String removeUnicodeLocaleExtension(const String& locale) | 
|  | { | 
|  | Vector<String> parts; | 
|  | locale.split('-', parts); | 
|  | StringBuilder builder; | 
|  | size_t partsSize = parts.size(); | 
|  | if (partsSize > 0) | 
|  | builder.append(parts[0]); | 
|  | for (size_t p = 1; p < partsSize; ++p) { | 
|  | if (parts[p] == "u" && p + 1 < partsSize) { | 
|  | // Skip the u- and anything that follows until another singleton. | 
|  | // While the next part is part of the unicode extension, skip it. | 
|  | while (p + 1 < partsSize && parts[p + 1].length() > 1) | 
|  | ++p; | 
|  | } else { | 
|  | builder.append('-'); | 
|  | builder.append(parts[p]); | 
|  | } | 
|  | } | 
|  | return builder.toString(); | 
|  | } | 
|  |  | 
|  | static MatcherResult lookupMatcher(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales) | 
|  | { | 
|  | // LookupMatcher (availableLocales, requestedLocales) | 
|  | // https://tc39.github.io/ecma402/#sec-lookupmatcher | 
|  |  | 
|  | String locale; | 
|  | String noExtensionsLocale; | 
|  | String availableLocale; | 
|  | for (size_t i = 0; i < requestedLocales.size() && availableLocale.isNull(); ++i) { | 
|  | locale = requestedLocales[i]; | 
|  | noExtensionsLocale = removeUnicodeLocaleExtension(locale); | 
|  | availableLocale = bestAvailableLocale(availableLocales, noExtensionsLocale); | 
|  | } | 
|  |  | 
|  | MatcherResult result; | 
|  | if (!availableLocale.isNull()) { | 
|  | result.locale = availableLocale; | 
|  | if (locale != noExtensionsLocale) { | 
|  | size_t extensionIndex = locale.find("-u-"); | 
|  | RELEASE_ASSERT(extensionIndex != notFound); | 
|  |  | 
|  | size_t extensionLength = locale.length() - extensionIndex; | 
|  | size_t end = extensionIndex + 3; | 
|  | while (end < locale.length()) { | 
|  | end = locale.find('-', end); | 
|  | if (end == notFound) | 
|  | break; | 
|  | if (end + 2 < locale.length() && locale[end + 2] == '-') { | 
|  | extensionLength = end - extensionIndex; | 
|  | break; | 
|  | } | 
|  | end++; | 
|  | } | 
|  | result.extension = locale.substring(extensionIndex, extensionLength); | 
|  | result.extensionIndex = extensionIndex; | 
|  | } | 
|  | } else | 
|  | result.locale = defaultLocale(state); | 
|  | return result; | 
|  | } | 
|  |  | 
|  | static MatcherResult bestFitMatcher(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales) | 
|  | { | 
|  | // BestFitMatcher (availableLocales, requestedLocales) | 
|  | // https://tc39.github.io/ecma402/#sec-bestfitmatcher | 
|  |  | 
|  | // FIXME: Implement something better than lookup. | 
|  | return lookupMatcher(state, availableLocales, requestedLocales); | 
|  | } | 
|  |  | 
|  | static void unicodeExtensionSubTags(const String& extension, Vector<String>& subtags) | 
|  | { | 
|  | // UnicodeExtensionSubtags (extension) | 
|  | // https://tc39.github.io/ecma402/#sec-unicodeextensionsubtags | 
|  |  | 
|  | auto extensionLength = extension.length(); | 
|  | if (extensionLength < 3) | 
|  | return; | 
|  |  | 
|  | size_t subtagStart = 3; // Skip initial -u-. | 
|  | size_t valueStart = 3; | 
|  | bool isLeading = true; | 
|  | for (size_t index = subtagStart; index < extensionLength; ++index) { | 
|  | if (extension[index] == '-') { | 
|  | if (index - subtagStart == 2) { | 
|  | // Tag is a key, first append prior key's value if there is one. | 
|  | if (subtagStart - valueStart > 1) | 
|  | subtags.append(extension.substring(valueStart, subtagStart - valueStart - 1)); | 
|  | subtags.append(extension.substring(subtagStart, index - subtagStart)); | 
|  | valueStart = index + 1; | 
|  | isLeading = false; | 
|  | } else if (isLeading) { | 
|  | // Leading subtags before first key. | 
|  | subtags.append(extension.substring(subtagStart, index - subtagStart)); | 
|  | valueStart = index + 1; | 
|  | } | 
|  | subtagStart = index + 1; | 
|  | } | 
|  | } | 
|  | if (extensionLength - subtagStart == 2) { | 
|  | // Trailing an extension key, first append prior key's value if there is one. | 
|  | if (subtagStart - valueStart > 1) | 
|  | subtags.append(extension.substring(valueStart, subtagStart - valueStart - 1)); | 
|  | valueStart = subtagStart; | 
|  | } | 
|  | // Append final key's value. | 
|  | subtags.append(extension.substring(valueStart, extensionLength - valueStart)); | 
|  | } | 
|  |  | 
|  | HashMap<String, String> resolveLocale(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales, const HashMap<String, String>& options, const char* const relevantExtensionKeys[], size_t relevantExtensionKeyCount, Vector<String> (*localeData)(const String&, size_t)) | 
|  | { | 
|  | // ResolveLocale (availableLocales, requestedLocales, options, relevantExtensionKeys, localeData) | 
|  | // https://tc39.github.io/ecma402/#sec-resolvelocale | 
|  |  | 
|  | const String& matcher = options.get(ASCIILiteral("localeMatcher")); | 
|  | MatcherResult matcherResult = (matcher == "lookup") | 
|  | ? lookupMatcher(state, availableLocales, requestedLocales) | 
|  | : bestFitMatcher(state, availableLocales, requestedLocales); | 
|  |  | 
|  | String foundLocale = matcherResult.locale; | 
|  |  | 
|  | Vector<String> extensionSubtags; | 
|  | if (!matcherResult.extension.isNull()) | 
|  | unicodeExtensionSubTags(matcherResult.extension, extensionSubtags); | 
|  |  | 
|  | HashMap<String, String> result; | 
|  | result.add(ASCIILiteral("dataLocale"), foundLocale); | 
|  |  | 
|  | String supportedExtension = ASCIILiteral("-u"); | 
|  | for (size_t keyIndex = 0; keyIndex < relevantExtensionKeyCount; ++keyIndex) { | 
|  | const char* key = relevantExtensionKeys[keyIndex]; | 
|  | Vector<String> keyLocaleData = localeData(foundLocale, keyIndex); | 
|  | ASSERT(!keyLocaleData.isEmpty()); | 
|  |  | 
|  | String value = keyLocaleData[0]; | 
|  | String supportedExtensionAddition; | 
|  |  | 
|  | if (!extensionSubtags.isEmpty()) { | 
|  | size_t keyPos = extensionSubtags.find(key); | 
|  | if (keyPos != notFound) { | 
|  | if (keyPos + 1 < extensionSubtags.size() && extensionSubtags[keyPos + 1].length() > 2) { | 
|  | const String& requestedValue = extensionSubtags[keyPos + 1]; | 
|  | if (keyLocaleData.contains(requestedValue)) { | 
|  | value = requestedValue; | 
|  | supportedExtensionAddition = makeString('-', key, '-', value); | 
|  | } | 
|  | } else if (keyLocaleData.contains(static_cast<String>(ASCIILiteral("true")))) { | 
|  | value = ASCIILiteral("true"); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | HashMap<String, String>::const_iterator iterator = options.find(key); | 
|  | if (iterator != options.end()) { | 
|  | const String& optionsValue = iterator->value; | 
|  | if (!optionsValue.isNull() && keyLocaleData.contains(optionsValue)) { | 
|  | if (optionsValue != value) { | 
|  | value = optionsValue; | 
|  | supportedExtensionAddition = String(); | 
|  | } | 
|  | } | 
|  | } | 
|  | result.add(key, value); | 
|  | supportedExtension.append(supportedExtensionAddition); | 
|  | } | 
|  |  | 
|  | if (supportedExtension.length() > 2) { | 
|  | String preExtension = foundLocale.substring(0, matcherResult.extensionIndex); | 
|  | String postExtension = foundLocale.substring(matcherResult.extensionIndex); | 
|  | foundLocale = preExtension + supportedExtension + postExtension; | 
|  | } | 
|  |  | 
|  | result.add(ASCIILiteral("locale"), foundLocale); | 
|  | return result; | 
|  | } | 
|  |  | 
|  | static JSArray* lookupSupportedLocales(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales) | 
|  | { | 
|  | // LookupSupportedLocales (availableLocales, requestedLocales) | 
|  | // https://tc39.github.io/ecma402/#sec-lookupsupportedlocales | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | size_t len = requestedLocales.size(); | 
|  | JSGlobalObject* globalObject = state.jsCallee()->globalObject(); | 
|  | JSArray* subset = JSArray::tryCreate(vm, globalObject->arrayStructureForIndexingTypeDuringAllocation(ArrayWithUndecided), 0); | 
|  | if (!subset) { | 
|  | throwOutOfMemoryError(&state, scope); | 
|  | return nullptr; | 
|  | } | 
|  |  | 
|  | for (size_t k = 0; k < len; ++k) { | 
|  | const String& locale = requestedLocales[k]; | 
|  | String noExtensionsLocale = removeUnicodeLocaleExtension(locale); | 
|  | String availableLocale = bestAvailableLocale(availableLocales, noExtensionsLocale); | 
|  | if (!availableLocale.isNull()) { | 
|  | subset->push(&state, jsString(&state, locale)); | 
|  | RETURN_IF_EXCEPTION(scope, nullptr); | 
|  | } | 
|  | } | 
|  |  | 
|  | return subset; | 
|  | } | 
|  |  | 
|  | static JSArray* bestFitSupportedLocales(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales) | 
|  | { | 
|  | // BestFitSupportedLocales (availableLocales, requestedLocales) | 
|  | // https://tc39.github.io/ecma402/#sec-bestfitsupportedlocales | 
|  |  | 
|  | // FIXME: Implement something better than lookup. | 
|  | return lookupSupportedLocales(state, availableLocales, requestedLocales); | 
|  | } | 
|  |  | 
|  | JSValue supportedLocales(ExecState& state, const HashSet<String>& availableLocales, const Vector<String>& requestedLocales, JSValue options) | 
|  | { | 
|  | // SupportedLocales (availableLocales, requestedLocales, options) | 
|  | // https://tc39.github.io/ecma402/#sec-supportedlocales | 
|  |  | 
|  | VM& vm = state.vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  | String matcher; | 
|  |  | 
|  | if (!options.isUndefined()) { | 
|  | matcher = intlStringOption(state, options, vm.propertyNames->localeMatcher, { "lookup", "best fit" }, "localeMatcher must be either \"lookup\" or \"best fit\"", "best fit"); | 
|  | RETURN_IF_EXCEPTION(scope, JSValue()); | 
|  | } else | 
|  | matcher = ASCIILiteral("best fit"); | 
|  |  | 
|  | JSArray* supportedLocales = (matcher == "best fit") | 
|  | ? bestFitSupportedLocales(state, availableLocales, requestedLocales) | 
|  | : lookupSupportedLocales(state, availableLocales, requestedLocales); | 
|  | RETURN_IF_EXCEPTION(scope, JSValue()); | 
|  |  | 
|  | PropertyNameArray keys(&vm, PropertyNameMode::Strings, PrivateSymbolMode::Exclude); | 
|  | supportedLocales->getOwnPropertyNames(supportedLocales, &state, keys, EnumerationMode()); | 
|  | RETURN_IF_EXCEPTION(scope, JSValue()); | 
|  |  | 
|  | PropertyDescriptor desc; | 
|  | desc.setConfigurable(false); | 
|  | desc.setWritable(false); | 
|  |  | 
|  | size_t len = keys.size(); | 
|  | for (size_t i = 0; i < len; ++i) { | 
|  | supportedLocales->defineOwnProperty(supportedLocales, &state, keys[i], desc, true); | 
|  | RETURN_IF_EXCEPTION(scope, JSValue()); | 
|  | } | 
|  |  | 
|  | return supportedLocales; | 
|  | } | 
|  |  | 
|  | Vector<String> numberingSystemsForLocale(const String& locale) | 
|  | { | 
|  | static NeverDestroyed<Vector<String>> cachedNumberingSystems; | 
|  | Vector<String>& availableNumberingSystems = cachedNumberingSystems.get(); | 
|  |  | 
|  | if (UNLIKELY(availableNumberingSystems.isEmpty())) { | 
|  | static Lock cachedNumberingSystemsMutex; | 
|  | std::lock_guard<Lock> lock(cachedNumberingSystemsMutex); | 
|  | if (availableNumberingSystems.isEmpty()) { | 
|  | UErrorCode status = U_ZERO_ERROR; | 
|  | UEnumeration* numberingSystemNames = unumsys_openAvailableNames(&status); | 
|  | ASSERT(U_SUCCESS(status)); | 
|  |  | 
|  | int32_t resultLength; | 
|  | // Numbering system names are always ASCII, so use char[]. | 
|  | while (const char* result = uenum_next(numberingSystemNames, &resultLength, &status)) { | 
|  | ASSERT(U_SUCCESS(status)); | 
|  | availableNumberingSystems.append(String(result, resultLength)); | 
|  | } | 
|  | uenum_close(numberingSystemNames); | 
|  | } | 
|  | } | 
|  |  | 
|  | UErrorCode status = U_ZERO_ERROR; | 
|  | UNumberingSystem* defaultSystem = unumsys_open(locale.utf8().data(), &status); | 
|  | ASSERT(U_SUCCESS(status)); | 
|  | String defaultSystemName(unumsys_getName(defaultSystem)); | 
|  | unumsys_close(defaultSystem); | 
|  |  | 
|  | Vector<String> numberingSystems({ defaultSystemName }); | 
|  | numberingSystems.appendVector(availableNumberingSystems); | 
|  | return numberingSystems; | 
|  | } | 
|  |  | 
|  | EncodedJSValue JSC_HOST_CALL intlObjectFuncGetCanonicalLocales(ExecState* state) | 
|  | { | 
|  | // Intl.getCanonicalLocales(locales) | 
|  | // https://tc39.github.io/ecma402/#sec-intl.getcanonicallocales | 
|  |  | 
|  | VM& vm = state->vm(); | 
|  | auto scope = DECLARE_THROW_SCOPE(vm); | 
|  |  | 
|  | Vector<String> localeList = canonicalizeLocaleList(*state, state->argument(0)); | 
|  | RETURN_IF_EXCEPTION(scope, encodedJSValue()); | 
|  |  | 
|  | JSGlobalObject* globalObject = state->jsCallee()->globalObject(); | 
|  | JSArray* localeArray = JSArray::tryCreate(vm, globalObject->arrayStructureForIndexingTypeDuringAllocation(ArrayWithContiguous)); | 
|  | if (!localeArray) { | 
|  | throwOutOfMemoryError(state, scope); | 
|  | return encodedJSValue(); | 
|  | } | 
|  |  | 
|  | auto length = localeList.size(); | 
|  | for (size_t i = 0; i < length; ++i) { | 
|  | localeArray->push(state, jsString(state, localeList[i])); | 
|  | RETURN_IF_EXCEPTION(scope, encodedJSValue()); | 
|  | } | 
|  | return JSValue::encode(localeArray); | 
|  | } | 
|  |  | 
|  | } // namespace JSC | 
|  |  | 
|  | #endif // ENABLE(INTL) |