| // Copyright 2017 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #ifndef V8_INTL_SUPPORT |
| #error Internationalization is expected to be enabled. |
| #endif // V8_INTL_SUPPORT |
| |
| #include "src/builtins/builtins-iterator-gen.h" |
| #include "src/builtins/builtins-utils-gen.h" |
| #include "src/codegen/code-stub-assembler-inl.h" |
| #include "src/objects/js-list-format-inl.h" |
| #include "src/objects/js-list-format.h" |
| #include "src/objects/objects-inl.h" |
| #include "src/objects/objects.h" |
| |
| namespace v8 { |
| namespace internal { |
| |
| #include "src/codegen/define-code-stub-assembler-macros.inc" |
| |
| class IntlBuiltinsAssembler : public CodeStubAssembler { |
| public: |
| explicit IntlBuiltinsAssembler(compiler::CodeAssemblerState* state) |
| : CodeStubAssembler(state) {} |
| |
| void ListFormatCommon(TNode<Context> context, TNode<Int32T> argc, |
| Runtime::FunctionId format_func_id, |
| const char* method_name); |
| |
| TNode<JSArray> AllocateEmptyJSArray(TNode<Context> context); |
| |
| TNode<IntPtrT> PointerToSeqStringData(TNode<String> seq_string) { |
| CSA_DCHECK(this, |
| IsSequentialStringInstanceType(LoadInstanceType(seq_string))); |
| static_assert(OFFSET_OF_DATA_START(SeqOneByteString) == |
| OFFSET_OF_DATA_START(SeqTwoByteString)); |
| return IntPtrAdd(BitcastTaggedToWord(seq_string), |
| IntPtrConstant(OFFSET_OF_DATA_START(SeqOneByteString) - |
| kHeapObjectTag)); |
| } |
| |
| TNode<Uint8T> GetChar(TNode<SeqOneByteString> seq_string, int index) { |
| size_t effective_offset = OFFSET_OF_DATA_START(SeqOneByteString) + |
| sizeof(SeqOneByteString::Char) * index - |
| kHeapObjectTag; |
| return Load<Uint8T>(seq_string, IntPtrConstant(effective_offset)); |
| } |
| |
| // Jumps to {target} if the first two characters of {seq_string} equal |
| // {pattern} ignoring case. |
| void JumpIfStartsWithIgnoreCase(TNode<SeqOneByteString> seq_string, |
| const char* pattern, Label* target) { |
| size_t effective_offset = |
| OFFSET_OF_DATA_START(SeqOneByteString) - kHeapObjectTag; |
| TNode<Uint16T> raw = |
| Load<Uint16T>(seq_string, IntPtrConstant(effective_offset)); |
| DCHECK_EQ(strlen(pattern), 2); |
| #if V8_TARGET_BIG_ENDIAN |
| int raw_pattern = (pattern[0] << 8) + pattern[1]; |
| #else |
| int raw_pattern = pattern[0] + (pattern[1] << 8); |
| #endif |
| GotoIf(Word32Equal(Word32Or(raw, Int32Constant(0x2020)), |
| Int32Constant(raw_pattern)), |
| target); |
| } |
| |
| TNode<BoolT> IsNonAlpha(TNode<Uint8T> character) { |
| return Uint32GreaterThan( |
| Int32Sub(Word32Or(character, Int32Constant(0x20)), Int32Constant('a')), |
| Int32Constant('z' - 'a')); |
| } |
| |
| enum class ToLowerCaseKind { |
| kToLowerCase, |
| kToLocaleLowerCase, |
| }; |
| void ToLowerCaseImpl(TNode<String> string, TNode<Object> maybe_locales, |
| TNode<Context> context, ToLowerCaseKind kind, |
| std::function<void(TNode<Object>)> ReturnFct); |
| }; |
| |
| TF_BUILTIN(StringToLowerCaseIntl, IntlBuiltinsAssembler) { |
| const auto string = Parameter<String>(Descriptor::kString); |
| ToLowerCaseImpl(string, TNode<Object>() /*maybe_locales*/, TNode<Context>(), |
| ToLowerCaseKind::kToLowerCase, |
| [this](TNode<Object> ret) { Return(ret); }); |
| } |
| |
| TF_BUILTIN(StringPrototypeToLowerCaseIntl, IntlBuiltinsAssembler) { |
| auto maybe_string = Parameter<Object>(Descriptor::kReceiver); |
| auto context = Parameter<Context>(Descriptor::kContext); |
| |
| TNode<String> string = |
| ToThisString(context, maybe_string, "String.prototype.toLowerCase"); |
| |
| Return(CallBuiltin(Builtin::kStringToLowerCaseIntl, context, string)); |
| } |
| |
| TF_BUILTIN(StringPrototypeToLocaleLowerCase, IntlBuiltinsAssembler) { |
| TNode<Int32T> argc = |
| UncheckedParameter<Int32T>(Descriptor::kJSActualArgumentsCount); |
| CodeStubArguments args(this, argc); |
| TNode<Object> maybe_string = args.GetReceiver(); |
| TNode<Context> context = Parameter<Context>(Descriptor::kContext); |
| TNode<Object> maybe_locales = args.GetOptionalArgumentValue(0); |
| TNode<String> string = |
| ToThisString(context, maybe_string, "String.prototype.toLocaleLowerCase"); |
| ToLowerCaseImpl(string, maybe_locales, context, |
| ToLowerCaseKind::kToLocaleLowerCase, |
| [&args](TNode<Object> ret) { args.PopAndReturn(ret); }); |
| } |
| |
| void IntlBuiltinsAssembler::ToLowerCaseImpl( |
| TNode<String> string, TNode<Object> maybe_locales, TNode<Context> context, |
| ToLowerCaseKind kind, std::function<void(TNode<Object>)> ReturnFct) { |
| Label call_c(this), return_string(this), runtime(this, Label::kDeferred); |
| |
| // Unpack strings if possible, and bail to runtime unless we get a one-byte |
| // flat string. |
| ToDirectStringAssembler to_direct( |
| state(), string, ToDirectStringAssembler::kDontUnpackSlicedStrings); |
| to_direct.TryToDirect(&runtime); |
| |
| if (kind == ToLowerCaseKind::kToLocaleLowerCase) { |
| Label fast(this), check_locale(this); |
| // Check for fast locales. |
| GotoIf(IsUndefined(maybe_locales), &fast); |
| // Passing a Smi as locales requires performing a ToObject conversion |
| // followed by reading the length property and the "indexed" properties of |
| // it until a valid locale is found. |
| GotoIf(TaggedIsSmi(maybe_locales), &runtime); |
| GotoIfNot(IsString(CAST(maybe_locales)), &runtime); |
| GotoIfNot(IsSeqOneByteString(CAST(maybe_locales)), &runtime); |
| TNode<SeqOneByteString> locale = CAST(maybe_locales); |
| TNode<Uint32T> locale_length = LoadStringLengthAsWord32(locale); |
| GotoIf(Int32LessThan(locale_length, Int32Constant(2)), &runtime); |
| GotoIf(IsNonAlpha(GetChar(locale, 0)), &runtime); |
| GotoIf(IsNonAlpha(GetChar(locale, 1)), &runtime); |
| GotoIf(Word32Equal(locale_length, Int32Constant(2)), &check_locale); |
| GotoIf(Word32NotEqual(locale_length, Int32Constant(5)), &runtime); |
| GotoIf(Word32NotEqual(GetChar(locale, 2), Int32Constant('-')), &runtime); |
| GotoIf(IsNonAlpha(GetChar(locale, 3)), &runtime); |
| GotoIf(IsNonAlpha(GetChar(locale, 4)), &runtime); |
| Goto(&check_locale); |
| |
| Bind(&check_locale); |
| JumpIfStartsWithIgnoreCase(locale, "az", &runtime); |
| JumpIfStartsWithIgnoreCase(locale, "el", &runtime); |
| JumpIfStartsWithIgnoreCase(locale, "lt", &runtime); |
| JumpIfStartsWithIgnoreCase(locale, "tr", &runtime); |
| Goto(&fast); |
| |
| Bind(&fast); |
| } |
| |
| // Early exit on empty string. |
| const TNode<Uint32T> length = LoadStringLengthAsWord32(string); |
| GotoIf(Word32Equal(length, Uint32Constant(0)), &return_string); |
| |
| const TNode<BoolT> is_one_byte = to_direct.IsOneByte(); |
| GotoIfNot(is_one_byte, &runtime); |
| |
| // For short strings, do the conversion in CSA through the lookup table. |
| |
| const TNode<String> dst = AllocateSeqOneByteString(length); |
| |
| const int kMaxShortStringLength = 24; // Determined empirically. |
| GotoIf(Uint32GreaterThan(length, Uint32Constant(kMaxShortStringLength)), |
| &call_c); |
| |
| { |
| const TNode<IntPtrT> dst_ptr = PointerToSeqStringData(dst); |
| TVARIABLE(IntPtrT, var_cursor, IntPtrConstant(0)); |
| |
| const TNode<IntPtrT> start_address = |
| ReinterpretCast<IntPtrT>(to_direct.PointerToData(&call_c)); |
| const TNode<IntPtrT> end_address = |
| Signed(IntPtrAdd(start_address, ChangeUint32ToWord(length))); |
| |
| const TNode<ExternalReference> to_lower_table_addr = |
| ExternalConstant(ExternalReference::intl_to_latin1_lower_table()); |
| |
| TVARIABLE(Word32T, var_did_change, Int32Constant(0)); |
| |
| VariableList push_vars({&var_cursor, &var_did_change}, zone()); |
| BuildFastLoop<IntPtrT>( |
| push_vars, start_address, end_address, |
| [&](TNode<IntPtrT> current) { |
| TNode<Uint8T> c = Load<Uint8T>(current); |
| TNode<Uint8T> lower = |
| Load<Uint8T>(to_lower_table_addr, ChangeInt32ToIntPtr(c)); |
| StoreNoWriteBarrier(MachineRepresentation::kWord8, dst_ptr, |
| var_cursor.value(), lower); |
| |
| var_did_change = |
| Word32Or(Word32NotEqual(c, lower), var_did_change.value()); |
| |
| Increment(&var_cursor); |
| }, |
| kCharSize, LoopUnrollingMode::kNo, IndexAdvanceMode::kPost); |
| |
| // Return the original string if it remained unchanged in order to preserve |
| // e.g. internalization and private symbols (such as the preserved object |
| // hash) on the source string. |
| GotoIfNot(var_did_change.value(), &return_string); |
| |
| ReturnFct(dst); |
| } |
| |
| // Call into C for case conversion. The signature is: |
| // String ConvertOneByteToLower(String src, String dst); |
| BIND(&call_c); |
| { |
| const TNode<String> src = to_direct.string(); |
| |
| const TNode<ExternalReference> function_addr = |
| ExternalConstant(ExternalReference::intl_convert_one_byte_to_lower()); |
| |
| MachineType type_tagged = MachineType::AnyTagged(); |
| |
| const TNode<String> result = CAST(CallCFunction( |
| function_addr, type_tagged, std::make_pair(type_tagged, src), |
| std::make_pair(type_tagged, dst))); |
| |
| ReturnFct(result); |
| } |
| |
| BIND(&return_string); |
| ReturnFct(string); |
| |
| BIND(&runtime); |
| if (kind == ToLowerCaseKind::kToLocaleLowerCase) { |
| ReturnFct(CallRuntime(Runtime::kStringToLocaleLowerCase, context, string, |
| maybe_locales)); |
| } else { |
| DCHECK_EQ(kind, ToLowerCaseKind::kToLowerCase); |
| ReturnFct(CallRuntime(Runtime::kStringToLowerCaseIntl, NoContextConstant(), |
| string)); |
| } |
| } |
| |
| void IntlBuiltinsAssembler::ListFormatCommon(TNode<Context> context, |
| TNode<Int32T> argc, |
| Runtime::FunctionId format_func_id, |
| const char* method_name) { |
| CodeStubArguments args(this, argc); |
| |
| // Label has_list(this); |
| // 1. Let lf be this value. |
| // 2. If Type(lf) is not Object, throw a TypeError exception. |
| TNode<Object> receiver = args.GetReceiver(); |
| |
| // 3. If lf does not have an [[InitializedListFormat]] internal slot, throw a |
| // TypeError exception. |
| ThrowIfNotInstanceType(context, receiver, JS_LIST_FORMAT_TYPE, method_name); |
| TNode<JSListFormat> list_format = CAST(receiver); |
| |
| TNode<Object> list = args.GetOptionalArgumentValue(0); |
| { |
| // 4. Let stringList be ? StringListFromIterable(list). |
| TNode<Object> string_list = |
| CallBuiltin(Builtin::kStringListFromIterable, context, list); |
| |
| // 6. Return ? FormatList(lf, stringList). |
| args.PopAndReturn( |
| CallRuntime(format_func_id, context, list_format, string_list)); |
| } |
| } |
| |
| TNode<JSArray> IntlBuiltinsAssembler::AllocateEmptyJSArray( |
| TNode<Context> context) { |
| return CodeStubAssembler::AllocateJSArray( |
| PACKED_ELEMENTS, |
| LoadJSArrayElementsMap(PACKED_ELEMENTS, LoadNativeContext(context)), |
| IntPtrConstant(0), SmiConstant(0)); |
| } |
| |
| TF_BUILTIN(ListFormatPrototypeFormat, IntlBuiltinsAssembler) { |
| ListFormatCommon( |
| Parameter<Context>(Descriptor::kContext), |
| UncheckedParameter<Int32T>(Descriptor::kJSActualArgumentsCount), |
| Runtime::kFormatList, "Intl.ListFormat.prototype.format"); |
| } |
| |
| TF_BUILTIN(ListFormatPrototypeFormatToParts, IntlBuiltinsAssembler) { |
| ListFormatCommon( |
| Parameter<Context>(Descriptor::kContext), |
| UncheckedParameter<Int32T>(Descriptor::kJSActualArgumentsCount), |
| Runtime::kFormatListToParts, "Intl.ListFormat.prototype.formatToParts"); |
| } |
| |
| #include "src/codegen/undef-code-stub-assembler-macros.inc" |
| |
| } // namespace internal |
| } // namespace v8 |