ui/accessibility/ax_computed_node_data.cc - chromium/src - Git at Google

 // Copyright 2021 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "ui/accessibility/ax_computed_node_data.h"

 #include "base/check_op.h"
 #include "base/i18n/break_iterator.h"
 #include "base/logging.h"
 #include "base/numerics/safe_conversions.h"
 #include "base/strings/string_util.h"
 #include "base/strings/utf_string_conversions.h"
 #include "ui/accessibility/ax_enums.mojom.h"
 #include "ui/accessibility/ax_node.h"
 #include "ui/accessibility/ax_node_position.h"
 #include "ui/accessibility/ax_position.h"
 #include "ui/accessibility/ax_range.h"
 #include "ui/accessibility/ax_tree_manager.h"
 #include "ui/accessibility/ax_tree_manager_map.h"

 namespace ui {

 AXComputedNodeData::AXComputedNodeData(const AXNode& node) : owner_(&node) {}

 AXComputedNodeData::~AXComputedNodeData() = default;

 int AXComputedNodeData::GetOrComputeUnignoredIndexInParent() const {
   DCHECK(!owner_->IsIgnored());
   if (unignored_index_in_parent_)
     return *unignored_index_in_parent_;

   if (const AXNode* unignored_parent = owner_->GetUnignoredParent()) {
     unignored_parent->GetComputedNodeData().ComputeUnignoredValues();
   } else {
     // This should be the root node and, by convention, we assign it an
     // index-in-parent of 0.
     unignored_index_in_parent_ = 0;
   }
   return *unignored_index_in_parent_;
 }

 int AXComputedNodeData::GetOrComputeUnignoredChildCount() const {
   DCHECK(!owner_->IsIgnored());
   if (!unignored_child_count_)
     ComputeUnignoredValues();
   return *unignored_child_count_;
 }

 const std::vector<AXNodeID>& AXComputedNodeData::GetOrComputeUnignoredChildIDs()
     const {
   DCHECK(!owner_->IsIgnored());
   if (!unignored_child_ids_)
     ComputeUnignoredValues();
   return *unignored_child_ids_;
 }

 bool AXComputedNodeData::HasOrCanComputeAttribute(
     const ax::mojom::StringAttribute attribute) const {
   if (owner_->data().HasStringAttribute(attribute))
     return true;

   switch (attribute) {
     case ax::mojom::StringAttribute::kValue:
       // The value attribute could be computed on the browser for content
       // editables and ARIA text/search boxes.
       return owner_->data().IsNonAtomicTextField();
     default:
       return false;
   }
 }

 bool AXComputedNodeData::HasOrCanComputeAttribute(
     const ax::mojom::IntListAttribute attribute) const {
   if (owner_->data().HasIntListAttribute(attribute))
     return true;

   switch (attribute) {
     case ax::mojom::IntListAttribute::kLineStarts:
     case ax::mojom::IntListAttribute::kLineEnds:
     case ax::mojom::IntListAttribute::kSentenceStarts:
     case ax::mojom::IntListAttribute::kSentenceEnds:
     case ax::mojom::IntListAttribute::kWordStarts:
     case ax::mojom::IntListAttribute::kWordEnds:
       return true;
     default:
       return false;
   }
 }

 const std::string& AXComputedNodeData::GetOrComputeAttributeUTF8(
     const ax::mojom::StringAttribute attribute) const {
   if (owner_->data().HasStringAttribute(attribute))
     return owner_->data().GetStringAttribute(attribute);

   switch (attribute) {
     case ax::mojom::StringAttribute::kValue:
       if (owner_->data().IsNonAtomicTextField()) {
         DCHECK(HasOrCanComputeAttribute(attribute))
             << "Code in `HasOrCanComputeAttribute` should be in sync with "
                "'GetOrComputeAttributeUTF8`";
         return GetOrComputeTextContentWithParagraphBreaksUTF8();
       }
       // If an atomic text field has no value attribute sent from the renderer,
       // then it means that it is empty, since we do not compute the values of
       // such controls on the browser. The same for all other controls, other
       // than non-atomic text fields.
       return base::EmptyString();
     default:
       // This is a special case: for performance reasons do not use
       // `base::EmptyString()` in other places throughout the codebase.
       return base::EmptyString();
   }
 }

 std::u16string AXComputedNodeData::GetOrComputeAttributeUTF16(
     const ax::mojom::StringAttribute attribute) const {
   if (owner_->data().HasStringAttribute(attribute))
     return owner_->data().GetString16Attribute(attribute);

   switch (attribute) {
     case ax::mojom::StringAttribute::kValue:
       if (owner_->data().IsNonAtomicTextField()) {
         DCHECK(HasOrCanComputeAttribute(attribute))
             << "Code in `HasOrCanComputeAttribute` should be in sync with "
                "'GetOrComputeAttributeUTF16`";
         return GetOrComputeTextContentWithParagraphBreaksUTF16();
       }
       // If an atomic text field has no value attribute sent from the renderer,
       // then it means that it is empty, since we do not compute the values of
       // such controls on the browser. The same for all other controls, other
       // than non-atomic text fields.
       return std::u16string();
     default:
       return std::u16string();
   }
 }

 const std::vector<int32_t>& AXComputedNodeData::GetOrComputeAttribute(
     const ax::mojom::IntListAttribute attribute) const {
   if (owner_->data().HasIntListAttribute(attribute))
     return owner_->data().GetIntListAttribute(attribute);

   const std::vector<int32_t>* result = nullptr;
   switch (attribute) {
     case ax::mojom::IntListAttribute::kLineStarts:
       ComputeLineOffsetsIfNeeded();
       result = &(*line_starts_);
       break;
     case ax::mojom::IntListAttribute::kLineEnds:
       ComputeLineOffsetsIfNeeded();
       result = &(*line_ends_);
       break;
     case ax::mojom::IntListAttribute::kSentenceStarts:
       ComputeSentenceOffsetsIfNeeded();
       result = &(*sentence_starts_);
       break;
     case ax::mojom::IntListAttribute::kSentenceEnds:
       ComputeSentenceOffsetsIfNeeded();
       result = &(*sentence_ends_);
       break;
     case ax::mojom::IntListAttribute::kWordStarts:
       ComputeWordOffsetsIfNeeded();
       result = &(*word_starts_);
       break;
     case ax::mojom::IntListAttribute::kWordEnds:
       ComputeWordOffsetsIfNeeded();
       result = &(*word_ends_);
       break;
     default:
       return owner_->data().GetIntListAttribute(
           ax::mojom::IntListAttribute::kNone);
   }

   DCHECK(HasOrCanComputeAttribute(attribute))
       << "Code in `HasOrCanComputeAttribute` should be in sync with "
          "'GetOrComputeAttribute`";
   DCHECK(result);
   return *result;
 }

 const std::string&
 AXComputedNodeData::GetOrComputeTextContentWithParagraphBreaksUTF8() const {
   if (!text_content_with_paragraph_breaks_utf8_) {
     VLOG_IF(1, text_content_with_paragraph_breaks_utf16_)
         << "Only a single encoding of text content with paragraph breaks "
            "should be cached.";
     auto range =
         AXRange<AXPosition<AXNodePosition, AXNode>>::RangeOfContents(*owner_);
     text_content_with_paragraph_breaks_utf8_ = base::UTF16ToUTF8(
         range.GetText(AXTextConcatenationBehavior::kWithParagraphBreaks,
                       AXEmbeddedObjectBehavior::kSuppressCharacter));
   }
   return *text_content_with_paragraph_breaks_utf8_;
 }

 const std::u16string&
 AXComputedNodeData::GetOrComputeTextContentWithParagraphBreaksUTF16() const {
   if (!text_content_with_paragraph_breaks_utf16_) {
     VLOG_IF(1, text_content_with_paragraph_breaks_utf8_)
         << "Only a single encoding of text content with paragraph breaks "
            "should be cached.";
     auto range =
         AXRange<AXPosition<AXNodePosition, AXNode>>::RangeOfContents(*owner_);
     text_content_with_paragraph_breaks_utf16_ =
         range.GetText(AXTextConcatenationBehavior::kWithParagraphBreaks,
                       AXEmbeddedObjectBehavior::kSuppressCharacter);
   }
   return *text_content_with_paragraph_breaks_utf16_;
 }

 const std::string& AXComputedNodeData::GetOrComputeTextContentUTF8() const {
   if (!text_content_utf8_) {
     VLOG_IF(1, text_content_utf16_)
         << "Only a single encoding of text content should be cached.";
     text_content_utf8_ = ComputeTextContentUTF8();
   }
   return *text_content_utf8_;
 }

 const std::u16string& AXComputedNodeData::GetOrComputeTextContentUTF16() const {
   if (!text_content_utf16_) {
     VLOG_IF(1, text_content_utf8_)
         << "Only a single encoding of text content should be cached.";
     text_content_utf16_ = ComputeTextContentUTF16();
   }
   return *text_content_utf16_;
 }

 int AXComputedNodeData::GetOrComputeTextContentLengthUTF8() const {
   return static_cast<int>(GetOrComputeTextContentUTF8().length());
 }

 int AXComputedNodeData::GetOrComputeTextContentLengthUTF16() const {
   return static_cast<int>(GetOrComputeTextContentUTF16().length());
 }

 void AXComputedNodeData::ComputeUnignoredValues(
     int starting_index_in_parent) const {
   // Reset any previously computed values.
   unignored_index_in_parent_ = absl::nullopt;
   unignored_child_count_ = absl::nullopt;
   unignored_child_ids_ = absl::nullopt;

   int unignored_child_count = 0;
   std::vector<AXNodeID> unignored_child_ids;
   for (auto iter = owner_->AllChildrenBegin(); iter != owner_->AllChildrenEnd();
        ++iter) {
     const AXComputedNodeData& computed_data = iter->GetComputedNodeData();
     int new_index_in_parent = starting_index_in_parent + unignored_child_count;

     if (iter->IsIgnored()) {
       // Skip the ignored node and recursively look at its children.
       computed_data.ComputeUnignoredValues(new_index_in_parent);
       DCHECK(computed_data.unignored_child_count_);
       unignored_child_count += *computed_data.unignored_child_count_;
       DCHECK(computed_data.unignored_child_ids_);
       unignored_child_ids.insert(unignored_child_ids.end(),
                                  computed_data.unignored_child_ids_->begin(),
                                  computed_data.unignored_child_ids_->end());
     } else {
       ++unignored_child_count;
       unignored_child_ids.push_back(iter->id());
       computed_data.unignored_index_in_parent_ = new_index_in_parent;
     }
   }

   // Ignored nodes store unignored child information in order to propagate it to
   // their parents, but do not expose it directly.
   unignored_child_count_ = unignored_child_count;
   unignored_child_ids_ = unignored_child_ids;
 }

 void AXComputedNodeData::ComputeLineOffsetsIfNeeded() const {
   if (line_starts_ || line_ends_) {
     DCHECK_EQ(line_starts_->size(), line_ends_->size());
     return;  // Already cached.
   }

   line_starts_ = std::vector<int32_t>();
   line_ends_ = std::vector<int32_t>();
   const std::u16string& text_content = GetOrComputeTextContentUTF16();
   if (text_content.empty())
     return;

   // TODO(nektar): Using the `base::i18n::BreakIterator` class is not enough. We
   // also need to pass information from Blink as to which inline text boxes
   // start a new line and deprecate next/previous_on_line.
   base::i18n::BreakIterator iter(text_content,
                                  base::i18n::BreakIterator::BREAK_NEWLINE);
   if (!iter.Init())
     return;

   while (iter.Advance()) {
     line_starts_->push_back(base::checked_cast<int32_t>(iter.prev()));
     line_ends_->push_back(base::checked_cast<int32_t>(iter.pos()));
   }
 }

 void AXComputedNodeData::ComputeSentenceOffsetsIfNeeded() const {
   if (sentence_starts_ || sentence_ends_) {
     DCHECK_EQ(sentence_starts_->size(), sentence_ends_->size());
     return;  // Already cached.
   }

   sentence_starts_ = std::vector<int32_t>();
   sentence_ends_ = std::vector<int32_t>();
   if (owner_->IsLineBreak())
     return;
   const std::u16string& text_content = GetOrComputeTextContentUTF16();
   if (text_content.empty() ||
       base::ContainsOnlyChars(text_content, base::kWhitespaceUTF16)) {
     return;
   }

   // Unlike in ICU, a sentence boundary is not valid in Blink if it falls within
   // some whitespace that is used to separate sentences. We therefore need to
   // filter the boundaries returned by ICU and return a subset of them. For
   // example we should exclude a sentence boundary that is between two space
   // characters, "Hello. | there.".
   // TODO(nektar): The above is not accomplished simply by using the
   // `base::i18n::BreakIterator` class.
   base::i18n::BreakIterator iter(text_content,
                                  base::i18n::BreakIterator::BREAK_SENTENCE);
   if (!iter.Init())
     return;

   while (iter.Advance()) {
     sentence_starts_->push_back(base::checked_cast<int32_t>(iter.prev()));
     sentence_ends_->push_back(base::checked_cast<int32_t>(iter.pos()));
   }
 }

 void AXComputedNodeData::ComputeWordOffsetsIfNeeded() const {
   if (word_starts_ || word_ends_) {
     DCHECK_EQ(word_starts_->size(), word_ends_->size());
     return;  // Already cached.
   }

   word_starts_ = std::vector<int32_t>();
   word_ends_ = std::vector<int32_t>();
   const std::u16string& text_content = GetOrComputeTextContentUTF16();
   if (text_content.empty())
     return;

   // Unlike in ICU, a word boundary is valid in Blink only if it is before, or
   // immediately preceded by, an alphanumeric character, a series of punctuation
   // marks, an underscore or a line break. We therefore need to filter the
   // boundaries returned by ICU and return a subset of them. For example we
   // should exclude a word boundary that is between two space characters, "Hello
   // | there".
   // TODO(nektar): Fix the fact that the `base::i18n::BreakIterator` class does
   // not take into account underscores as word separators.
   base::i18n::BreakIterator iter(text_content,
                                  base::i18n::BreakIterator::BREAK_WORD);
   if (!iter.Init())
     return;

   while (iter.Advance()) {
     if (iter.IsWord()) {
       word_starts_->push_back(base::checked_cast<int>(iter.prev()));
       word_ends_->push_back(base::checked_cast<int>(iter.pos()));
     }
   }
 }

 std::string AXComputedNodeData::ComputeTextContentUTF8() const {
   // If a text field has no descendants, then we compute its text content from
   // its value or its placeholder. Otherwise we prefer to look at its descendant
   // text nodes because Blink doesn't always add all trailing white space to the
   // value attribute.
   const bool is_atomic_text_field_without_descendants =
       (owner_->data().IsTextField() && !owner_->GetUnignoredChildCount());
   if (is_atomic_text_field_without_descendants) {
     std::string value =
         owner_->data().GetStringAttribute(ax::mojom::StringAttribute::kValue);
     // If the value is empty, then there might be some placeholder text in the
     // text field, or any other name that is derived from visible contents, even
     // if the text field has no children, so we treat this as any other leaf
     // node.
     if (!value.empty())
       return value;
   }

   // Ordinarily, atomic text fields are leaves, and for all leaves we directly
   // retrieve their text content using the information provided by the tree
   // source, such as Blink. However, for atomic text fields we need to exclude
   // them from the set of leaf nodes when they expose any descendants. This is
   // because we want to compute their text content from their descendant text
   // nodes as we don't always trust the "value" attribute provided by Blink.
   const bool is_atomic_text_field_with_descendants =
       (owner_->data().IsTextField() && owner_->GetUnignoredChildCount());
   if (owner_->IsLeaf() && !is_atomic_text_field_with_descendants) {
     switch (owner_->data().GetNameFrom()) {
       case ax::mojom::NameFrom::kNone:
       case ax::mojom::NameFrom::kUninitialized:
       // The accessible name is not displayed on screen, e.g. aria-label, or is
       // not displayed directly inside the node, e.g. an associated label
       // element.
       case ax::mojom::NameFrom::kAttribute:
       // The node's accessible name is explicitly empty.
       case ax::mojom::NameFrom::kAttributeExplicitlyEmpty:
       // The accessible name does not represent the entirety of the node's text
       // content, e.g. a table's caption or a figure's figcaption.
       case ax::mojom::NameFrom::kCaption:
       case ax::mojom::NameFrom::kRelatedElement:
       // The accessible name is not displayed directly inside the node but is
       // visible via e.g. a tooltip.
       case ax::mojom::NameFrom::kTitle:
         return std::string();

       case ax::mojom::NameFrom::kContents:
       // The placeholder text is initially displayed inside the text field and
       // takes the place of its value.
       case ax::mojom::NameFrom::kPlaceholder:
       // The value attribute takes the place of the node's text content, e.g.
       // the value of a submit button is displayed inside the button itself.
       case ax::mojom::NameFrom::kValue:
         return owner_->data().GetStringAttribute(
             ax::mojom::StringAttribute::kName);
     }
   }

   std::string text_content;
   for (auto it = owner_->UnignoredChildrenCrossingTreeBoundaryBegin();
        it != owner_->UnignoredChildrenCrossingTreeBoundaryEnd(); ++it) {
     text_content += it->GetTextContentUTF8();
   }
   return text_content;
 }

 std::u16string AXComputedNodeData::ComputeTextContentUTF16() const {
   return base::UTF8ToUTF16(ComputeTextContentUTF8());
 }

 }  // namespace ui
	// Copyright 2021 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "ui/accessibility/ax_computed_node_data.h"

	#include "base/check_op.h"
	#include "base/i18n/break_iterator.h"
	#include "base/logging.h"
	#include "base/numerics/safe_conversions.h"
	#include "base/strings/string_util.h"
	#include "base/strings/utf_string_conversions.h"
	#include "ui/accessibility/ax_enums.mojom.h"
	#include "ui/accessibility/ax_node.h"
	#include "ui/accessibility/ax_node_position.h"
	#include "ui/accessibility/ax_position.h"
	#include "ui/accessibility/ax_range.h"
	#include "ui/accessibility/ax_tree_manager.h"
	#include "ui/accessibility/ax_tree_manager_map.h"

	namespace ui {

	AXComputedNodeData::AXComputedNodeData(const AXNode& node) : owner_(&node) {}

	AXComputedNodeData::~AXComputedNodeData() = default;

	int AXComputedNodeData::GetOrComputeUnignoredIndexInParent() const {
	DCHECK(!owner_->IsIgnored());
	if (unignored_index_in_parent_)
	return *unignored_index_in_parent_;

	if (const AXNode* unignored_parent = owner_->GetUnignoredParent()) {
	unignored_parent->GetComputedNodeData().ComputeUnignoredValues();
	} else {
	// This should be the root node and, by convention, we assign it an
	// index-in-parent of 0.
	unignored_index_in_parent_ = 0;
	}
	return *unignored_index_in_parent_;
	}

	int AXComputedNodeData::GetOrComputeUnignoredChildCount() const {
	DCHECK(!owner_->IsIgnored());
	if (!unignored_child_count_)
	ComputeUnignoredValues();
	return *unignored_child_count_;
	}

	const std::vector<AXNodeID>& AXComputedNodeData::GetOrComputeUnignoredChildIDs()
	const {
	DCHECK(!owner_->IsIgnored());
	if (!unignored_child_ids_)
	ComputeUnignoredValues();
	return *unignored_child_ids_;
	}

	bool AXComputedNodeData::HasOrCanComputeAttribute(
	const ax::mojom::StringAttribute attribute) const {
	if (owner_->data().HasStringAttribute(attribute))
	return true;

	switch (attribute) {
	case ax::mojom::StringAttribute::kValue:
	// The value attribute could be computed on the browser for content
	// editables and ARIA text/search boxes.
	return owner_->data().IsNonAtomicTextField();
	default:
	return false;
	}
	}

	bool AXComputedNodeData::HasOrCanComputeAttribute(
	const ax::mojom::IntListAttribute attribute) const {
	if (owner_->data().HasIntListAttribute(attribute))
	return true;

	switch (attribute) {
	case ax::mojom::IntListAttribute::kLineStarts:
	case ax::mojom::IntListAttribute::kLineEnds:
	case ax::mojom::IntListAttribute::kSentenceStarts:
	case ax::mojom::IntListAttribute::kSentenceEnds:
	case ax::mojom::IntListAttribute::kWordStarts:
	case ax::mojom::IntListAttribute::kWordEnds:
	return true;
	default:
	return false;
	}
	}

	const std::string& AXComputedNodeData::GetOrComputeAttributeUTF8(
	const ax::mojom::StringAttribute attribute) const {
	if (owner_->data().HasStringAttribute(attribute))
	return owner_->data().GetStringAttribute(attribute);

	switch (attribute) {
	case ax::mojom::StringAttribute::kValue:
	if (owner_->data().IsNonAtomicTextField()) {
	DCHECK(HasOrCanComputeAttribute(attribute))
	<< "Code in `HasOrCanComputeAttribute` should be in sync with "
	"'GetOrComputeAttributeUTF8`";
	return GetOrComputeTextContentWithParagraphBreaksUTF8();
	}
	// If an atomic text field has no value attribute sent from the renderer,
	// then it means that it is empty, since we do not compute the values of
	// such controls on the browser. The same for all other controls, other
	// than non-atomic text fields.
	return base::EmptyString();
	default:
	// This is a special case: for performance reasons do not use
	// `base::EmptyString()` in other places throughout the codebase.
	return base::EmptyString();
	}
	}

	std::u16string AXComputedNodeData::GetOrComputeAttributeUTF16(
	const ax::mojom::StringAttribute attribute) const {
	if (owner_->data().HasStringAttribute(attribute))
	return owner_->data().GetString16Attribute(attribute);

	switch (attribute) {
	case ax::mojom::StringAttribute::kValue:
	if (owner_->data().IsNonAtomicTextField()) {
	DCHECK(HasOrCanComputeAttribute(attribute))
	<< "Code in `HasOrCanComputeAttribute` should be in sync with "
	"'GetOrComputeAttributeUTF16`";
	return GetOrComputeTextContentWithParagraphBreaksUTF16();
	}
	// If an atomic text field has no value attribute sent from the renderer,
	// then it means that it is empty, since we do not compute the values of
	// such controls on the browser. The same for all other controls, other
	// than non-atomic text fields.
	return std::u16string();
	default:
	return std::u16string();
	}
	}

	const std::vector<int32_t>& AXComputedNodeData::GetOrComputeAttribute(
	const ax::mojom::IntListAttribute attribute) const {
	if (owner_->data().HasIntListAttribute(attribute))
	return owner_->data().GetIntListAttribute(attribute);

	const std::vector<int32_t>* result = nullptr;
	switch (attribute) {
	case ax::mojom::IntListAttribute::kLineStarts:
	ComputeLineOffsetsIfNeeded();
	result = &(*line_starts_);
	break;
	case ax::mojom::IntListAttribute::kLineEnds:
	ComputeLineOffsetsIfNeeded();
	result = &(*line_ends_);
	break;
	case ax::mojom::IntListAttribute::kSentenceStarts:
	ComputeSentenceOffsetsIfNeeded();
	result = &(*sentence_starts_);
	break;
	case ax::mojom::IntListAttribute::kSentenceEnds:
	ComputeSentenceOffsetsIfNeeded();
	result = &(*sentence_ends_);
	break;
	case ax::mojom::IntListAttribute::kWordStarts:
	ComputeWordOffsetsIfNeeded();
	result = &(*word_starts_);
	break;
	case ax::mojom::IntListAttribute::kWordEnds:
	ComputeWordOffsetsIfNeeded();
	result = &(*word_ends_);
	break;
	default:
	return owner_->data().GetIntListAttribute(
	ax::mojom::IntListAttribute::kNone);
	}

	DCHECK(HasOrCanComputeAttribute(attribute))
	<< "Code in `HasOrCanComputeAttribute` should be in sync with "
	"'GetOrComputeAttribute`";
	DCHECK(result);
	return *result;
	}

	const std::string&
	AXComputedNodeData::GetOrComputeTextContentWithParagraphBreaksUTF8() const {
	if (!text_content_with_paragraph_breaks_utf8_) {
	VLOG_IF(1, text_content_with_paragraph_breaks_utf16_)
	<< "Only a single encoding of text content with paragraph breaks "
	"should be cached.";
	auto range =
	AXRange<AXPosition<AXNodePosition, AXNode>>::RangeOfContents(*owner_);
	text_content_with_paragraph_breaks_utf8_ = base::UTF16ToUTF8(
	range.GetText(AXTextConcatenationBehavior::kWithParagraphBreaks,
	AXEmbeddedObjectBehavior::kSuppressCharacter));
	}
	return *text_content_with_paragraph_breaks_utf8_;
	}

	const std::u16string&
	AXComputedNodeData::GetOrComputeTextContentWithParagraphBreaksUTF16() const {
	if (!text_content_with_paragraph_breaks_utf16_) {
	VLOG_IF(1, text_content_with_paragraph_breaks_utf8_)
	<< "Only a single encoding of text content with paragraph breaks "
	"should be cached.";
	auto range =
	AXRange<AXPosition<AXNodePosition, AXNode>>::RangeOfContents(*owner_);
	text_content_with_paragraph_breaks_utf16_ =
	range.GetText(AXTextConcatenationBehavior::kWithParagraphBreaks,
	AXEmbeddedObjectBehavior::kSuppressCharacter);
	}
	return *text_content_with_paragraph_breaks_utf16_;
	}

	const std::string& AXComputedNodeData::GetOrComputeTextContentUTF8() const {
	if (!text_content_utf8_) {
	VLOG_IF(1, text_content_utf16_)
	<< "Only a single encoding of text content should be cached.";
	text_content_utf8_ = ComputeTextContentUTF8();
	}
	return *text_content_utf8_;
	}

	const std::u16string& AXComputedNodeData::GetOrComputeTextContentUTF16() const {
	if (!text_content_utf16_) {
	VLOG_IF(1, text_content_utf8_)
	<< "Only a single encoding of text content should be cached.";
	text_content_utf16_ = ComputeTextContentUTF16();
	}
	return *text_content_utf16_;
	}

	int AXComputedNodeData::GetOrComputeTextContentLengthUTF8() const {
	return static_cast<int>(GetOrComputeTextContentUTF8().length());
	}

	int AXComputedNodeData::GetOrComputeTextContentLengthUTF16() const {
	return static_cast<int>(GetOrComputeTextContentUTF16().length());
	}

	void AXComputedNodeData::ComputeUnignoredValues(
	int starting_index_in_parent) const {
	// Reset any previously computed values.
	unignored_index_in_parent_ = absl::nullopt;
	unignored_child_count_ = absl::nullopt;
	unignored_child_ids_ = absl::nullopt;

	int unignored_child_count = 0;
	std::vector<AXNodeID> unignored_child_ids;
	for (auto iter = owner_->AllChildrenBegin(); iter != owner_->AllChildrenEnd();
	++iter) {
	const AXComputedNodeData& computed_data = iter->GetComputedNodeData();
	int new_index_in_parent = starting_index_in_parent + unignored_child_count;

	if (iter->IsIgnored()) {
	// Skip the ignored node and recursively look at its children.
	computed_data.ComputeUnignoredValues(new_index_in_parent);
	DCHECK(computed_data.unignored_child_count_);
	unignored_child_count += *computed_data.unignored_child_count_;
	DCHECK(computed_data.unignored_child_ids_);
	unignored_child_ids.insert(unignored_child_ids.end(),
	computed_data.unignored_child_ids_->begin(),
	computed_data.unignored_child_ids_->end());
	} else {
	++unignored_child_count;
	unignored_child_ids.push_back(iter->id());
	computed_data.unignored_index_in_parent_ = new_index_in_parent;
	}
	}

	// Ignored nodes store unignored child information in order to propagate it to
	// their parents, but do not expose it directly.
	unignored_child_count_ = unignored_child_count;
	unignored_child_ids_ = unignored_child_ids;
	}

	void AXComputedNodeData::ComputeLineOffsetsIfNeeded() const {
	if (line_starts_ \|\| line_ends_) {
	DCHECK_EQ(line_starts_->size(), line_ends_->size());
	return; // Already cached.
	}

	line_starts_ = std::vector<int32_t>();
	line_ends_ = std::vector<int32_t>();
	const std::u16string& text_content = GetOrComputeTextContentUTF16();
	if (text_content.empty())
	return;

	// TODO(nektar): Using the `base::i18n::BreakIterator` class is not enough. We
	// also need to pass information from Blink as to which inline text boxes
	// start a new line and deprecate next/previous_on_line.
	base::i18n::BreakIterator iter(text_content,
	base::i18n::BreakIterator::BREAK_NEWLINE);
	if (!iter.Init())
	return;

	while (iter.Advance()) {
	line_starts_->push_back(base::checked_cast<int32_t>(iter.prev()));
	line_ends_->push_back(base::checked_cast<int32_t>(iter.pos()));
	}
	}

	void AXComputedNodeData::ComputeSentenceOffsetsIfNeeded() const {
	if (sentence_starts_ \|\| sentence_ends_) {
	DCHECK_EQ(sentence_starts_->size(), sentence_ends_->size());
	return; // Already cached.
	}

	sentence_starts_ = std::vector<int32_t>();
	sentence_ends_ = std::vector<int32_t>();
	if (owner_->IsLineBreak())
	return;
	const std::u16string& text_content = GetOrComputeTextContentUTF16();
	if (text_content.empty() \|\|
	base::ContainsOnlyChars(text_content, base::kWhitespaceUTF16)) {
	return;
	}

	// Unlike in ICU, a sentence boundary is not valid in Blink if it falls within
	// some whitespace that is used to separate sentences. We therefore need to
	// filter the boundaries returned by ICU and return a subset of them. For
	// example we should exclude a sentence boundary that is between two space
	// characters, "Hello. \| there.".
	// TODO(nektar): The above is not accomplished simply by using the
	// `base::i18n::BreakIterator` class.
	base::i18n::BreakIterator iter(text_content,
	base::i18n::BreakIterator::BREAK_SENTENCE);
	if (!iter.Init())
	return;

	while (iter.Advance()) {
	sentence_starts_->push_back(base::checked_cast<int32_t>(iter.prev()));
	sentence_ends_->push_back(base::checked_cast<int32_t>(iter.pos()));
	}
	}

	void AXComputedNodeData::ComputeWordOffsetsIfNeeded() const {
	if (word_starts_ \|\| word_ends_) {
	DCHECK_EQ(word_starts_->size(), word_ends_->size());
	return; // Already cached.
	}

	word_starts_ = std::vector<int32_t>();
	word_ends_ = std::vector<int32_t>();
	const std::u16string& text_content = GetOrComputeTextContentUTF16();
	if (text_content.empty())
	return;

	// Unlike in ICU, a word boundary is valid in Blink only if it is before, or
	// immediately preceded by, an alphanumeric character, a series of punctuation
	// marks, an underscore or a line break. We therefore need to filter the
	// boundaries returned by ICU and return a subset of them. For example we
	// should exclude a word boundary that is between two space characters, "Hello
	// \| there".
	// TODO(nektar): Fix the fact that the `base::i18n::BreakIterator` class does
	// not take into account underscores as word separators.
	base::i18n::BreakIterator iter(text_content,
	base::i18n::BreakIterator::BREAK_WORD);
	if (!iter.Init())
	return;

	while (iter.Advance()) {
	if (iter.IsWord()) {
	word_starts_->push_back(base::checked_cast<int>(iter.prev()));
	word_ends_->push_back(base::checked_cast<int>(iter.pos()));
	}
	}
	}

	std::string AXComputedNodeData::ComputeTextContentUTF8() const {
	// If a text field has no descendants, then we compute its text content from
	// its value or its placeholder. Otherwise we prefer to look at its descendant
	// text nodes because Blink doesn't always add all trailing white space to the
	// value attribute.
	const bool is_atomic_text_field_without_descendants =
	(owner_->data().IsTextField() && !owner_->GetUnignoredChildCount());
	if (is_atomic_text_field_without_descendants) {
	std::string value =
	owner_->data().GetStringAttribute(ax::mojom::StringAttribute::kValue);
	// If the value is empty, then there might be some placeholder text in the
	// text field, or any other name that is derived from visible contents, even
	// if the text field has no children, so we treat this as any other leaf
	// node.
	if (!value.empty())
	return value;
	}

	// Ordinarily, atomic text fields are leaves, and for all leaves we directly
	// retrieve their text content using the information provided by the tree
	// source, such as Blink. However, for atomic text fields we need to exclude
	// them from the set of leaf nodes when they expose any descendants. This is
	// because we want to compute their text content from their descendant text
	// nodes as we don't always trust the "value" attribute provided by Blink.
	const bool is_atomic_text_field_with_descendants =
	(owner_->data().IsTextField() && owner_->GetUnignoredChildCount());
	if (owner_->IsLeaf() && !is_atomic_text_field_with_descendants) {
	switch (owner_->data().GetNameFrom()) {
	case ax::mojom::NameFrom::kNone:
	case ax::mojom::NameFrom::kUninitialized:
	// The accessible name is not displayed on screen, e.g. aria-label, or is
	// not displayed directly inside the node, e.g. an associated label
	// element.
	case ax::mojom::NameFrom::kAttribute:
	// The node's accessible name is explicitly empty.
	case ax::mojom::NameFrom::kAttributeExplicitlyEmpty:
	// The accessible name does not represent the entirety of the node's text
	// content, e.g. a table's caption or a figure's figcaption.
	case ax::mojom::NameFrom::kCaption:
	case ax::mojom::NameFrom::kRelatedElement:
	// The accessible name is not displayed directly inside the node but is
	// visible via e.g. a tooltip.
	case ax::mojom::NameFrom::kTitle:
	return std::string();

	case ax::mojom::NameFrom::kContents:
	// The placeholder text is initially displayed inside the text field and
	// takes the place of its value.
	case ax::mojom::NameFrom::kPlaceholder:
	// The value attribute takes the place of the node's text content, e.g.
	// the value of a submit button is displayed inside the button itself.
	case ax::mojom::NameFrom::kValue:
	return owner_->data().GetStringAttribute(
	ax::mojom::StringAttribute::kName);
	}
	}

	std::string text_content;
	for (auto it = owner_->UnignoredChildrenCrossingTreeBoundaryBegin();
	it != owner_->UnignoredChildrenCrossingTreeBoundaryEnd(); ++it) {
	text_content += it->GetTextContentUTF8();
	}
	return text_content;
	}

	std::u16string AXComputedNodeData::ComputeTextContentUTF16() const {
	return base::UTF8ToUTF16(ComputeTextContentUTF8());
	}

	} // namespace ui