Avi Drissman | 4e1b7bc | 2022-09-15 14:03:50 | [diff] [blame] | 1 | // Copyright 2022 The Chromium Authors |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 2 | // Use of this source code is governed by a BSD-style license that can be |
| 3 | // found in the LICENSE file. |
| 4 | |
Abigail Klein | 1ed2224 | 2022-12-16 16:48:43 | [diff] [blame] | 5 | #include "chrome/renderer/accessibility/ax_tree_distiller.h" |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 6 | |
Abigail Klein | e8c97f2 | 2022-04-04 21:39:11 | [diff] [blame] | 7 | #include <memory> |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 8 | #include <queue> |
Abigail Klein | e9c8e3c | 2022-07-22 15:47:25 | [diff] [blame] | 9 | #include <utility> |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 10 | #include <vector> |
| 11 | |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 12 | #include "base/containers/contains.h" |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 13 | #include "base/strings/utf_string_conversions.h" |
Abigail Klein | 1ed2224 | 2022-12-16 16:48:43 | [diff] [blame] | 14 | #include "content/public/renderer/render_frame.h" |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 15 | #include "content/public/renderer/render_thread.h" |
| 16 | #include "services/metrics/public/cpp/mojo_ukm_recorder.h" |
| 17 | #include "services/metrics/public/cpp/ukm_builders.h" |
Abigail Klein | 1ed2224 | 2022-12-16 16:48:43 | [diff] [blame] | 18 | #include "third_party/blink/public/common/browser_interface_broker_proxy.h" |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 19 | #include "ui/accessibility/accessibility_features.h" |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 20 | #include "ui/accessibility/ax_node.h" |
| 21 | #include "ui/accessibility/ax_tree.h" |
| 22 | |
| 23 | namespace { |
| 24 | |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 25 | // TODO: Consider moving this to AXNodeProperties. |
| 26 | static const ax::mojom::Role kContentRoles[]{ |
| 27 | ax::mojom::Role::kHeading, |
| 28 | ax::mojom::Role::kParagraph, |
Kristi Saney | a99fff3 | 2023-05-17 17:32:15 | [diff] [blame] | 29 | ax::mojom::Role::kNote, |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 30 | }; |
| 31 | |
| 32 | // TODO: Consider moving this to AXNodeProperties. |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 33 | static const ax::mojom::Role kRolesToSkip[]{ |
| 34 | ax::mojom::Role::kAudio, |
| 35 | ax::mojom::Role::kBanner, |
| 36 | ax::mojom::Role::kButton, |
| 37 | ax::mojom::Role::kComplementary, |
| 38 | ax::mojom::Role::kContentInfo, |
| 39 | ax::mojom::Role::kFooter, |
| 40 | ax::mojom::Role::kFooterAsNonLandmark, |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 41 | ax::mojom::Role::kImage, |
| 42 | ax::mojom::Role::kLabelText, |
| 43 | ax::mojom::Role::kNavigation, |
| 44 | }; |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 45 | |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 46 | // Find all of the main and article nodes. |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 47 | // TODO(crbug.com/1266555): Replace this with a call to |
| 48 | // OneShotAccessibilityTreeSearch. |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 49 | void GetContentRootNodes(const ui::AXNode* root, |
| 50 | std::vector<const ui::AXNode*>* content_root_nodes) { |
Kristi Saney | 414dd79b | 2023-04-20 20:45:44 | [diff] [blame] | 51 | if (!root) { |
| 52 | return; |
| 53 | } |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 54 | std::queue<const ui::AXNode*> queue; |
Abigail Klein | 930f02c | 2022-11-07 15:03:50 | [diff] [blame] | 55 | queue.push(root); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 56 | while (!queue.empty()) { |
Abigail Klein | 930f02c | 2022-11-07 15:03:50 | [diff] [blame] | 57 | const ui::AXNode* node = queue.front(); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 58 | queue.pop(); |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 59 | // If a main or article node is found, add it to the list of content root |
| 60 | // nodes and continue. Do not explore children for nested article nodes. |
| 61 | if (node->GetRole() == ax::mojom::Role::kMain || |
| 62 | node->GetRole() == ax::mojom::Role::kArticle) { |
| 63 | content_root_nodes->push_back(node); |
| 64 | continue; |
| 65 | } |
Abigail Klein | 930f02c | 2022-11-07 15:03:50 | [diff] [blame] | 66 | for (auto iter = node->UnignoredChildrenBegin(); |
| 67 | iter != node->UnignoredChildrenEnd(); ++iter) { |
| 68 | queue.push(iter.get()); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 69 | } |
| 70 | } |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 71 | } |
| 72 | |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 73 | // Recurse through the root node, searching for content nodes (any node whose |
| 74 | // role is in kContentRoles). Skip branches which begin with a node with role |
| 75 | // in kRolesToSkip. Once a content node is identified, add it to the vector |
| 76 | // |content_node_ids|, whose pointer is passed through the recursion. |
| 77 | void AddContentNodesToVector(const ui::AXNode* node, |
| 78 | std::vector<ui::AXNodeID>* content_node_ids) { |
| 79 | if (base::Contains(kContentRoles, node->GetRole())) { |
| 80 | content_node_ids->emplace_back(node->id()); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 81 | return; |
| 82 | } |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 83 | if (base::Contains(kRolesToSkip, node->GetRole())) |
| 84 | return; |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 85 | for (auto iter = node->UnignoredChildrenBegin(); |
| 86 | iter != node->UnignoredChildrenEnd(); ++iter) { |
Abigail Klein | 277fe7c2 | 2022-04-11 21:38:45 | [diff] [blame] | 87 | AddContentNodesToVector(iter.get(), content_node_ids); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 88 | } |
| 89 | } |
| 90 | |
| 91 | } // namespace |
| 92 | |
Abigail Klein | 1ed2224 | 2022-12-16 16:48:43 | [diff] [blame] | 93 | AXTreeDistiller::AXTreeDistiller( |
| 94 | content::RenderFrame* render_frame, |
| 95 | OnAXTreeDistilledCallback on_ax_tree_distilled_callback) |
| 96 | : render_frame_(render_frame), |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 97 | on_ax_tree_distilled_callback_(on_ax_tree_distilled_callback) { |
| 98 | // TODO(crbug.com/1450930): Use a global ukm recorder instance instead. |
| 99 | mojo::Remote<ukm::mojom::UkmRecorderFactory> factory; |
| 100 | content::RenderThread::Get()->BindHostReceiver( |
| 101 | factory.BindNewPipeAndPassReceiver()); |
| 102 | ukm_recorder_ = ukm::MojoUkmRecorder::Create(*factory); |
| 103 | } |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 104 | |
// No explicit teardown is performed here; members are cleaned up by the
// compiler-generated destructor.
AXTreeDistiller::~AXTreeDistiller() = default;
| 106 | |
Abigail Klein | fdeb3d7 | 2023-01-19 15:20:19 | [diff] [blame] | 107 | void AXTreeDistiller::Distill(const ui::AXTree& tree, |
Abigail Klein | dfdde35 | 2023-01-27 21:03:10 | [diff] [blame] | 108 | const ui::AXTreeUpdate& snapshot, |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 109 | const ukm::SourceId ukm_source_id) { |
| 110 | #if BUILDFLAG(ENABLE_SCREEN_AI_SERVICE) |
| 111 | base::TimeTicks start_time = base::TimeTicks::Now(); |
| 112 | #endif |
Jacob Francis | 1ba3a62 | 2023-11-21 22:18:21 | [diff] [blame^] | 113 | |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 114 | std::vector<ui::AXNodeID> content_node_ids; |
Jacob Francis | 1ba3a62 | 2023-11-21 22:18:21 | [diff] [blame^] | 115 | if (features::IsReadAnythingWithAlgorithmEnabled()) { |
| 116 | // Try with the algorithm first. |
| 117 | DistillViaAlgorithm(tree, ukm_source_id, &content_node_ids); |
| 118 | } |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 119 | |
Abigail Klein | 59872624 | 2023-02-22 18:44:14 | [diff] [blame] | 120 | // If Read Anything with Screen 2x is enabled and the main content extractor |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 121 | // is bound, kick off Screen 2x run, which distills the AXTree in the |
| 122 | // utility process using ML. |
Abigail Klein | af1b516 | 2022-12-01 01:40:40 | [diff] [blame] | 123 | #if BUILDFLAG(ENABLE_SCREEN_AI_SERVICE) |
Abigail Klein | 59872624 | 2023-02-22 18:44:14 | [diff] [blame] | 124 | if (features::IsReadAnythingWithScreen2xEnabled() && |
| 125 | main_content_extractor_.is_bound()) { |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 126 | DistillViaScreen2x(tree, snapshot, ukm_source_id, start_time, |
| 127 | &content_node_ids); |
Abigail Klein | af1b516 | 2022-12-01 01:40:40 | [diff] [blame] | 128 | return; |
| 129 | } |
| 130 | #endif |
| 131 | |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 132 | // Ensure we still callback if Screen2x is not available. |
| 133 | on_ax_tree_distilled_callback_.Run(tree.GetAXTreeID(), content_node_ids); |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 134 | } |
| 135 | |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 136 | void AXTreeDistiller::DistillViaAlgorithm( |
| 137 | const ui::AXTree& tree, |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 138 | const ukm::SourceId ukm_source_id, |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 139 | std::vector<ui::AXNodeID>* content_node_ids) { |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 140 | base::TimeTicks start_time = base::TimeTicks::Now(); |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 141 | std::vector<const ui::AXNode*> content_root_nodes; |
Abigail Klein | fdeb3d7 | 2023-01-19 15:20:19 | [diff] [blame] | 142 | GetContentRootNodes(tree.root(), &content_root_nodes); |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 143 | for (const ui::AXNode* content_root_node : content_root_nodes) { |
Kristi Saney | 4e5438b | 2023-05-16 21:00:58 | [diff] [blame] | 144 | AddContentNodesToVector(content_root_node, content_node_ids); |
Abigail Klein | 41d20e5 | 2022-11-28 19:24:06 | [diff] [blame] | 145 | } |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 146 | RecordRulesMetrics(ukm_source_id, base::TimeTicks::Now() - start_time, |
| 147 | !content_node_ids->empty()); |
| 148 | } |
| 149 | |
| 150 | void AXTreeDistiller::RecordRulesMetrics(ukm::SourceId ukm_source_id, |
| 151 | base::TimeDelta elapsed_time, |
| 152 | bool success) { |
| 153 | if (success) { |
| 154 | base::UmaHistogramTimes( |
| 155 | "Accessibility.ReadAnything.RulesDistillationTime.Success", |
| 156 | elapsed_time); |
| 157 | ukm::builders::Accessibility_ReadAnything(ukm_source_id) |
| 158 | .SetRulesDistillationTime_Success(elapsed_time.InMilliseconds()) |
| 159 | .Record(ukm_recorder_.get()); |
| 160 | } else { |
| 161 | base::UmaHistogramTimes( |
| 162 | "Accessibility.ReadAnything.RulesDistillationTime.Failure", |
| 163 | elapsed_time); |
| 164 | ukm::builders::Accessibility_ReadAnything(ukm_source_id) |
| 165 | .SetRulesDistillationTime_Failure(elapsed_time.InMilliseconds()) |
| 166 | .Record(ukm_recorder_.get()); |
| 167 | } |
Abigail Klein | a303f27 | 2022-03-31 22:32:57 | [diff] [blame] | 168 | } |
| 169 | |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 170 | #if BUILDFLAG(ENABLE_SCREEN_AI_SERVICE) |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 171 | void AXTreeDistiller::DistillViaScreen2x( |
| 172 | const ui::AXTree& tree, |
| 173 | const ui::AXTreeUpdate& snapshot, |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 174 | const ukm::SourceId ukm_source_id, |
| 175 | base::TimeTicks start_time, |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 176 | std::vector<ui::AXNodeID>* content_node_ids_algorithm) { |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 177 | DCHECK(main_content_extractor_.is_bound()); |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 178 | // Make a copy of |content_node_ids_algorithm| rather than sending a pointer. |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 179 | main_content_extractor_->ExtractMainContent( |
Abigail Klein | dfdde35 | 2023-01-27 21:03:10 | [diff] [blame] | 180 | snapshot, ukm_source_id, |
Abigail Klein | 34db57e | 2023-05-01 22:37:37 | [diff] [blame] | 181 | base::BindOnce(&AXTreeDistiller::ProcessScreen2xResult, |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 182 | weak_ptr_factory_.GetWeakPtr(), tree.GetAXTreeID(), |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 183 | ukm_source_id, start_time, *content_node_ids_algorithm)); |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 184 | } |
| 185 | |
| 186 | void AXTreeDistiller::ProcessScreen2xResult( |
Abigail Klein | 34db57e | 2023-05-01 22:37:37 | [diff] [blame] | 187 | const ui::AXTreeID& tree_id, |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 188 | const ukm::SourceId ukm_source_id, |
| 189 | base::TimeTicks start_time, |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 190 | std::vector<ui::AXNodeID> content_node_ids_algorithm, |
| 191 | const std::vector<ui::AXNodeID>& content_node_ids_screen2x) { |
| 192 | // Merge the results from the algorithm and from screen2x. |
| 193 | for (ui::AXNodeID content_node_id_screen2x : content_node_ids_screen2x) { |
| 194 | if (!base::Contains(content_node_ids_algorithm, content_node_id_screen2x)) { |
| 195 | content_node_ids_algorithm.push_back(content_node_id_screen2x); |
| 196 | } |
| 197 | } |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 198 | RecordMergedMetrics(ukm_source_id, base::TimeTicks::Now() - start_time, |
| 199 | !content_node_ids_algorithm.empty()); |
Abigail Klein | ad097706 | 2023-05-19 18:21:08 | [diff] [blame] | 200 | on_ax_tree_distilled_callback_.Run(tree_id, content_node_ids_algorithm); |
Abigail Klein | af1b516 | 2022-12-01 01:40:40 | [diff] [blame] | 201 | |
Kristi Saney | 84a7864 | 2023-05-10 18:41:54 | [diff] [blame] | 202 | // TODO(crbug.com/1266555): If no content nodes were identified, and |
Abigail Klein | d5fef9a | 2022-11-07 15:03:50 | [diff] [blame] | 203 | // there is a selection, try sending Screen2x a partial tree just containing |
| 204 | // the selected nodes. |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 205 | } |
Abigail Klein | 7849d1a | 2023-01-19 15:20:19 | [diff] [blame] | 206 | |
Abigail Klein | 59872624 | 2023-02-22 18:44:14 | [diff] [blame] | 207 | void AXTreeDistiller::ScreenAIServiceReady() { |
| 208 | if (main_content_extractor_.is_bound()) { |
| 209 | return; |
| 210 | } |
| 211 | render_frame_->GetBrowserInterfaceBroker()->GetInterface( |
| 212 | main_content_extractor_.BindNewPipeAndPassReceiver()); |
| 213 | main_content_extractor_.set_disconnect_handler( |
| 214 | base::BindOnce(&AXTreeDistiller::OnMainContentExtractorDisconnected, |
| 215 | weak_ptr_factory_.GetWeakPtr())); |
| 216 | } |
| 217 | |
Abigail Klein | 7849d1a | 2023-01-19 15:20:19 | [diff] [blame] | 218 | void AXTreeDistiller::OnMainContentExtractorDisconnected() { |
Abigail Klein | 3bd99e0 | 2023-01-24 00:29:18 | [diff] [blame] | 219 | on_ax_tree_distilled_callback_.Run(ui::AXTreeIDUnknown(), |
| 220 | std::vector<ui::AXNodeID>()); |
Abigail Klein | 7849d1a | 2023-01-19 15:20:19 | [diff] [blame] | 221 | } |
Jocelyn Tran | dab4ca60 | 2023-06-05 18:32:30 | [diff] [blame] | 222 | |
| 223 | void AXTreeDistiller::RecordMergedMetrics(ukm::SourceId ukm_source_id, |
| 224 | base::TimeDelta elapsed_time, |
| 225 | bool success) { |
| 226 | if (success) { |
| 227 | base::UmaHistogramTimes( |
| 228 | "Accessibility.ReadAnything.MergedDistillationTime.Success", |
| 229 | elapsed_time); |
| 230 | ukm::builders::Accessibility_ReadAnything(ukm_source_id) |
| 231 | .SetMergedDistillationTime_Success(elapsed_time.InMilliseconds()) |
| 232 | .Record(ukm_recorder_.get()); |
| 233 | } else { |
| 234 | base::UmaHistogramTimes( |
| 235 | "Accessibility.ReadAnything.MergedDistillationTime.Failure", |
| 236 | elapsed_time); |
| 237 | ukm::builders::Accessibility_ReadAnything(ukm_source_id) |
| 238 | .SetMergedDistillationTime_Failure(elapsed_time.InMilliseconds()) |
| 239 | .Record(ukm_recorder_.get()); |
| 240 | } |
| 241 | } |
Ramin Halavati | eddadb6 | 2022-05-04 17:29:49 | [diff] [blame] | 242 | #endif |