1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219
|
// Copyright 2023 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef CHROME_BROWSER_ACCESSIBILITY_MEDIA_APP_AX_MEDIA_APP_UNTRUSTED_SERVICE_H_
#define CHROME_BROWSER_ACCESSIBILITY_MEDIA_APP_AX_MEDIA_APP_UNTRUSTED_SERVICE_H_
#include <stdint.h>
#include <map>
#include <memory>
#include <optional>
#include <vector>
#include "ash/webui/media_app_ui/media_app_ui_untrusted.mojom.h"
#include "base/callback_list.h"
#include "base/containers/circular_deque.h"
#include "base/memory/raw_ptr.h"
#include "base/memory/raw_ref.h"
#include "base/memory/weak_ptr.h"
#include "base/sequence_checker.h"
#include "base/time/time.h"
#include "build/build_config.h"
#include "chrome/browser/accessibility/media_app/ax_media_app.h"
#include "chrome/browser/ash/accessibility/accessibility_manager.h"
#include "content/public/browser/browser_accessibility_state.h"
#include "content/public/browser/browser_context.h"
#include "content/public/browser/web_contents_observer.h"
#include "mojo/public/cpp/bindings/message.h"
#include "mojo/public/cpp/bindings/pending_remote.h"
#include "mojo/public/cpp/bindings/remote.h"
#include "ui/accessibility/ax_action_handler_base.h"
#include "ui/accessibility/ax_action_handler_registry.h"
#include "ui/accessibility/ax_enums.mojom.h"
#include "ui/accessibility/ax_event.h"
#include "ui/accessibility/ax_mode.h"
#include "ui/accessibility/ax_node_data.h"
#include "ui/accessibility/ax_node_id_forward.h"
#include "ui/accessibility/ax_serializable_tree.h"
#include "ui/accessibility/ax_tree_data.h"
#include "ui/accessibility/ax_tree_id.h"
#include "ui/accessibility/ax_tree_manager.h"
#include "ui/accessibility/ax_tree_serializer.h"
#include "ui/accessibility/ax_tree_source.h"
#include "ui/accessibility/ax_tree_update.h"
#include "ui/gfx/native_widget_types.h"
// Forward declarations for types that this header only refers to by
// reference, by pointer, or as a template argument.
class SkBitmap;
namespace content {
class RenderFrameHost;
class WebContents;
} // namespace content
namespace screen_ai {
class OpticalCharacterRecognizer;
} // namespace screen_ai
namespace ui {
struct AXActionData;
class AXNode;
struct AXUpdatesAndEvents;
// NOTE(review): the declarations in this header use `gfx::RectF`, not
// `ui::RectF` -- confirm whether this forward declaration is still needed.
class RectF;
} // namespace ui
namespace ash {
// Metadata for a single Media App page: the fields inherited from the mojom
// `PageMetadata` struct plus the page's position within the document.
struct AXMediaAppPageMetadata : ash::media_app_ui::mojom::PageMetadata {
  // The page number of the page that this metadata describes. 1-indexed. Pages
  // with a page number of 0 are 'deleted'.
  //
  // Explicitly initialized so that a default-initialized instance never holds
  // an indeterminate value; 0 is the 'deleted' sentinel described above.
  uint32_t page_num = 0;
};
// Browser-side implementation of the `OcrUntrustedService` mojom interface.
// In addition to receiving page metadata, page contents and viewport updates
// over that interface, it is an accessibility action handler
// (`ui::AXActionHandlerBase`) and a `content::WebContentsObserver`.
//
// The class keeps one accessibility tree manager per page (`pages_`) plus a
// `document_` tree manager, each with a matching tree source and serializer.
// NOTE(review): how these trees are built and combined is defined in the
// implementation file -- confirm details there.
//
// NOTE(review): this header uses `std::string` but does not include <string>
// directly -- confirm it is provided transitively, or add the include.
class AXMediaAppUntrustedService
: public media_app_ui::mojom::OcrUntrustedService,
public ui::AXActionHandlerBase,
public content::WebContentsObserver {
public:
// Tree source type used for both the document tree (`document_source_`) and
// the per-page trees (`page_sources_`).
using TreeSource =
ui::AXTreeSource<const ui::AXNode*, ui::AXTreeData*, ui::AXNodeData>;
// Tree serializer type used for both the document tree
// (`document_serializer_`) and the per-page trees (`page_serializers_`).
using TreeSerializer = ui::AXTreeSerializer<const ui::AXNode*,
std::vector<const ui::AXNode*>,
ui::AXTreeUpdate*,
ui::AXTreeData*,
ui::AXNodeData>;
// Values stored in `ocr_status_`. The names suggest they track whether the
// OCR service initialized and whether any text has been extracted so far;
// the exact transitions are defined in the implementation -- TODO confirm.
enum class OcrStatus {
kUninitialized,
kInitializationFailed,
kInProgressWithNoTextExtractedYet,
kInProgressWithTextExtracted,
kCompletedWithNoTextExtracted,
kCompletedWithTextExtracted,
};
// `context` is taken by reference; presumably it is what `browser_context_`
// refers to and therefore must outlive this object -- verify in the .cc file.
// `page` is the pending remote end of the `OcrUntrustedPage` interface.
AXMediaAppUntrustedService(
content::BrowserContext& context,
gfx::NativeWindow native_window,
mojo::PendingRemote<media_app_ui::mojom::OcrUntrustedPage> page);
// Not copyable or assignable.
AXMediaAppUntrustedService(const AXMediaAppUntrustedService&) = delete;
AXMediaAppUntrustedService& operator=(const AXMediaAppUntrustedService&) =
delete;
~AXMediaAppUntrustedService() override;
// Returns whether accessibility is considered enabled. NOTE(review): which
// accessibility modes/features count is decided in the implementation.
bool IsAccessibilityEnabled() const;
// Receives the result of OCR service initialization; `is_successful` reports
// whether it succeeded.
void OnOCRServiceInitialized(bool is_successful);
// Receives Ash accessibility status events. Presumably registered through
// `accessibility_status_subscription_` -- verify in the .cc file.
void OnAshAccessibilityModeChanged(
const ash::AccessibilityStatusEventDetails& details);
// ui::AXActionHandlerBase:
void PerformAction(const ui::AXActionData& action_data) override;
// content::WebContentsObserver:
void AccessibilityEventReceived(
const ui::AXUpdatesAndEvents& details) override;
// ash::media_app_ui::mojom::OcrUntrustedService:
void PageMetadataUpdated(
const std::vector<ash::media_app_ui::mojom::PageMetadataPtr>
page_metadata) override;
void PageContentsUpdated(const std::string& dirty_page_id) override;
void ViewportUpdated(const ::gfx::RectF& viewport_box,
float scale_factor) override;
protected:
// Virtual so that subclasses can override it (presumably test fakes).
virtual bool IsOcrServiceEnabled() const;
// Add / remove a page ID to / from the set of pages waiting to be OCRed.
// Presumably these operate on `dirty_page_ids_` -- verify in the .cc file.
void PushDirtyPage(const std::string& dirty_page_id);
std::string PopDirtyPage();
// Virtual so that subclasses can override how the next dirty page, if there
// is one, gets OCRed.
virtual void OcrNextDirtyPageIfAny();
// Batching state. Defaults are 2 and 0 respectively; how batches are formed
// is defined in the implementation (see also `ComputePagesPerBatch()`).
size_t min_pages_per_batch_ = 2u;
size_t pages_ocred_on_initial_load_ = 0u;
// `AXMediaApp` should outlive this handler.
raw_ptr<AXMediaApp> media_app_;
// Both default to true. NOTE(review): presumably these control whether the
// landmark node and the postamble page are emitted -- confirm.
bool has_landmark_node_ = true;
bool has_postamble_page_ = true;
// Tree manager, source and serializer for the document-level tree.
std::unique_ptr<ui::AXTreeManager> document_;
std::unique_ptr<TreeSource> document_source_;
std::unique_ptr<TreeSerializer> document_serializer_;
// Per-page state. All four maps are keyed by a string; presumably the page
// ID used by the mojom interface -- verify against callers.
std::map<const std::string, AXMediaAppPageMetadata> page_metadata_;
std::map<const std::string, std::unique_ptr<ui::AXTreeManager>> pages_;
std::map<const std::string, std::unique_ptr<TreeSource>> page_sources_;
std::map<const std::string, std::unique_ptr<TreeSerializer>>
page_serializers_;
// Test-only hooks, as indicated by the `_for_testing_` suffix.
std::unique_ptr<std::vector<ui::AXTreeUpdate>>
pending_serialized_updates_for_testing_;
raw_ptr<ui::AXNode> last_hit_test_node_for_testing_;
ui::AXEvent last_hit_test_event_for_testing_;
// Ref-counted handle to the OCR implementation.
scoped_refptr<screen_ai::OpticalCharacterRecognizer> ocr_;
private:
size_t ComputePagesPerBatch() const;
// Build node data for the status/landmark nodes and for the postamble page.
// NOTE(review): the exact node contents are defined in the implementation.
std::vector<ui::AXNodeData> CreateStatusNodesWithLandmark() const;
std::vector<ui::AXNodeData> CreatePostamblePage() const;
void ToggleAccessibilityState();
void SendAllAXTreesToAccessibilityService();
void RemoveAllAXTreesFromAccessibilityService();
void RemoveDocumentTree();
// Sends a single tree, identified by its manager and serializer.
void SendAXTreeToAccessibilityService(const ui::AXTreeManager& manager,
TreeSerializer& serializer);
void InitializeOcrService();
void DisconnectFromOcrService();
void StartWatchingForAccessibilityEvents();
void StopWatchingForAccessibilityEvents();
void ShowOcrServiceFailedToInitializeMessage();
void ShowDocumentTree();
// Takes the update by non-const reference, so the implementation may modify
// `document_update`.
void UpdateDocumentTree(ui::AXTreeUpdate& document_update);
void UpdatePageLocation(const std::string& page_id,
const gfx::RectF& page_location);
// A callback which is run after the Media App sends the bitmap of the page
// that should be OCRed.
void OnBitmapReceived(const std::string& dirty_page_id,
const SkBitmap& bitmap);
// Receives the tree update produced for the page `dirty_page_id`.
// Presumably run once OCR of that page's bitmap finishes -- TODO confirm.
void OnPageOcred(const std::string& dirty_page_id,
const ui::AXTreeUpdate& tree_update);
content::WebContents* GetMediaAppWebContents() const;
content::RenderFrameHost* GetMediaAppRenderFrameHost() const;
void StitchDocumentTree();
// NOTE(review): the name suggests this validates `page_id` and reports a bad
// message (see `bad_message_callback_`) when it is invalid, returning true in
// that case -- confirm in the .cc file.
bool HasRendererTerminatedDueToBadPageId(const std::string& method_name,
const std::string& page_id);
// Returns a node for `document_point`, searching from `starting_node`.
// NOTE(review): whether this can return nullptr is not visible here.
ui::AXNode* HitTest(const gfx::Point& document_point,
ui::AXNode& starting_node) const;
// Presumably derived from `viewport_box_` and `scale_factor_` -- confirm.
std::unique_ptr<gfx::Transform> MakeTransformFromOffsetAndScale() const;
// Observes whether spoken feedback is enabled in Ash.
base::CallbackListSubscription accessibility_status_subscription_;
// This `BrowserContext` will always outlive the WebUI, so this is safe.
raw_ref<content::BrowserContext> browser_context_;
gfx::NativeWindow native_window_;
// Remote end of the `OcrUntrustedPage` interface.
mojo::Remote<media_app_ui::mojom::OcrUntrustedPage> media_app_page_;
// Viewport state; same parameter names as `ViewportUpdated()`, which
// presumably sets them. `scale_factor_` starts at 0.
gfx::RectF viewport_box_;
float scale_factor_ = 0.0f;
// Page IDs queued for OCR (see `PushDirtyPage()` / `PopDirtyPage()`).
base::circular_deque<std::string> dirty_page_ids_;
OcrStatus ocr_status_ = OcrStatus::kUninitialized;
// A fresh tree ID is generated for each instance.
ui::AXTreeID document_tree_id_ = ui::AXTreeID::CreateNewAXTreeID();
// Declares `sequence_checker_` (see base/sequence_checker.h).
SEQUENCE_CHECKER(sequence_checker_);
// Empty until a bad-message callback has been stored.
std::optional<mojo::ReportBadMessageCallback> bad_message_callback_ =
std::nullopt;
// Records when the user starts reading content in MediaApp.
base::TimeTicks start_reading_time_;
// Records the most recent time at which the user read content in MediaApp.
base::TimeTicks latest_reading_time_;
// Records the greatest page number to which the user has navigated.
size_t greatest_visited_page_number_ = 0;
// Kept as the last data member: members are destroyed in reverse declaration
// order, so the factory is destroyed before the other members.
base::WeakPtrFactory<AXMediaAppUntrustedService> weak_ptr_factory_{this};
};
} // namespace ash
#endif // CHROME_BROWSER_ACCESSIBILITY_MEDIA_APP_AX_MEDIA_APP_UNTRUSTED_SERVICE_H_
|