view dep/animone/src/a11y/win32.cc @ 342:adb79bdde329

dep/animone: fix tons of issues for example, the window ID stuff was just... completely wrong. since we're supporting multiple different window systems, it *has* to be a union rather than just a single integer type. HWND is also not a DWORD, it's a pointer(!), so now it's stored as a std::uintptr_t. (this probably breaks things)
author Paper <paper@paper.us.eu.org>
date Thu, 20 Jun 2024 03:03:05 -0400
parents 052ec053ee37
children 1faa72660932
line wrap: on
line source

#include <functional>
#include <string>
#include <vector>
#include <memory>

#include <windows.h>
#include <uiautomation.h>

#include "animone/a11y.h"
#include "animone/a11y/win32.h"
#include "animone/util/win32.h"

namespace animone::internal::win32 {

// Windows Accessibility API reference:
// https://msdn.microsoft.com/en-us/library/windows/desktop/ff486375.aspx

// Commonly used interfaces
using Element = IUIAutomationElement;
using TreeWalker = IUIAutomationTreeWalker;
using ValuePattern = IUIAutomationValuePattern;

using element_proc_t = std::function<TreeScope(Element&)>;
using properties_t = std::vector<std::pair<long, bool>>;

/* ------------------------------------------------------------------- */

template <typename T>
struct ComInterfaceDeleter {
	static_assert(std::is_base_of<IUnknown, T>::value, "Invalid COM interface");
	using pointer = T*;
	void operator()(pointer p) const { if (p) p->Release(); }
};

template <typename T>
using ComInterface = std::unique_ptr<T, ComInterfaceDeleter<T>>;

/* ------------------------------------------------------------------- */

// The main interface that is used throughout this file. Must be initialized
// before it can be used for the first time.
static ComInterface<IUIAutomation> ui_automation;

/* ------------------------------------------------------------------- */

static bool InitializeUIAutomation() {
	if (ui_automation)
		return true;

	// COM library must be initialized on the current thread before calling
	// CoCreateInstance.
	::CoInitialize(nullptr);

	IUIAutomation* ui_automation_interface = nullptr;
	const auto result = ::CoCreateInstance(
			CLSID_CUIAutomation, nullptr, CLSCTX_INPROC_SERVER, IID_IUIAutomation,
			reinterpret_cast<void**>(&ui_automation_interface));
	ui_automation.reset(ui_automation_interface);

	return SUCCEEDED(result);
}

/* ------------------------------------------------------------------- */

static Element* GetElementFromHandle(HWND hwnd) {
	Element* element = nullptr;
	ui_automation->ElementFromHandle(static_cast<UIA_HWND>(hwnd), &element);
	return element;
}

static std::wstring GetElementName(Element& element) {
	std::wstring element_name;

	BSTR bstr = nullptr;
	if (SUCCEEDED(element.get_CurrentName(&bstr)) && bstr) {
		element_name = bstr;
		::SysFreeString(bstr);
	}

	return element_name;
}

static std::wstring GetElementValue(Element& element) {
	std::wstring element_value;

	ValuePattern* value_pattern_interface = nullptr;
	element.GetCurrentPatternAs(
			UIA_ValuePatternId, IID_PPV_ARGS(&value_pattern_interface));
	ComInterface<ValuePattern> value_pattern(value_pattern_interface);

	if (value_pattern) {
		BSTR bstr = nullptr;
		if (SUCCEEDED(value_pattern->get_CurrentValue(&bstr)) && bstr) {
			element_value = bstr;
			::SysFreeString(bstr);
		}
	}

	return element_value;
}

/* ------------------------------------------------------------------- */

static bool VerifyElementProperties(Element& element, const properties_t& properties) {
	VARIANT v = {};
	for (const auto& pair : properties) {
		if (FAILED(element.GetCurrentPropertyValue(pair.first, &v)))
			return false;
		if (v.boolVal != (pair.second ? VARIANT_TRUE : VARIANT_FALSE))
			return false;
	}

	return true;
}

static bool IsAddressBarElement(Element& element) {
	static const properties_t properties = {
		{UIA_IsEnabledPropertyId, true},
		{UIA_IsKeyboardFocusablePropertyId, true},
		{UIA_IsValuePatternAvailablePropertyId, true},
		{UIA_ValueIsReadOnlyPropertyId, false},
	};

	return VerifyElementProperties(element, properties);
}

static bool IsTabsElement(Element& element) {
	static const properties_t properties = {
		{UIA_ValueIsReadOnlyPropertyId, true},
	};

	return VerifyElementProperties(element, properties);
}

/* ------------------------------------------------------------------- */

static void WalkElements(TreeWalker& tree_walker, Element& parent, TreeScope scope,
                         size_t depth, element_proc_t element_proc) {
	constexpr size_t kMaxTreeDepth = 16;  // arbitrary value
	if (depth > kMaxTreeDepth)
		return;

	if (scope & TreeScope_Element)
		scope = element_proc(parent);

	auto descend = [](TreeScope scope) {
		return (scope & TreeScope_Children) || (scope & TreeScope_Descendants);
	};

	if (descend(scope)) {
		Element* first_element = nullptr;
		tree_walker.GetFirstChildElement(&parent, &first_element);
		ComInterface<Element> element(first_element);

		while (element) {
			scope = element_proc(*element);

			if (descend(scope))
				WalkElements(tree_walker, *element, scope, depth + 1, element_proc);

			Element* next_element = nullptr;
			tree_walker.GetNextSiblingElement(element.get(), &next_element);
			element.reset(next_element);
		}
	}
}

static bool FindWebBrowserElements(Element& parent, std::wstring& address,
                                   std::vector<std::wstring>& tabs) {
	TreeWalker* tree_walker_interface = nullptr;
	ui_automation->get_ControlViewWalker(&tree_walker_interface);
	ComInterface<TreeWalker> tree_walker(tree_walker_interface);

	if (!tree_walker)
		return false;

	auto element_proc = [&](Element& element) -> TreeScope {
		CONTROLTYPEID control_type_id = 0;
		element.get_CurrentControlType(&control_type_id);

		switch (control_type_id) {
			default:
				// Are we done?
				if (!address.empty() && !tabs.empty())
					return TreeScope_Element;
				// Otherwise continue descending the tree.
				return TreeScope_Descendants;

			case UIA_DocumentControlTypeId:
			case UIA_MenuBarControlTypeId:
			case UIA_TitleBarControlTypeId:
				// We do not need to walk through these nodes. In fact, skipping
				// documents dramatically improves our performance on worst case
				// scenarios. This is the whole reason we are walking the tree rather
				// than using FindFirst and FindAll methods.
				return TreeScope_Element;

			case UIA_EditControlTypeId:
				// Here we assume that the first edit control that fits our properties
				// is the address bar (e.g. "Omnibox" on Chrome, "Awesome Bar" on
				// Firefox). This element is named differently on each web browser
				// (e.g. "Address and search bar" on Chrome, "Search or enter address"
				// on Firefox). This name can change depending on the browser
				// language. However, we are only interested in the element value,
				// which usually gives us the URL of the current page.
				if (address.empty() && IsAddressBarElement(element)) {
					address = GetElementValue(element);
					return TreeScope_Element;
				} else {
					// Opera has an edit control ("Address field") within another edit
					// control ("Address bar").
					return TreeScope_Descendants;
				}

			case UIA_TabControlTypeId:
				if (tabs.empty() && IsTabsElement(element))
					return TreeScope_Children;
				return TreeScope_Element;

			case UIA_TabItemControlTypeId:
				tabs.push_back(GetElementName(element));
				return TreeScope_Element;
		}
	};

	WalkElements(*tree_walker, parent, TreeScope_Subtree, 0, element_proc);
	return true;
}

/* ------------------------------------------------------------------------------------ */

bool GetWebBrowserInformation(const Window& window, web_browser_proc_t web_browser_proc) {
	if (!web_browser_proc)
		return false;

	if (!InitializeUIAutomation())
		return false;

	ComInterface<Element> parent(GetElementFromHandle(reinterpret_cast<HWND>(window.id.win32)));
	if (!parent)
		return false;

	const std::string title = ToUtf8String(GetElementName(*parent));
	web_browser_proc({WebBrowserInformationType::Title, title});

	std::wstring address;
	std::vector<std::wstring> tabs;

	if (!FindWebBrowserElements(*parent, address, tabs))
		return false;

	web_browser_proc({WebBrowserInformationType::Address, ToUtf8String(address)});
	for (const auto& tab : tabs)
		web_browser_proc({WebBrowserInformationType::Tab, ToUtf8String(tab)});

	return true;
}

}  // namespace animone::internal::win32