diff --git a/CHANGELOG.md b/CHANGELOG.md
index 4587d59c4b..1efded7a31 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -8,6 +8,10 @@ app.
 
 ## [Unreleased]
 
+- Rewrote text lookup to better handle cases of hidden content (including
+  `user-select: all` content), avoid lingering popups, and improve performance
+  (Fixes [#990](https://github.com/birchill/10ten-ja-reader/issues/990) and
+  [#1033](https://github.com/birchill/10ten-ja-reader/issues/1033)).
 - (Chrome, Edge, Safari) Fixed a bug where overlays would be broken on
   [MangaDex](https://mangadex.org/)
   ([#1110](https://github.com/birchill/10ten-ja-reader/issues/1110)).
diff --git a/src/content/gdocs-canvas.ts b/src/content/gdocs-canvas.ts
index 3a160e2dda..7cbd73df69 100644
--- a/src/content/gdocs-canvas.ts
+++ b/src/content/gdocs-canvas.ts
@@ -2,7 +2,7 @@ import { HighlightStyle } from '../common/content-config-params';
 import { empty, SVG_NS } from '../utils/dom-utils';
 import { Point, Rect } from '../utils/geometry';
 
-import { CursorPosition } from './get-text';
+import { CursorPosition } from './get-cursor-position';
 
 export function injectGdocsStyles() {
   removeGdocsStyles();
diff --git a/src/content/get-cursor-position.ts b/src/content/get-cursor-position.ts
new file mode 100644
index 0000000000..1dfcc1baa4
--- /dev/null
+++ b/src/content/get-cursor-position.ts
@@ -0,0 +1,672 @@
+import { html } from '../utils/builder';
+import { isTextInputNode, isTextNode, SVG_NS } from '../utils/dom-utils';
+import { bboxIncludesPoint, Point } from '../utils/geometry';
+import { getRangeForSingleCodepoint } from '../utils/range';
+import { isChromium } from '../utils/ua-utils';
+
+import { isGdocsOverlayElem } from './gdocs-canvas';
+
+declare global {
+  // The following definitions were dropped from lib.dom.d.ts in TypeScript 4.4
+  // since only Firefox supports them.
+  interface CaretPosition {
+    readonly offsetNode: Node;
+    readonly offset: number;
+    getClientRect(): DOMRect | null;
+  }
+
+  interface Document {
+    caretPositionFromPoint?: (x: number, y: number) => CaretPosition | null;
+  }
+}
+
+export type CursorPosition<T extends Node = Node> = {
+  offset: number;
+  offsetNode: T;
+};
+
+/**
+ * Wrapper around document.caretPositionFromPoint / document.caretRangeFromPoint
+ * that works around browser inconsistencies and bugs and digs into elements
+ * that otherwise would be hidden or unselectable.
+ */
+export function getCursorPosition({
+  point,
+  elements: initialElements,
+}: {
+  point: Point;
+  elements: readonly Element[];
+}): CursorPosition | null {
+  if (!initialElements.length) {
+    return null;
+  }
+
+  // Do an initial lookup
+  const initialResult = getCursorPositionForElement({
+    point,
+    element: initialElements[0],
+  });
+
+  // Check if our initial result is good enough
+  if (
+    isTextNodePosition(initialResult) ||
+    isTextInputPosition(initialResult) ||
+    isGdocsOverlayPosition(initialResult)
+  ) {
+    return initialResult;
+  }
+
+  // Otherwise see if we can get a better result by disabling pointer-events on
+  // any transparent elements from the hit list and checking again.
+  const stylesToRestore = new Map<Element, string | null>();
+
+  try {
+    const elements = [...initialElements];
+    let firstElement = true;
+
+    for (
+      let element = elements.shift();
+      element;
+      element = elements.shift(), firstElement = false
+    ) {
+      // Skip elements without a style attribute (since we have no easy way to
+      // toggle their pointer-events state).
+      if (
+        !(element instanceof HTMLElement) &&
+        !(element instanceof SVGElement)
+      ) {
+        continue;
+      }
+
+      // Skip elements that are already visible
+      //
+      // We need special handling here to account for "covering links".
+      //
+      // Normally we can just check if the current element is invisible or not
+      // but for asahi.com we have a special case where it effectively makes the
+      // covering content invisible by setting the dimensions of a _child_
+      // element to 1x1.
+      //
+      // To detect that case we check for a non-auto z-index since that has
+      // proven to be the most reliable indicator of this pattern. If we simply
+      // decide to treat the element as invisible whenever its bounding box
+      // doesn't line up, we'll run this too often and cause a performance
+      // regression when the cursor is moving around empty space on the Web
+      // page.
+      //
+      // We only do this for the initial lookup for now because so far that's
+      // proved sufficient (and is probably cheaper than trying to perform this
+      // check on every element in the hit list).
+      const treatElementAsInvisible =
+        firstElement && getComputedStyle(element).zIndex !== 'auto';
+      if (!treatElementAsInvisible && isVisible(element)) {
+        continue;
+      }
+
+      // Temporarily turn off pointer-events on the (invisible) element
+      stylesToRestore.set(element, element.getAttribute('style'));
+      element.style.setProperty('pointer-events', 'none', 'important');
+
+      // See if we get a better result now
+      const result = getCursorPositionForElement({ point, element });
+      if (isTextNodePosition(result) || isTextInputPosition(result)) {
+        return result;
+      }
+    }
+  } finally {
+    restoreStyles(stylesToRestore);
+  }
+
+  // We didn't find anything better by toggling pointer-events, so use the
+  // original result.
+  return initialResult;
+}
+
+export function isTextNodePosition(
+  position: CursorPosition | null | undefined
+): position is CursorPosition<Text> {
+  return !!position && isTextNode(position.offsetNode);
+}
+
+export function isTextInputPosition(
+  position: CursorPosition | null | undefined
+): position is CursorPosition<HTMLInputElement | HTMLTextAreaElement> {
+  return !!position && isTextInputNode(position.offsetNode);
+}
+
+export function isGdocsOverlayPosition(
+  position: CursorPosition | null | undefined
+): position is CursorPosition<SVGElement> {
+  return (
+    !!position &&
+    document.location.host === 'docs.google.com' &&
+    isGdocsOverlayElem(position.offsetNode)
+  );
+}
+
+function getElementForPosition(
+  position: CursorPosition | null | undefined
+): Element | null {
+  return position?.offsetNode?.nodeType === Node.ELEMENT_NODE
+    ? (position.offsetNode as Element)
+    : position?.offsetNode?.parentElement || null;
+}
+
+function getCursorPositionForElement({
+  point,
+  element,
+}: {
+  point: Point;
+  element: Element;
+}): CursorPosition | null {
+  // Lookup point
+  let position = lookupPoint({ point, element });
+
+  // If the position is in a text input element or Google Docs element return it
+  // immediately.
+  if (isTextInputPosition(position) || isGdocsOverlayPosition(position)) {
+    return position;
+  }
+
+  // If we have any other kind of node, see if we need to override the
+  // user-select style to get a better result.
+  //
+  // This addresses two issues:
+  //
+  // 1. In Firefox, content with `user-select: all` will cause
+  //    caretPositionFromPoint to return the parent element.
+  //
+  // 2. In Safari, content with `-webkit-user-select: none` will not be found by
+  //    caretRangeFromPoint.
+  //
+  if (!isTextNodePosition(position)) {
+    const userSelectResult = lookupPointWithNormalizedUserSelect({
+      point,
+      element,
+    });
+
+    // If we got back a text node, prefer it to our previous result
+    if (isTextNodePosition(userSelectResult)) {
+      position = userSelectResult;
+    }
+  }
+
+  // Check that the element intersects the point
+  //
+  // This can happen when the Web page sets the geometry of the element we
+  // picked up in a way that hides it (see the extended comment before
+  // `positionIntersectsPoint` for details).
+  if (position && !positionIntersectsPoint(position, point)) {
+    return null;
+  }
+
+  // Check that the position is close to the lookup point since sometimes
+  // due to line-wrapping etc. caretPositionFromPoint can return a point far
+  // away from the cursor.
+  if (isTextNodePosition(position) && !isResultCloseToPoint(position, point)) {
+    return null;
+  }
+
+  // Check that the element is visible
+  const positionElement = getElementForPosition(position);
+  if (positionElement && !isVisible(positionElement)) {
+    return null;
+  }
+
+  return position;
+}
+
+function isVisible(element: Element) {
+  // Use the checkVisibility API when available
+  if ('checkVisibility' in element) {
+    return element.checkVisibility({
+      checkOpacity: true,
+      checkVisibilityCSS: true,
+    });
+  }
+
+  const { opacity, visibility } = getComputedStyle(element);
+  return opacity !== '0' && visibility !== 'hidden';
+}
+
+function lookupPoint({
+  point,
+  element,
+}: {
+  point: Point;
+  element: Element;
+}): CursorPosition | null {
+  const position = getCaretPosition({ point, element });
+  if (!position) {
+    return null;
+  }
+
+  if (isTextNodePosition(position) && position.offset) {
+    position.offset = getVisualOffset({ position, point });
+  }
+
+  return position;
+}
+
+function getCaretPosition({
+  point,
+  element,
+}: {
+  point: Point;
+  element: Element;
+}): CursorPosition | null {
+  if (document.caretPositionFromPoint) {
+    const position = document.caretPositionFromPoint(point.x, point.y);
+    return position?.offsetNode
+      ? { offset: position.offset, offsetNode: position.offsetNode }
+      : null;
+  }
+
+  return caretRangeFromPoint({ point, element });
+}
+
+// If the cursor is more than half way across a character,
+// caretPositionFromPoint will choose the _next_ character since that's where
+// the cursor would be placed if you clicked there and started editing the
+// text.
+//
+// (Or something like that, it looks like when editing it's more like if the
+// character is 70% or so of the way across the character it inserts before
+// the next character. In any case, caretPositionFromPoint et al. appear to
+// consistently choose the next character after about the 50% mark in at least
+// Firefox and Chromium.)
+//
+// For _looking up_ text, however, it's more intuitive if we look up starting
+// from the character you're pointing at.
+//
+// Here we see if the point is within the bounding box of the _previous_
+// character in the inline direction and, if it is, start from there instead.
+function getVisualOffset({
+  position,
+  point,
+}: {
+  position: CursorPosition<Text>;
+  point: Point;
+}): number {
+  const range = getRangeForSingleCodepoint({
+    source: position.offsetNode,
+    offset: position.offset,
+    direction: 'backwards',
+  });
+
+  const previousCharacterBbox = range.getBoundingClientRect();
+  return bboxIncludesPoint({ bbox: previousCharacterBbox, point })
+    ? range.startOffset
+    : position.offset;
+}
+
+// Repeats the point lookup with `user-select` / `-webkit-user-select` forced
+// to `text` on `element` and any ancestors that use another value.
+//
+// Returns null when nothing needed overriding since, in that case, repeating
+// the lookup would simply produce the same result as before.
+function lookupPointWithNormalizedUserSelect({
+  point,
+  element,
+}: {
+  point: Point;
+  element: Element;
+}): CursorPosition | null {
+  const stylesToRestore = new Map<Element, string | null>();
+  // Restore the styles even if reading styles or the lookup itself throws so
+  // that we never leave our overrides behind on the page.
+  try {
+    const ok = ['auto', 'text', ''];
+    for (let elem: Element | null = element; elem; elem = elem.parentElement) {
+      // If the element doesn't have a style attribute we can't override it
+      if (!(elem instanceof HTMLElement) && !(elem instanceof SVGElement)) {
+        continue;
+      }
+
+      const { userSelect, webkitUserSelect } = getComputedStyle(elem);
+      if (!ok.includes(userSelect) || !ok.includes(webkitUserSelect)) {
+        stylesToRestore.set(elem, elem.getAttribute('style'));
+        // We set the styles directly on the element (as opposed to temporarily
+        // installing a stylesheet) since this should work better on shadow DOM
+        // elements.
+        elem.style.setProperty('user-select', 'text', 'important');
+        elem.style.setProperty('-webkit-user-select', 'text', 'important');
+      }
+    }
+
+    if (!stylesToRestore.size) {
+      return null;
+    }
+
+    // Look up again
+    return lookupPoint({ point, element });
+  } finally {
+    restoreStyles(stylesToRestore);
+  }
+}
+
+function restoreStyles(styles: Map<Element, string | null>) {
+  for (const [elem, style] of styles) {
+    if (style) {
+      elem.setAttribute('style', style);
+    } else {
+      elem.removeAttribute('style');
+    }
+  }
+}
+
+// --------------------------------------------------------------------------
+//
+// Intersection checking
+//
+// --------------------------------------------------------------------------
+
+// Check that the element's bounding box encapsulates the point, roughly.
+//
+// This is needed for at least two cases:
+//
+// 1) When the cursor is between two paragraphs. In that case the distance
+//    check below is not sufficient since we'll still be fairly close to the
+//    text we picked up (perhaps we should make the distance check based on
+//    the writing mode?).
+//
+// 2) For the "covering link" case found on sites like asahi.com which have
+//    a structure like the following:
+//
+//    <div>
+//      <a href="/articles/" style="position: absolute; top: 0; bottom: 0; left: 0; right: 0; z-index: 1">
+//        <span aria-hidden="true" style="display: block; width: 1px; height: 1px; overflow: hidden">
+//          あいうえお
+//        </span>
+//      </a>
+//    </div>
+//    <div>
+//      <div style="position: relative; width: 100%">
+//        <h2 style="z-index: auto">
+//          <a href="/articles/" id="innerLink">
+//            あいうえお
+//          </a>
+//        </h2>
+//      </div>
+//    </div>
+//
+//    In this case caretPositionFromPoint will return a position inside the
+//    first <span> (inside the "covering link") but that span is effectively
+//    made invisible by giving it a width and height of 1px.
+//
+//    We need to reject that result so we have a chance to look for the text
+//    in the covered <div> (the second <a> element).
+function positionIntersectsPoint(
+  position: CursorPosition,
+  point: Point
+): boolean {
+  const positionElement = getElementForPosition(position);
+
+  return (
+    !!positionElement &&
+    (getComputedStyle(positionElement).display === 'contents' ||
+      bboxIncludesPoint({
+        bbox: positionElement.getBoundingClientRect(),
+        margin: 5,
+        point,
+      }))
+  );
+}
+
+// --------------------------------------------------------------------------
+//
+// Distance checking
+//
+// --------------------------------------------------------------------------
+
+function isResultCloseToPoint(
+  position: { offsetNode: Text; offset: number },
+  point: Point
+): boolean {
+  const distanceResult = getDistanceFromTextNode(position, point);
+
+  // We should be within the space of about three characters
+  return (
+    !distanceResult || distanceResult.distance <= distanceResult.glyphExtent * 3
+  );
+}
+
+function getDistanceFromTextNode(
+  position: { offsetNode: Text; offset: number },
+  point: Point
+): { distance: number; glyphExtent: number } | null {
+  const { offsetNode: node, offset } = position;
+
+  if (!node.parentElement) {
+    return null;
+  }
+
+  // Ignore SVG content (it doesn't normally need distance checking).
+  if (node.parentElement.namespaceURI === SVG_NS) {
+    return null;
+  }
+
+  // Get bbox of first character in range (since that's where we select from).
+  const range = getRangeForSingleCodepoint({ source: node, offset });
+  const bbox = range.getBoundingClientRect();
+
+  // Find the distance from the cursor to the closest edge of that character
+  // since if we have a large font size the two distances could be quite
+  // different.
+  const xDist = Math.min(
+    Math.abs(point.x - bbox.left),
+    Math.abs(point.x - bbox.right)
+  );
+  const yDist = Math.min(
+    Math.abs(point.y - bbox.top),
+    Math.abs(point.y - bbox.bottom)
+  );
+
+  const distance = Math.sqrt(xDist * xDist + yDist * yDist);
+  const glyphExtent = Math.sqrt(
+    bbox.width * bbox.width + bbox.height * bbox.height
+  );
+
+  return { distance, glyphExtent };
+}
+
+// --------------------------------------------------------------------------
+//
+// caretRangeFromPoint helpers
+//
+// --------------------------------------------------------------------------
+
+/**
+ * Wrapper for document.caretRangeFromPoint that fixes some deficiencies when
+ * compared with caretPositionFromPoint (at least with regards to the Firefox
+ * implementation of caretPositionFromPoint).
+ */
+function caretRangeFromPoint({
+  point,
+  element,
+}: {
+  point: Point;
+  element: Element;
+}): CursorPosition | null {
+  // Special handling for text boxes.
+  //
+  // 1. In Chromium, caretRangeFromPoint doesn't return text input elements.
+  //    Instead it returns one of their ancestors.
+  //
+  // 2. In WebKit, caretRangeFromPoint returns text input elements, but always
+  //    sets the offset to 0.
+  if (isTextInputNode(element)) {
+    return getCursorPositionFromTextInput({ input: element, point });
+  }
+
+  let range = document.caretRangeFromPoint(point.x, point.y);
+
+  // TODO: Shadow DOM handling
+
+  // Range adjustment for Safari
+  range = adjustForRangeBoundary({ range, point });
+
+  return range
+    ? {
+        offsetNode: range.startContainer,
+        offset: range.startOffset,
+      }
+    : null;
+}
+
+/**
+ * Helper for caretRangeFromPoint to look up text input elements.
+ */
+function getCursorPositionFromTextInput({
+  input,
+  point,
+}: {
+  input: HTMLInputElement | HTMLTextAreaElement;
+  point: Point;
+}): CursorPosition | null {
+  // This is only called when the platform APIs failed to give us the correct
+  // result so we need to synthesize an element with the same layout as the
+  // text area, read the text position, then drop it.
+  //
+  // We currently only expect to use it together with caretRangeFromPoint since
+  // caretPositionFromPoint should look up text inputs correctly.
+  if (!('caretRangeFromPoint' in document)) {
+    throw new Error('caretRangeFromPoint not available');
+  }
+
+  // Create the element
+  const mirrorElement = html('div', {}, input.value);
+
+  // Set its styles to be the same
+  const cs = document.defaultView!.getComputedStyle(input);
+  for (let i = 0; i < cs.length; i++) {
+    const prop = cs.item(i);
+    mirrorElement.style.setProperty(prop, cs.getPropertyValue(prop));
+  }
+
+  // Special handling for Chromium which does _not_ include the scrollbars in
+  // the width/height when box-sizing is 'content-box'.
+  if (isChromium() && cs.boxSizing === 'content-box') {
+    const { paddingLeft, paddingRight, paddingTop, paddingBottom } = cs;
+    const {
+      borderLeftWidth,
+      borderRightWidth,
+      borderTopWidth,
+      borderBottomWidth,
+    } = cs;
+
+    const width =
+      input.offsetWidth -
+      parseFloat(paddingLeft) -
+      parseFloat(paddingRight) -
+      parseFloat(borderLeftWidth) -
+      parseFloat(borderRightWidth);
+    if (Number.isFinite(width)) {
+      mirrorElement.style.width = `${width}px`;
+    }
+
+    const height =
+      input.offsetHeight -
+      parseFloat(paddingTop) -
+      parseFloat(paddingBottom) -
+      parseFloat(borderTopWidth) -
+      parseFloat(borderBottomWidth);
+    if (Number.isFinite(height)) {
+      mirrorElement.style.height = `${height}px`;
+    }
+  }
+
+  // Set its position in the document to be the same
+  mirrorElement.style.position = 'absolute';
+  const bbox = input.getBoundingClientRect();
+
+  // We need to factor in the document scroll position too
+  const top = bbox.top + document.documentElement.scrollTop;
+  const left = bbox.left + document.documentElement.scrollLeft;
+
+  mirrorElement.style.top = top + 'px';
+  mirrorElement.style.left = left + 'px';
+
+  // Finally, make sure it is on top
+  mirrorElement.style.zIndex = '10000';
+
+  // Append the element to the document. We need to do this before adjusting
+  // the scroll offset or else it won't update.
+  document.documentElement.appendChild(mirrorElement);
+
+  // Make sure we drop the mirror element again even if the lookup throws.
+  try {
+    // Match the scroll position
+    const { scrollLeft, scrollTop } = input;
+    mirrorElement.scrollTo(scrollLeft, scrollTop);
+
+    // Read the offset
+    const result = caretRangeFromPoint({ point, element: mirrorElement });
+    if (result) {
+      // Adjust the offset before we drop the mirror element
+      if (isTextNodePosition(result)) {
+        result.offset = getVisualOffset({ position: result, point });
+      }
+      result.offsetNode = input;
+    }
+    return result;
+  } finally {
+    mirrorElement.remove();
+  }
+}
+
+// On Safari, if you pass a point into caretRangeFromPoint that is less than
+// about 60~70% of the way across the first character in a text node it will
+// return the previous text node instead.
+//
+// Here we try to detect that situation and return the "next" text node instead.
+function adjustForRangeBoundary({
+  range,
+  point,
+}: {
+  range: Range | null;
+  point: Point;
+}): Range | null {
+  // Check we got a range with the offset set to the end of a text node
+  if (
+    !range ||
+    !range.startOffset ||
+    range.startContainer.nodeType !== Node.TEXT_NODE ||
+    range.startOffset !== range.startContainer.textContent?.length
+  ) {
+    return range;
+  }
+
+  // Check there is a _different_ text node under the cursor
+  const elemFromPoint = document.elementFromPoint(point.x, point.y);
+  if (
+    !(elemFromPoint instanceof HTMLElement) ||
+    elemFromPoint === range.startContainer ||
+    !elemFromPoint.innerText.length
+  ) {
+    return range;
+  }
+
+  // Check the first character in the new element is actually the one under the
+  // cursor.
+  const firstNonEmptyTextNode = Array.from(elemFromPoint.childNodes).find(
+    (elem): elem is Text =>
+      elem.nodeType === Node.TEXT_NODE && !!(elem as Text).length
+  );
+  if (!firstNonEmptyTextNode) {
+    return range;
+  }
+
+  const firstCharRange = getRangeForSingleCodepoint({
+    source: firstNonEmptyTextNode,
+    offset: 0,
+  });
+
+  const firstCharBbox = firstCharRange.getBoundingClientRect();
+  if (!bboxIncludesPoint({ bbox: firstCharBbox, point })) {
+    return range;
+  }
+
+  firstCharRange.setEnd(firstNonEmptyTextNode, 0);
+  return firstCharRange;
+}
diff --git a/src/content/get-text.ts b/src/content/get-text.ts
index 324674bb21..8b26371948 100644
--- a/src/content/get-text.ts
+++ b/src/content/get-text.ts
@@ -1,19 +1,20 @@
-import { html } from '../utils/builder';
-import {
-  nonJapaneseChar,
-  nonJapaneseCharOrNumber,
-  startsWithNumber,
-} from '../utils/char-range';
-import { isTextInputNode, isTextNode, SVG_NS } from '../utils/dom-utils';
 import { bboxIncludesPoint, Point } from '../utils/geometry';
-import { isChromium } from '../utils/ua-utils';
-import { getContentType } from './content-type';
+import { getRangeForSingleCodepoint } from '../utils/range';
 
-import { getTextFromAnnotatedCanvas, isGdocsOverlayElem } from './gdocs-canvas';
-import { extractGetTextMetadata, lookForMetadata, SelectionMeta } from './meta';
+import { getContentType } from './content-type';
+import { getTextFromAnnotatedCanvas } from './gdocs-canvas';
+import {
+  CursorPosition,
+  getCursorPosition,
+  isGdocsOverlayPosition,
+  isTextInputPosition,
+  isTextNodePosition,
+} from './get-cursor-position';
+import { SelectionMeta } from './meta';
+import { scanText } from './scan-text';
 import { TextRange } from './text-range';
 
-export interface GetTextAtPointResult {
+export type GetTextAtPointResult = {
   text: string;
   // Contains the set of nodes and their ranges where text was found.
   // This will be null if, for example, the result is the text from an element's
@@ -21,13 +22,7 @@ export interface GetTextAtPointResult {
   textRange: TextRange | null;
   // Extra metadata we parsed in the process
   meta?: SelectionMeta;
-}
-
-// Basically CaretPosition but without getClientRect()
-export interface CursorPosition {
-  readonly offset: number;
-  readonly offsetNode: Node;
-}
+};
 
 // Cache of previous result (since often the mouse position will change but
 // the cursor position will not).
@@ -36,6 +31,7 @@ let previousResult:
       point: Point;
       position: CursorPosition | undefined;
       result: GetTextAtPointResult;
+      firstCharBbox?: DOMRect;
     }
   | undefined;
 
@@ -52,54 +48,29 @@ export function getTextAtPoint({
   point: Point;
   maxLength?: number;
 }): GetTextAtPointResult | null {
-  let position = matchText ? caretPositionFromPoint(point) : null;
-
-  // Chrome not only doesn't support caretPositionFromPoint, but also
-  // caretRangeFromPoint doesn't return text input elements. Instead it returns
-  // one of their ancestors.
+  // First check for a cache hit on the glyph bounding box
   //
-  // Chrome may one day support caretPositionFromPoint with the same buggy
-  // behavior so check if we DIDN'T get a text input element but _should_ have.
-  if (position && !isTextInputNode(position.offsetNode)) {
-    const elemUnderCursor = document.elementFromPoint(point.x, point.y);
-    if (isTextInputNode(elemUnderCursor)) {
-      const offset = getOffsetFromTextInputNode({
-        node: elemUnderCursor,
-        point,
-      });
-      position =
-        offset !== null ? { offset, offsetNode: elemUnderCursor } : null;
-    }
-  }
-  // By contrast, Safari simply always returns an offset of 0 for text boxes
-  else if (
-    position &&
-    position.usedCaretRangeFromPoint &&
-    position.offset === 0 &&
-    isTextInputNode(position.offsetNode)
-  ) {
-    const offset = getOffsetFromTextInputNode({
-      node: position.offsetNode,
-      point,
-    });
-    position =
-      offset !== null ? { offset, offsetNode: position.offsetNode } : position;
-  }
-
-  // Check if we are dealing with Google docs annotated canvas
-  let textToSynthesize = '';
+  // This will often be the case when scanning along a line of text
   if (
-    matchText &&
-    document.location.host === 'docs.google.com' &&
-    position &&
-    isGdocsOverlayElem(position.offsetNode)
+    previousResult?.firstCharBbox &&
+    bboxIncludesPoint({ bbox: previousResult.firstCharBbox, point })
   ) {
-    ({ position, text: textToSynthesize } = getTextFromAnnotatedCanvas({
-      maxLength,
-      point,
-    }));
+    return previousResult.result;
   }
 
+  // Next fetch the hit elements (dropping duplicates)
+  const elements = [...new Set(document.elementsFromPoint(point.x, point.y))];
+
+  // Look for text matches
+  const [position, scanNode] = matchText
+    ? getTextNodeStart({ elements, maxLength, point })
+    : [null, null];
+
+  // Check if we have a cache hit on the position
+  //
+  // This will mostly happen when we are working with non-text nodes (e.g. input
+  // boxes) or when the cursor is moving just outside the glyph bounds (e.g.
+  // along the top of a line).
   if (
     position &&
     position.offsetNode === previousResult?.position?.offsetNode &&
@@ -108,108 +79,57 @@ export function getTextAtPoint({
     return previousResult.result;
   }
 
-  // If we have a textual <input> node or a <textarea> we synthesize a
-  // text node and use that for finding text since it allows us to re-use
-  // the same handling for text nodes and 'value' attributes.
-
-  let startNode: Node | null = position ? position.offsetNode : null;
-  if (isTextInputNode(startNode)) {
-    // If we selected the end of the text, skip it.
-    if (position!.offset === startNode.value.length) {
-      previousResult = undefined;
-      return null;
-    }
-    startNode = document.createTextNode(startNode.value);
-  } else if (textToSynthesize) {
-    // Similarly, we synthesize a text node if we are dealing with Google docs
-    // text.
-    startNode = document.createTextNode(textToSynthesize);
-  }
-
-  // Try handling as a text node
-
-  if (isTextNode(startNode)) {
-    // Due to line wrapping etc. sometimes caretPositionFromPoint can return
-    // a point far away from the cursor.
-    //
-    // We don't need to do this for synthesized text nodes, however, since we
-    // assume we'll be within their bounds.
-    const distanceResult = getDistanceFromTextNode(
-      startNode,
-      position!.offset,
-      point
-    );
-
-    let closeEnough = true;
-    if (distanceResult) {
-      // If we're more than about three characters away, don't show the
-      // pop-up.
-      const { distance, glyphExtent } = distanceResult;
-      if (distance > glyphExtent * 3) {
-        closeEnough = false;
+  const synthesizedPosition = position
+    ? {
+        offsetNode: scanNode || position.offsetNode,
+        offset: position.offset,
       }
-    }
+    : undefined;
 
-    if (closeEnough) {
-      const result = getTextFromTextNode({
-        startNode,
-        startOffset: position!.offset,
-        point,
-        matchCurrency,
-        maxLength,
-      });
-
-      if (result) {
-        console.assert(
-          !!result.textRange,
-          'There should be a text range when getting text from a text node'
-        );
-
-        // If we synthesized a text node, substitute the original node back in.
-        if (startNode !== position!.offsetNode) {
-          console.assert(
-            result.textRange!.length === 1,
-            'When using a synthesized text node there should be a single range'
-          );
-          console.assert(
-            result.textRange![0].node === startNode,
-            'When using a synthesized text node the range should start' +
-              ' from that node'
-          );
-          result.textRange![0].node = position!.offsetNode;
-        }
-
-        previousResult = { point, position: position!, result };
-        return result;
-      }
-    }
-  }
-
-  // See if we are dealing with a covering link
-  const parentLink = getParentLink(startNode);
-  if (parentLink) {
-    const result = getTextFromCoveringLink({
-      linkElem: parentLink,
-      originalElem: startNode,
-      point,
+  if (position && isTextNodePosition(synthesizedPosition)) {
+    const result = scanText({
+      startPosition: synthesizedPosition,
       matchCurrency,
       maxLength,
     });
 
     if (result) {
-      // Don't cache `position` since it's not the position we actually used.
-      previousResult = { point, position: undefined, result };
+      console.assert(
+        !!result.textRange,
+        'There should be a text range when getting text from a text node'
+      );
+
+      // If we synthesized a text node, substitute the original node into the
+      // result.
+      if (position.offsetNode !== synthesizedPosition.offsetNode) {
+        console.assert(
+          result.textRange?.length === 1,
+          'When using a synthesized text node there should be a single range'
+        );
+        console.assert(
+          result.textRange![0].node === scanNode,
+          'When using a synthesized text node the range should start' +
+            ' from that node'
+        );
+        result.textRange![0].node = position.offsetNode;
+      }
+
+      previousResult = {
+        point,
+        position,
+        result,
+        firstCharBbox: getFirstCharBbox(position),
+      };
       return result;
     }
   }
 
   // Otherwise just pull whatever text we can off the element
-
-  const elem = document.elementFromPoint(point.x, point.y);
+  const elem = elements[0];
   if (elem) {
     const text = getTextFromRandomElement({ elem, matchImages, matchText });
     if (text) {
-      const result: GetTextAtPointResult = { text, textRange: null };
+      const result = { text, textRange: null };
       previousResult = { point, position: undefined, result };
       return result;
     }
@@ -237,685 +157,56 @@ export function clearPreviousResult() {
   previousResult = undefined;
 }
 
-function caretPositionFromPoint(
-  point: Point
-): (CursorPosition & { usedCaretRangeFromPoint?: boolean }) | null {
-  let result = rawCaretPositionFromPoint(point);
-  if (!result) {
-    return result;
+function getFirstCharBbox(position: CursorPosition): DOMRect | undefined {
+  if (!isTextNodePosition(position)) {
+    return undefined;
   }
 
-  // If the cursor is more than half way across a character,
-  // caretPositionFromPoint will choose the _next_ character since that's where
-  // the cursor would be placed if you clicked there and started editing the
-  // text.
-  //
-  // (Or something like that, it looks like when editing it's more like if the
-  // character is 70% or so of the way across the character it inserts before
-  // the next character. In any case, caretPositionFromPoint et. al appear to
-  // consistently choose the next character after about the 50% mark in at least
-  // Firefox and Chromium.)
-  //
-  // For _looking up_ text, however, it's more intuitive if we look up starting
-  // from the character you're pointing at.
-  //
-  // Below we see if the point is within the bounding box of the _previous_
-  // character in the inline direction and, if it is, start from there instead.
-  //
-  // (We do this adjustment here, rather than in, say, getTextFromTextNode,
-  // since it allows us to continue caching the position returned from this
-  // method and returning early if it doesn't change. The disadvantage is that
-  // because it only applies to text nodes, we don't do this adjustment for text
-  // boxes.
-  //
-  // If we did the adjustment inside getTextFromTextNode, however, it _would_
-  // work for text boxes since we synthesize a text node for them before calling
-  // getTextFromTextNode. As it is, we'll end up calling caretPositionFromPoint
-  // on the mirrored element we create for text boxes in Chrome/Edge/Safari so
-  // text boxes there will benefit from this adjustment already, it's just
-  // Firefox that won't. One might say that when we're in text boxes it's better
-  // to follow caretPositionFromPoint's behavior anyway.
-  //
-  // In any case, for now, we do the adjustment here so we keep the early return
-  // optimization and if it becomes important to apply this to text boxes too,
-  // we'll work out a way to address them at that time.)
-  const { offsetNode, offset } = result;
-  if (isTextNode(offsetNode) && offset) {
-    const range = new Range();
-    range.setStart(offsetNode, offset - 1);
-    range.setEnd(offsetNode, offset);
-    const previousCharacterBbox = range.getBoundingClientRect();
-    if (bboxIncludesPoint({ bbox: previousCharacterBbox, point })) {
-      result = {
-        offsetNode,
-        offset: offset - 1,
-        usedCaretRangeFromPoint: result.usedCaretRangeFromPoint,
-      };
-    }
-  }
-
-  return result;
-}
-
-declare global {
-  // The following definitions were dropped from lib.dom.d.ts in TypeScript 4.4
-  // since only Firefox supports them.
-  interface CaretPosition {
-    readonly offsetNode: Node;
-    readonly offset: number;
-    getClientRect(): DOMRect | null;
-  }
-
-  interface Document {
-    caretPositionFromPoint(x: number, y: number): CaretPosition | null;
-  }
-}
-
-function rawCaretPositionFromPoint(
-  point: Point
-): (CursorPosition & { usedCaretRangeFromPoint?: boolean }) | null {
-  if (document.caretPositionFromPoint) {
-    return document.caretPositionFromPoint(point.x, point.y);
-  }
-
-  let range = document.caretRangeFromPoint(point.x, point.y);
-
-  // Special handling for Safari which doesn't dig into nodes with
-  // -webkit-user-select: none.
-  //
-  // If we got an element (not a text node), try using elementFromPoint to see
-  // if we get a better match.
-  if (range && range.startContainer.nodeType === Node.ELEMENT_NODE) {
-    range =
-      getRangeWithoutUserSelectNone({ existingRange: range, point }) || range;
-  }
-
-  // Another Safari-specific workaround
-  range = adjustForRangeBoundary({ range, point });
-
-  return range
-    ? {
-        offsetNode: range.startContainer,
-        offset: range.startOffset,
-        usedCaretRangeFromPoint: true,
-      }
-    : null;
-}
-
-// For Safari, try harder to get the caret position for nodes with
-// -webkit-user-select: none.
-//
-// See notes in rawCaretPositionFromPoint for why we do this.
-function getRangeWithoutUserSelectNone({
-  existingRange,
-  point,
-}: {
-  existingRange: Range;
-  point: Point;
-}): Range | null {
-  const elemFromPoint = document.elementFromPoint(point.x, point.y);
-
-  if (
-    elemFromPoint === existingRange.startContainer ||
-    !(elemFromPoint instanceof HTMLElement) ||
-    !elemFromPoint.innerText.length
-  ) {
-    return null;
-  }
-
-  // Check if (-webkit-)user-select: none is set on the element
-  const cs = window.getComputedStyle(elemFromPoint);
-  if (cs.webkitUserSelect !== 'none' && cs.userSelect !== 'none') {
-    return null;
-  }
-
-  // Try to temporarily disable the (-webkit-)user-select style.
-  const styleElem = html(
-    'style',
-    {},
-    '* { -webkit-user-select: all !important; user-select: all !important; }'
-  );
-  document.head.append(styleElem);
-
-  // Retry looking up
-  const range = document.caretRangeFromPoint(point.x, point.y);
-  styleElem.remove();
-
-  // If we got a text node, prefer that to our previous result.
-  return range && range.startContainer.nodeType === Node.TEXT_NODE
-    ? range
-    : null;
-}
-
-// On Safari, if you pass a point into caretRangeFromPoint that is less than
-// about 60~70% of the way across the first character in a text node it will
-// return the previous text node instead.
-//
-// Here we try to detect that situation and return the "next" text node instead.
-function adjustForRangeBoundary({
-  range,
-  point,
-}: {
-  range: Range | null;
-  point: Point;
-}): Range | null {
-  // Check we got a range with the offset set to the end of a text node
-  if (
-    !range ||
-    !range.startOffset ||
-    range.startContainer.nodeType !== Node.TEXT_NODE ||
-    range.startOffset !== range.startContainer.textContent?.length
-  ) {
-    return range;
-  }
-
-  // Check there is a _different_ text node under the cursor
-  const elemFromPoint = document.elementFromPoint(point.x, point.y);
-  if (
-    !(elemFromPoint instanceof HTMLElement) ||
-    elemFromPoint === range.startContainer ||
-    !elemFromPoint.innerText.length
-  ) {
-    return range;
-  }
-
-  // Check the first character in the new element is actually the one under the
-  // cursor.
-  const firstNonEmptyTextNode = Array.from(elemFromPoint.childNodes).find(
-    (elem): elem is Text =>
-      elem.nodeType === Node.TEXT_NODE && !!(elem as Text).length
-  );
-  if (!firstNonEmptyTextNode) {
-    return range;
-  }
-
-  const firstCharRange = new Range();
-  firstCharRange.setStart(firstNonEmptyTextNode, 0);
-  firstCharRange.setEnd(firstNonEmptyTextNode, 1);
-
-  const firstCharBbox = firstCharRange.getBoundingClientRect();
-  if (!bboxIncludesPoint({ bbox: firstCharBbox, point })) {
-    return range;
-  }
-
-  firstCharRange.setEnd(firstNonEmptyTextNode, 0);
-  return firstCharRange;
-}
-
-function getOffsetFromTextInputNode({
-  node,
-  point,
-}: {
-  node: HTMLInputElement | HTMLTextAreaElement;
-  point: Point;
-}): number | null {
-  // This is only called when the platform APIs failed to give us the correct
-  // result so we need to synthesize an element with the same layout as the
-  // text area, read the text position, then drop it.
-
-  // Create the element
-  const mirrorElement = html('div', {}, node.value);
-
-  // Set its styles to be the same
-  const cs = document.defaultView!.getComputedStyle(node);
-  for (let i = 0; i < cs.length; i++) {
-    const prop = cs.item(i);
-    mirrorElement.style.setProperty(prop, cs.getPropertyValue(prop));
-  }
-
-  // Special handling for Chromium which does _not_ include the scrollbars in
-  // the width/height when box-sizing is 'content-box'.
-  if (isChromium() && cs.boxSizing === 'content-box') {
-    const { paddingLeft, paddingRight, paddingTop, paddingBottom } = cs;
-    const {
-      borderLeftWidth,
-      borderRightWidth,
-      borderTopWidth,
-      borderBottomWidth,
-    } = cs;
-
-    const width =
-      node.offsetWidth -
-      parseFloat(paddingLeft) -
-      parseFloat(paddingRight) -
-      parseFloat(borderLeftWidth) -
-      parseFloat(borderRightWidth);
-    if (Number.isFinite(width)) {
-      mirrorElement.style.width = `${width}px`;
-    }
-
-    const height =
-      node.offsetHeight -
-      parseFloat(paddingTop) -
-      parseFloat(paddingBottom) -
-      parseFloat(borderTopWidth) -
-      parseFloat(borderBottomWidth);
-    if (Number.isFinite(height)) {
-      mirrorElement.style.height = `${height}px`;
-    }
-  }
-
-  // Set its position in the document to be to be the same
-  mirrorElement.style.position = 'absolute';
-  const bbox = node.getBoundingClientRect();
-
-  // We need to factor in the document scroll position too
-  const top = bbox.top + document.documentElement.scrollTop;
-  const left = bbox.left + document.documentElement.scrollLeft;
-
-  mirrorElement.style.top = top + 'px';
-  mirrorElement.style.left = left + 'px';
-
-  // Finally, make sure it is on top
-  mirrorElement.style.zIndex = '10000';
-
-  // Append the element to the document. We need to do this before adjusting
-  // the scroll offset or else it won't update.
-  document.documentElement.appendChild(mirrorElement);
-
-  // Match the scroll position
-  const { scrollLeft, scrollTop } = node;
-  mirrorElement.scrollTo(scrollLeft, scrollTop);
-
-  // Read the offset
-  const position = caretPositionFromPoint(point);
-  const result = position?.offset ?? null;
-
-  // Drop the element
-  mirrorElement.remove();
-
-  return result;
-}
-
-function getDistanceFromTextNode(
-  startNode: CharacterData,
-  startOffset: number,
-  point: Point
-): { distance: number; glyphExtent: number } | null {
-  // Ignore synthesized text nodes.
-  if (!startNode.parentElement) {
-    return null;
-  }
-
-  // Ignore SVG content (it doesn't normally need distance checking).
-  if (startNode.parentElement.namespaceURI === SVG_NS) {
-    return null;
-  }
+  const firstCharRange = getRangeForSingleCodepoint({
+    source: position.offsetNode,
+    offset: position.offset,
+  });
 
-  // Get bbox of first character in range (since that's where we select from).
-  const range = new Range();
-  range.setStart(startNode, startOffset);
-  range.setEnd(startNode, Math.min(startOffset + 1, startNode.length));
-  const bbox = range.getBoundingClientRect();
-
-  // Find the distance from the cursor to the closest edge of that character
-  // since if we have a large font size the two distances could be quite
-  // different.
-  const xDist = Math.min(
-    Math.abs(point.x - bbox.left),
-    Math.abs(point.x - bbox.right)
-  );
-  const yDist = Math.min(
-    Math.abs(point.y - bbox.top),
-    Math.abs(point.y - bbox.bottom)
-  );
-
-  const distance = Math.sqrt(xDist * xDist + yDist * yDist);
-  const glyphExtent = Math.sqrt(
-    bbox.width * bbox.width + bbox.height * bbox.height
-  );
-
-  return { distance, glyphExtent };
+  // Skip empty ranges
+  return firstCharRange.startOffset !== firstCharRange.endOffset
+    ? firstCharRange.getBoundingClientRect()
+    : undefined;
 }
 
-function getTextFromTextNode({
-  startNode,
-  startOffset,
-  point,
-  matchCurrency,
+function getTextNodeStart({
+  elements,
   maxLength,
+  point,
 }: {
-  startNode: CharacterData;
-  startOffset: number;
-  point: Point;
-  matchCurrency: boolean;
+  elements: readonly Element[];
   maxLength?: number;
-}): GetTextAtPointResult | null {
-  const isRubyAnnotationElement = (element: Element | null) => {
-    if (!element) {
-      return false;
-    }
-
-    const tag = element.tagName.toLowerCase();
-    return tag === 'rp' || tag === 'rt';
-  };
-
-  const isInline = (element: Element | null) =>
-    element &&
-    // We always treat <rb> and <ruby> tags as inline regardless of the
-    // styling since sites like renshuu.org do faux-ruby styling where they
-    // give these elements styles like 'display: table-row-group'.
-    //
-    // We also make an exception for <span> because pdf.js uses
-    // absolutely-positioned (and hence `display: block`) spans to lay out
-    // characters in vertical text.
-    //
-    // Furthermore, we treat inline-block as inline because YouTube puts
-    // okurigana in a separate inline-block span when using ruby.
-    //
-    // Finally, if an element's parent is inline-block, then the element will
-    // still be laid out "inline" so we allow that too (and that appears to be
-    // used by Kanshudo at least).
-    //
-    // Given all these exceptions, I wonder if we should even both checking
-    // the display property.
-    (['RB', 'RUBY', 'SPAN'].includes(element.tagName) ||
-      ['inline', 'inline-block', 'ruby', 'ruby-base', 'ruby-text'].includes(
-        getComputedStyle(element).display!
-      ) ||
-      (element.parentElement &&
-        getComputedStyle(element.parentElement)?.display === 'inline-block'));
-
-  // Set up a check that each ancestor is visible and actually contains the
-  // point we're looking up.
-  //
-  // We need to do this for a few reasons:
-  //
-  // Firstly, sometimes caretPositionFromPoint can be too helpful and can choose
-  // an element far away.
-  //
-  // (For this we used to simply check that `inlineAncestor` is an inclusive
-  // ancestor of the result of document.elementFromPoint but using the bounding
-  // box seems like it should be a bit more robust, especially if
-  // caretPositionFromPoint is more clever than elementFromPoint in locating
-  // covered-up text.)
-  //
-  //
-  // Secondly, sites like asahi.com use "covering links" with the following
-  // structure:
-  //
-  // <div>
-  //   <a href="/articles/" style="position: absolute; top: 0; bottom: 0; left: 0; right: 0; z-index: 1">
-  //     <span aria-hidden="true" style="display: block; width: 1px; height: 1px; overflow: hidden">
-  //       あいうえお
-  //     </span>
-  //   </a>
-  // </div>
-  // <div>
-  //   <div style="position: relative; width: 100%">
-  //     <h2 style="z-index: auto">
-  //       <a href="/articles/" id="innerLink">
-  //         あいうえお
-  //       </a>
-  //     </h2>
-  //   </div>
-  // </div>
-  //
-  // We will initially pick up the あういえお text from the <a> element, but
-  // we want to ignore that it since it is "hidden" by giving it a width/height
-  // of 1px.
-  //
-  // Note that we can't just check for aria-hidden !== "true" because asahi.com
-  // also has links marked as aria-hidden="true" that are definitely NOT hidden.
-  //
-  // nikkei.com has a somewhat similar structure but without using or setting
-  // width/height to 1px. Instead it uses an opacity of 0 to hide the covering
-  // link so we need to check for that too.
-  const isVisible = (element: Element) => {
-    return (
-      getComputedStyle(element).opacity !== '0' &&
-      // If the element is display: contents the bounding box will be empty
-      (getComputedStyle(element).display === 'contents' ||
-        bboxIncludesPoint({
-          bbox: element.getBoundingClientRect(),
-          margin: 5,
-          point,
-        }))
-    );
-  };
-
-  // Get the ancestor node for all inline nodes
-  let inlineAncestor = startNode.parentElement;
-
-  // Check the direct parent, if available, is visible.
-  //
-  // If it is not, return null. This is particularly important for the "covering
-  // link" case described above since it will give us a chance to search for the
-  // real link text.
-  //
-  // (Note that here, and below if there is no inline ancestor we do NOT want to
-  // return null because we commonly encounter that case when using synthesized
-  // text nodes.)
-  if (inlineAncestor && !isVisible(inlineAncestor)) {
-    return null;
-  }
-
-  while (isInline(inlineAncestor) && !isRubyAnnotationElement(inlineAncestor)) {
-    inlineAncestor = inlineAncestor!.parentElement;
-    if (inlineAncestor && !isVisible(inlineAncestor)) {
-      return null;
-    }
-  }
-
-  // Skip ruby annotation elements when traversing. However, don't do that
-  // if the inline ancestor is itself a ruby annotation element or else
-  // we'll never be able to find the starting point within the tree walker.
-  let filter: NodeFilter | undefined;
-  if (!isRubyAnnotationElement(inlineAncestor)) {
-    filter = {
-      acceptNode: (node) =>
-        isRubyAnnotationElement(node.parentElement)
-          ? NodeFilter.FILTER_REJECT
-          : NodeFilter.FILTER_ACCEPT,
-    };
-  }
-
-  // Setup a treewalker starting at the current node
-  const treeWalker = document.createNodeIterator(
-    inlineAncestor || startNode,
-    NodeFilter.SHOW_TEXT,
-    filter
-  );
-  while (treeWalker.referenceNode !== startNode && treeWalker.nextNode());
-
-  if (treeWalker.referenceNode !== startNode) {
-    console.error('Could not find node in tree', startNode);
-    return null;
-  }
-
-  // Look for start, skipping any initial whitespace
-  let node: CharacterData = startNode;
-  let offset: number = startOffset;
-  do {
-    const nodeText = node.data.substring(offset);
-    const textStart = nodeText.search(/\S/);
-    if (textStart !== -1) {
-      offset += textStart;
-      break;
-    }
-    // Curiously with our synthesized text nodes, the next node can sometimes
-    // be the same node. We only tend to reach that case, however, when our
-    // offset corresponds to the end of the text so we just detect that case
-    // earlier on and don't bother checking it here.
-    node = <CharacterData>treeWalker.nextNode();
-    offset = 0;
-  } while (node);
-  // (This should probably not traverse block siblings but oh well)
-
-  if (!node) {
-    return null;
-  }
-
-  const result: GetTextAtPointResult = {
-    text: '',
-    textRange: [],
-  };
-
-  let textDelimiter = nonJapaneseChar;
-
-  // Look for range ends
-  do {
-    const nodeText = node.data.substring(offset);
-    let textEnd = nodeText.search(textDelimiter);
-
-    // Check if we are looking at a special string that accepts a different
-    // range of characters.
-    if (textDelimiter === nonJapaneseChar) {
-      const currentText =
-        result.text +
-        nodeText.substring(0, textEnd === -1 ? undefined : textEnd);
-
-      // If the source starts with a number, expand our text delimeter to allow
-      // reading the rest of the number since it might be something like 5つ.
-      if (!currentText.length && startsWithNumber(nodeText)) {
-        textDelimiter = nonJapaneseCharOrNumber;
-      }
-
-      // Check if we should further expand the set of allowed characters in
-      // order to recognize certains types of metadata-type strings (e.g. years
-      // or floor space measurements).
-      ({ textDelimiter, textEnd } = lookForMetadata({
-        currentText,
-        matchCurrency,
-        nodeText,
-        textDelimiter,
-        textEnd,
-      }));
-    }
-
-    if (typeof maxLength === 'number' && maxLength >= 0) {
-      const maxEnd = maxLength - result.text.length;
-      if (textEnd === -1) {
-        // The >= here is important since it means that if the node has
-        // exactly enough characters to reach the maxLength then we will
-        // stop walking the tree at this point.
-        textEnd = node.data.length - offset >= maxEnd ? maxEnd : -1;
-      } else {
-        textEnd = Math.min(textEnd, maxEnd);
-      }
-    }
+  point: Point;
+}): [position: CursorPosition, scanNode: Text | null] | [null, null] {
+  let position = getCursorPosition({ point, elements });
 
-    if (textEnd === 0) {
-      // There are no characters here for us.
-      break;
-    } else if (textEnd !== -1) {
-      // The text node has disallowed characters mid-way through so
-      // return up to that point.
-      result.text += nodeText.substring(0, textEnd);
-      result.textRange!.push({
-        node,
-        start: offset,
-        end: offset + textEnd,
-      });
-      break;
+  // If we have a textual <input> node or a <textarea> we synthesize a
+  // text node and use that for finding text since it allows us to re-use
+  // the same handling for text nodes and 'value' attributes.
+  if (isTextInputPosition(position)) {
+    if (position.offset === position.offsetNode.value.length) {
+      return [null, null];
     }
 
-    // The whole text node is allowed characters, keep going.
-    result.text += nodeText;
-    result.textRange!.push({
-      node,
-      start: offset,
-      end: node.data.length,
-    });
-    node = <CharacterData>treeWalker.nextNode();
-    offset = 0;
-  } while (
-    node &&
-    inlineAncestor &&
-    (node.parentElement === inlineAncestor || isInline(node.parentElement))
-  );
-
-  // Check if we didn't find any suitable characters
-  if (!result.textRange!.length) {
-    return null;
+    return [position, document.createTextNode(position.offsetNode.value)];
   }
 
-  result.meta = extractGetTextMetadata({ text: result.text, matchCurrency });
-
-  return result;
-}
-
-function getParentLink(node: Node | null): HTMLAnchorElement | null {
-  if (node && node.nodeType === Node.ELEMENT_NODE) {
-    return (node as Element).closest('a');
-  }
-
-  if (isTextNode(node)) {
-    return node.parentElement ? node.parentElement.closest('a') : null;
-  }
-
-  return null;
-}
-
-// Take care of "covering links". "Convering links" is the name we give to the
-// approach used by at least asahi.com and nikkei.com on their homepages where
-// they create a big <a> element and a tiny (1px x 1px) span with the link text
-// and then render the actual link content in a separate layer.
-//
-// Roughly it looks something like the following:
-//
-// <div>
-//   <a> <-- Link to article with abs-pos left/right/top/bottom: 0
-//     <span/> <-- Link text as a 1x1 div
-//   </a>
-//   <div> <!-- Actual link content
-//     <figure/>
-//     <h2><a>Link text again</a></h2>
-//     etc.
-//   </div>
-// </div>
-//
-// If we fail to find any text but are pointing at a link, we should try digging
-// for content underneath the link
-function getTextFromCoveringLink({
-  linkElem,
-  originalElem,
-  point,
-  matchCurrency,
-  maxLength,
-}: {
-  linkElem: HTMLAnchorElement;
-  originalElem: Node | null;
-  point: Point;
-  matchCurrency: boolean;
-  maxLength?: number;
-}): GetTextAtPointResult | null {
-  // We'd like to just turn off pointer-events and see what we find but that
-  // will introduce flickering when links have transitions defined on them.
-  //
-  // Instead we first probe to see if there is likely to be some other text
-  // underneath and only toggle pointer-events when that's the case.
-  const hasCoveredElements = document
-    .elementsFromPoint(point.x, point.y)
-    .some((elem) => !elem.contains(linkElem));
-  if (!hasCoveredElements) {
-    return null;
-  }
-
-  // Turn off pointer-events for the covering link
-  const previousPointEvents = linkElem.style.pointerEvents;
-  linkElem.style.pointerEvents = 'none';
-
-  const position = caretPositionFromPoint(point);
-
-  linkElem.style.pointerEvents = previousPointEvents;
+  // Similarly, if we have a Google Docs node, synthesize a node to scan.
+  if (isGdocsOverlayPosition(position)) {
+    let text = '';
+    ({ position, text } = getTextFromAnnotatedCanvas({
+      maxLength,
+      point,
+    }));
 
-  // See if we successfully found a different text node
-  if (
-    !position ||
-    position.offsetNode === originalElem ||
-    !isTextNode(position.offsetNode)
-  ) {
-    return null;
+    return position ? [position, document.createTextNode(text)] : [null, null];
   }
 
-  return getTextFromTextNode({
-    startNode: position.offsetNode,
-    startOffset: position.offset,
-    point,
-    matchCurrency,
-    maxLength,
-  });
+  return [position, null];
 }
 
 function getTextFromRandomElement({
@@ -936,9 +227,7 @@ function getTextFromRandomElement({
   // We divide the world into two types of elements: image-like elements and the
   // rest which we presume to be "text" elements.
   const isImage = getContentType(elem) === 'image';
-  if (isImage && !matchImages) {
-    return null;
-  } else if (!isImage && !matchText) {
+  if ((isImage && !matchImages) || (!isImage && !matchText)) {
     return null;
   }
 
diff --git a/src/content/scan-text.ts b/src/content/scan-text.ts
new file mode 100644
index 0000000000..0f248f0a58
--- /dev/null
+++ b/src/content/scan-text.ts
@@ -0,0 +1,196 @@
+import {
+  nonJapaneseChar,
+  nonJapaneseCharOrNumber,
+  startsWithNumber,
+} from '../utils/char-range';
+import { CursorPosition } from './get-cursor-position';
+import { GetTextAtPointResult } from './get-text';
+import { extractGetTextMetadata, lookForMetadata } from './meta';
+
+export function scanText({
+  startPosition,
+  matchCurrency,
+  maxLength,
+}: {
+  startPosition: CursorPosition<Text>;
+  matchCurrency: boolean;
+  maxLength?: number;
+}): GetTextAtPointResult | null {
+  const { offsetNode: startNode, offset: startOffset } = startPosition;
+
+  // Get the ancestor node for all inline nodes
+  let inlineAncestor = startNode.parentElement;
+  while (isInline(inlineAncestor) && !isRubyAnnotationElement(inlineAncestor)) {
+    inlineAncestor = inlineAncestor!.parentElement;
+  }
+
+  // Skip ruby annotation elements when traversing. However, don't do that
+  // if the inline ancestor is itself a ruby annotation element or else
+  // we'll never be able to find the starting point within the tree walker.
+  let filter: NodeFilter | undefined;
+  if (!isRubyAnnotationElement(inlineAncestor)) {
+    filter = {
+      acceptNode: (node) =>
+        isRubyAnnotationElement(node.parentElement)
+          ? NodeFilter.FILTER_REJECT
+          : NodeFilter.FILTER_ACCEPT,
+    };
+  }
+
+  // Set up a tree walker starting at the current node
+  const treeWalker = document.createNodeIterator(
+    inlineAncestor || startNode,
+    NodeFilter.SHOW_TEXT,
+    filter
+  );
+  while (treeWalker.referenceNode !== startNode && treeWalker.nextNode());
+
+  if (treeWalker.referenceNode !== startNode) {
+    console.error('Could not find node in tree', startNode);
+    return null;
+  }
+
+  // Look for start, skipping any initial whitespace
+  let node = startNode;
+  let offset = startOffset;
+  do {
+    const nodeText = node.data.substring(offset);
+    const textStart = nodeText.search(/\S/);
+    if (textStart !== -1) {
+      offset += textStart;
+      break;
+    }
+    // Curiously with our synthesized text nodes, the next node can sometimes
+    // be the same node. We only tend to reach that case, however, when our
+    // offset corresponds to the end of the text so we just detect that case
+    // earlier on and don't bother checking it here.
+    node = <Text>treeWalker.nextNode();
+    offset = 0;
+  } while (node);
+  // (This should probably not traverse block siblings but oh well)
+
+  if (!node) {
+    return null;
+  }
+
+  const result: GetTextAtPointResult = {
+    text: '',
+    textRange: [],
+  };
+
+  let textDelimiter = nonJapaneseChar;
+
+  // Look for range ends
+  do {
+    const nodeText = node.data.substring(offset);
+    let textEnd = nodeText.search(textDelimiter);
+
+    // Check if we are looking at a special string that accepts a different
+    // range of characters.
+    if (textDelimiter === nonJapaneseChar) {
+      const currentText =
+        result.text +
+        nodeText.substring(0, textEnd === -1 ? undefined : textEnd);
+
+      // If the source starts with a number, expand our text delimiter to allow
+      // reading the rest of the number since it might be something like 5つ.
+      if (!currentText.length && startsWithNumber(nodeText)) {
+        textDelimiter = nonJapaneseCharOrNumber;
+      }
+
+      // Check if we should further expand the set of allowed characters in
+      // order to recognize certain types of metadata-type strings (e.g. years
+      // or floor space measurements).
+      ({ textDelimiter, textEnd } = lookForMetadata({
+        currentText,
+        matchCurrency,
+        nodeText,
+        textDelimiter,
+        textEnd,
+      }));
+    }
+
+    if (typeof maxLength === 'number' && maxLength >= 0) {
+      const maxEnd = maxLength - result.text.length;
+      if (textEnd === -1) {
+        // The >= here is important since it means that if the node has
+        // exactly enough characters to reach the maxLength then we will
+        // stop walking the tree at this point.
+        textEnd = node.data.length - offset >= maxEnd ? maxEnd : -1;
+      } else {
+        textEnd = Math.min(textEnd, maxEnd);
+      }
+    }
+
+    if (textEnd === 0) {
+      // There are no characters here for us.
+      break;
+    } else if (textEnd !== -1) {
+      // The text node has disallowed characters mid-way through so
+      // return up to that point.
+      result.text += nodeText.substring(0, textEnd);
+      result.textRange!.push({
+        node,
+        start: offset,
+        end: offset + textEnd,
+      });
+      break;
+    }
+
+    // The whole text node is allowed characters, keep going.
+    result.text += nodeText;
+    result.textRange!.push({
+      node,
+      start: offset,
+      end: node.data.length,
+    });
+    node = <Text>treeWalker.nextNode();
+    offset = 0;
+  } while (
+    node &&
+    inlineAncestor &&
+    (node.parentElement === inlineAncestor || isInline(node.parentElement))
+  );
+
+  // Check if we didn't find any suitable characters
+  if (!result.textRange!.length) {
+    return null;
+  }
+
+  result.meta = extractGetTextMetadata({ text: result.text, matchCurrency });
+
+  return result;
+}
+
+function isRubyAnnotationElement(element: Element | null) {
+  return element && ['RP', 'RT'].includes(element.tagName);
+}
+
+function isInline(element: Element | null) {
+  return (
+    element &&
+    // We always treat <rb> and <ruby> tags as inline regardless of the styling
+    // since sites like renshuu.org do faux-ruby styling where they give these
+    // elements styles like 'display: table-row-group'.
+    //
+    // We also make an exception for <span> because pdf.js uses
+    // absolutely-positioned (and hence `display: block`) spans to lay out
+    // characters in vertical text.
+    //
+    // Furthermore, we treat inline-block as inline because YouTube puts
+    // okurigana in a separate inline-block span when using ruby.
+    //
+    // Finally, if an element's parent is inline-block, then the element will
+    // still be laid out "inline" so we allow that too (and that appears to be
+    // used by Kanshudo at least).
+    //
+    // Given all these exceptions, I wonder if we should even bother checking
+    // the display property.
+    (['RB', 'RUBY', 'SPAN'].includes(element.tagName) ||
+      ['inline', 'inline-block', 'ruby', 'ruby-base', 'ruby-text'].includes(
+        getComputedStyle(element).display!
+      ) ||
+      (element.parentElement &&
+        getComputedStyle(element.parentElement)?.display === 'inline-block'))
+  );
+}
diff --git a/src/utils/dom-utils.ts b/src/utils/dom-utils.ts
index 21ddfcecba..e44af3f240 100644
--- a/src/utils/dom-utils.ts
+++ b/src/utils/dom-utils.ts
@@ -72,7 +72,7 @@ export function isTextInputNode(
   );
 }
 
-export const isTextNode = (node: Node | null): node is CharacterData =>
+export const isTextNode = (node: Node | null): node is Text =>
   !!node && node.nodeType === Node.TEXT_NODE;
 
 export function isSvg(node: Node): boolean {
diff --git a/src/utils/range.ts b/src/utils/range.ts
new file mode 100644
index 0000000000..60e8183948
--- /dev/null
+++ b/src/utils/range.ts
@@ -0,0 +1,36 @@
+/**
+ * Gets a Range covering a single codepoint next to a UTF-16 code unit offset.
+ * 'forwards' selects the codepoint starting at the offset; 'backwards' selects
+ * the one ending there. A mid-codepoint offset snaps to the next boundary.
+ */
+export function getRangeForSingleCodepoint({
+  source,
+  offset,
+  direction = 'forwards',
+}: {
+  source: Text;
+  offset: number;
+  direction?: 'forwards' | 'backwards';
+}): Range {
+  // Scan the string in place rather than copying the whole text into an array
+  // of codepoints and shifting entries off the front of it.
+  const { data } = source;
+  const lengthAt = (i: number) => (data.codePointAt(i)! > 0xffff ? 2 : 1);
+  // Advance whole codepoints until we reach the offset or the end of the text.
+  let codepointStart = 0;
+  let lastCodepointLength = 0;
+  while (codepointStart < offset && codepointStart < data.length) {
+    lastCodepointLength = lengthAt(codepointStart);
+    codepointStart += lastCodepointLength;
+  }
+
+  // With no following (forwards) or preceding (backwards) codepoint the
+  // corresponding length is zero and the Range collapses.
+  const nextLen = codepointStart < data.length ? lengthAt(codepointStart) : 0;
+  const forwards = direction === 'forwards';
+
+  const range = new Range();
+  range.setStart(source, codepointStart - (forwards ? 0 : lastCodepointLength));
+  range.setEnd(source, codepointStart + (forwards ? nextLen : 0));
+  return range;
+}
diff --git a/tests/get-text.test.ts b/tests/get-text.test.ts
index d3b7aa0785..bab1ebf68c 100644
--- a/tests/get-text.test.ts
+++ b/tests/get-text.test.ts
@@ -178,7 +178,7 @@ describe('getTextAtPoint', () => {
     );
   });
 
-  it('should find text in a block cousin if there the grandparent is inline-block', () => {
+  it('should find text in a block cousin if the grandparent is inline-block', () => {
     // Based on https://www.kanshudo.com/grammar/%E3%81%AA%E3%81%84%E3%81%A7%E3%83%BB%E3%81%AA%E3%81%8F%E3%81%A6%E3%83%BB%E3%81%9A%E3%81%AB
     testDiv.innerHTML =
       '<a><span style="display: inline-block"><div>あら</div><div>洗</div></span>わないで</a>';
@@ -238,9 +238,9 @@ describe('getTextAtPoint', () => {
     assertTextResultEqual(result, 'うえお', [lastTextNode, 0, 3]);
   });
 
-  it('should dig into the content behind covering links', () => {
+  it('should dig into the content behind covering links hidden with geometry', () => {
     // The following is based very heavily on the structure of article previews
-    // in asahi.com as of 2021-05-22 although nikkei.com is similar
+    // in asahi.com as of 2021-05-22.
     testDiv.innerHTML =
       '<div><a href="/articles/" style="position: absolute; top: 0; bottom: 0; left: 0; right: 0; z-index: 1"><span aria-hidden="true" style="display: block; width: 1px; height: 1px; overflow: hidden">あいうえお</span></a><div><div style="position: relative; width: 100%"><h2 style="z-index: auto"><a href="/articles/" id="innerLink">あいうえお</a></h2></div></div>';
 
@@ -257,6 +257,55 @@ describe('getTextAtPoint', () => {
     assertTextResultEqual(result, 'いうえお', [textNode, 1, 5]);
   });
 
+  it('should dig into the content behind covering links hidden with opacity', () => {
+    // The following is based on the structure of article previews from
+    // nikkei.com
+    testDiv.innerHTML =
+      '<a href="/articles/" style="position: absolute; top: 0; bottom: 0; left: 0; right: 0; overflow: hidden; opacity: 0">オーバーレイ</a><div style="padding-left: 20px"><h2 style="width: 100%"><a href="/articles/"><span id="innerSpan">あいうえお</span></a></h2></div>';
+
+    const textNode = testDiv.querySelector('#innerSpan')!.firstChild as Text;
+    const bbox = getBboxForOffset(textNode, 1);
+
+    const result = getTextAtPoint({
+      point: {
+        x: bbox.left + bbox.width / 2,
+        y: bbox.top + bbox.height / 2,
+      },
+    });
+
+    assertTextResultEqual(result, 'いうえお', [textNode, 1, 5]);
+  });
+
+  it('should find text in user-select: all content', () => {
+    testDiv.innerHTML = '<span style="user-select: all">あいうえお</span>';
+    const textNode = testDiv.firstChild!.firstChild as Text;
+    const bbox = getBboxForOffset(textNode, 1);
+
+    const result = getTextAtPoint({
+      point: {
+        x: bbox.left + bbox.width / 2,
+        y: bbox.top + bbox.height / 2,
+      },
+    });
+
+    assertTextResultEqual(result, 'いうえお', [textNode, 1, 5]);
+  });
+
+  it('should find text in user-select: none content', () => {
+    testDiv.innerHTML = '<span style="user-select: none">あいうえお</span>';
+    const textNode = testDiv.firstChild!.firstChild as Text;
+    const bbox = getBboxForOffset(textNode, 1);
+
+    const result = getTextAtPoint({
+      point: {
+        x: bbox.left + bbox.width / 2,
+        y: bbox.top + bbox.height / 2,
+      },
+    });
+
+    assertTextResultEqual(result, 'いうえお', [textNode, 1, 5]);
+  });
+
   it('should ignore non-Japanese characters', () => {
     testDiv.append('あいabc');
     const textNode = testDiv.firstChild as Text;
@@ -775,6 +824,7 @@ describe('getTextAtPoint', () => {
 
     for (const move of moves) {
       empty(testDiv);
+      clearPreviousResult();
       testDiv.append(`${move}です`);
       const textNode = testDiv.firstChild as Text;
       const bbox = getBboxForOffset(textNode, 0);
@@ -817,6 +867,7 @@ describe('getTextAtPoint', () => {
 
     // Try again with an all kanji match that should be treated as a number
     empty(testDiv);
+    clearPreviousResult();
     testDiv.append('八三銀です');
     result = getTextAtPoint({
       point: {
@@ -1268,11 +1319,11 @@ describe('getTextAtPoint', () => {
     // _should_ have returned the previous character to what it did).
     //
     // As a result, this may need tweaking from time to time. For now,
-    // hopefully 15px does the trick on all browsers and platforms we test on.
+    // hopefully these values do the trick on all browsers and platforms we test
+    // on.
     const offset = isChromium() ? 13 : 15;
 
     const result = getTextAtPoint({
-      // Just guess here...
       point: { x: bbox.left + offset, y: bbox.top + bbox.height / 2 },
     });
 
diff --git a/tests/range.test.ts b/tests/range.test.ts
new file mode 100644
index 0000000000..6ff01a6203
--- /dev/null
+++ b/tests/range.test.ts
@@ -0,0 +1,51 @@
+import { assert } from 'chai';
+
+import { getRangeForSingleCodepoint } from '../src/utils/range';
+
+mocha.setup('bdd');
+
+describe('getRangeForSingleCodepoint', () => {
+  it('should handle non-BMP characters', () => {
+    const source = new Text('𠏹沢');
+
+    let range = getRangeForSingleCodepoint({ source, offset: 0 });
+    assert.strictEqual(range.startOffset, 0);
+    assert.strictEqual(range.endOffset, 2);
+
+    range = getRangeForSingleCodepoint({ source, offset: 2 });
+    assert.strictEqual(range.startOffset, 2);
+    assert.strictEqual(range.endOffset, 3);
+
+    range = getRangeForSingleCodepoint({
+      source,
+      offset: 2,
+      direction: 'backwards',
+    });
+    assert.strictEqual(range.startOffset, 0);
+    assert.strictEqual(range.endOffset, 2);
+
+    // Mid-character skips to the next character... just because that's simpler
+    // for now
+    range = getRangeForSingleCodepoint({ source, offset: 1 });
+    assert.strictEqual(range.startOffset, 2);
+    assert.strictEqual(range.endOffset, 3);
+  });
+
+  it('should handle out of range offsets', () => {
+    let range = getRangeForSingleCodepoint({ source: new Text(''), offset: 0 });
+    assert.strictEqual(range.startOffset, 0);
+    assert.strictEqual(range.endOffset, 0);
+
+    range = getRangeForSingleCodepoint({ source: new Text(''), offset: -1 });
+    assert.strictEqual(range.startOffset, 0);
+    assert.strictEqual(range.endOffset, 0);
+
+    range = getRangeForSingleCodepoint({ source: new Text(''), offset: 5 });
+    assert.strictEqual(range.startOffset, 0);
+    assert.strictEqual(range.endOffset, 0);
+
+    range = getRangeForSingleCodepoint({ source: new Text('abc'), offset: 5 });
+    assert.strictEqual(range.startOffset, 3);
+    assert.strictEqual(range.endOffset, 3);
+  });
+});