XFA - Support text search in XFA documents.

Moves the logic for highlighting matches out of `TextLayerBuilder` into a new, separate class, `TextHighlighter`, that can be used with both regular PDFs and XFA PDFs. To mimic the current find functionality in XFA, two arrays are created from the XFA rendering to get the text content and map it to DOM nodes. Fixes #13878.
2025-07-09 17:55:37 +02:00 · 2021-08-18 17:02:29 -07:00 · 2021-08-18 17:02:29 -07:00 · bb47128864
commit bb47128864
parent 3c8ee25e05
11 changed files with 531 additions and 238 deletions
--- a/src/display/api.js
+++ b/src/display/api.js
@ -62,6 +62,7 @@ import { MessageHandler } from "../shared/message_handler.js";
 import { Metadata } from "./metadata.js";
 import { OptionalContentConfig } from "./optional_content_config.js";
 import { PDFDataTransportStream } from "./transport_stream.js";
+import { XfaText } from "./xfa_text.js";

 const DEFAULT_RANGE_CHUNK_SIZE = 65536; // 2^16 = 65536
 const RENDERING_CANCELLED_TIMEOUT = 100; // ms
@ -1561,6 +1562,13 @@ class PDFPageProxy {
   *   {@link TextContent} object that represents the page's text content.
   */
  getTextContent(params = {}) {
+    if (this._transport._htmlForXfa) {
+      // TODO: We need to revisit this once the XFA foreground patch lands and
+      // only do this for non-foreground XFA.
+      return this.getXfa().then(xfa => {
+        return XfaText.textContent(xfa);
+      });
+    }
    const readableStream = this.streamTextContent(params);

    return new Promise(function (resolve, reject) {