From d916c71d222ce1126b19cccedf571c60214485dc Mon Sep 17 00:00:00 2001 From: Michal Martyniak Date: Tue, 27 Jan 2026 14:21:14 +0100 Subject: [PATCH 1/2] fix: remove device_map to prevent meta tensor errors in table detection The device_map parameter with HuggingFace Transformers can cause NotImplementedError "Cannot copy out of meta tensor" in multi-threaded contexts when loading TableTransformerForObjectDetection models. This fix: - Removes device_map from DetrImageProcessor.from_pretrained() - Removes device_map from TableTransformerForObjectDetection.from_pretrained() - Uses explicit .to(device) after model loading instead This pattern matches the fix applied to SentenceTransformer models in core-product (commits c8b175f7 and db636932). Error observed in in-vpc customer deployment when using strategy=fast with table detection. --- CHANGELOG.md | 4 ++++ unstructured_inference/models/tables.py | 8 +++----- 2 files changed, 7 insertions(+), 5 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index c71091ce..64947f21 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,3 +1,7 @@ +## 1.1.8 + +- Fix: Remove `device_map` parameter from TableTransformerForObjectDetection to prevent meta tensor errors during multi-threaded table detection + ## 1.1.7 - Update OpenCV-Python to 4.13.0.90 to squash ffmpeg vulnerability CVE-2023-6605 diff --git a/unstructured_inference/models/tables.py b/unstructured_inference/models/tables.py index 3dc3ec1d..57716ef5 100644 --- a/unstructured_inference/models/tables.py +++ b/unstructured_inference/models/tables.py @@ -72,7 +72,7 @@ def initialize( ): """Loads the donut model using the specified parameters""" self.device = device - self.feature_extractor = DetrImageProcessor.from_pretrained(model, device_map=self.device) + self.feature_extractor = DetrImageProcessor.from_pretrained(model) # value not set in the configuration and needed for newer models # 
https://huggingface.co/microsoft/table-transformer-structure-recognition-v1.1-all/discussions/1 self.feature_extractor.size["shortest_edge"] = inference_config.IMG_PROCESSOR_SHORTEST_EDGE @@ -82,10 +82,8 @@ def initialize( logger.info("Loading the table structure model ...") cached_current_verbosity = logging.get_verbosity() logging.set_verbosity_error() - self.model = TableTransformerForObjectDetection.from_pretrained( - model, - device_map=self.device, - ) + self.model = TableTransformerForObjectDetection.from_pretrained(model) + self.model.to(self.device) logging.set_verbosity(cached_current_verbosity) self.model.eval() From ae4d40a776ef8d47683beffad0a7aff28d45d690 Mon Sep 17 00:00:00 2001 From: Michal Martyniak Date: Wed, 28 Jan 2026 12:25:35 +0100 Subject: [PATCH 2/2] fix: remove manual pypdfium2 close() calls to prevent finalization errors Removed manual bitmap.close() and page.close() calls in convert_pdf_to_image() to prevent pypdfium2 AssertionError during concurrent PDF processing. Issue: When manually closing child objects (bitmap, page) followed by parent PDF close, pypdfium2's weakref finalizers can run after parent closes, triggering assertion failures in cleanup logic. Solution: Let pypdfium2 finalizers handle resource cleanup automatically. This prevents double-cleanup race conditions and simplifies code. Version: Bumped to 1.1.9 --- CHANGELOG.md | 6 +++- unstructured_inference/inference/layout.py | 33 ++++++++++------------ 2 files changed, 20 insertions(+), 19 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 64947f21..67d638cc 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,6 +1,10 @@ +## 1.1.9 + +- Fix: Remove manual pypdfium2 close() calls to prevent finalization AssertionError during concurrent PDF processing. Let pypdfium2 finalizers handle resource cleanup. 
+ ## 1.1.8 -- Fix: Remove `device_map` parameter from TableTransformerForObjectDetection to prevent meta tensor errors during multi-threaded table detection +- Fix: Remove `device_map` parameter from TableTransformerForObjectDetection to prevent meta tensor errors during multi-threaded table detection. The model is now moved to the target device with an explicit `.to(device)` call after loading. ## 1.1.7 diff --git a/unstructured_inference/inference/layout.py b/unstructured_inference/inference/layout.py index efc8b021..b11bd438 100644 --- a/unstructured_inference/inference/layout.py +++ b/unstructured_inference/inference/layout.py @@ -426,24 +426,21 @@ def convert_pdf_to_image( dpi = inference_config.PDF_RENDER_DPI scale = dpi / 72.0 for i, page in enumerate(pdf, start=1): - try: - if first_page is not None and i < first_page: - continue - if last_page is not None and i > last_page: - break - bitmap = page.render( - scale=scale, - no_smoothtext=False, - no_smoothimage=False, - no_smoothpath=False, - optimize_mode="print", - ) - try: - images[i] = bitmap.to_pil() - finally: - bitmap.close() - finally: - page.close() + if first_page is not None and i < first_page: + continue + if last_page is not None and i > last_page: + break + bitmap = page.render( + scale=scale, + no_smoothtext=False, + no_smoothimage=False, + no_smoothpath=False, + optimize_mode="print", + ) + # Convert to PIL immediately, then let pypdfium2 finalizers handle cleanup + images[i] = bitmap.to_pil() + # No manual close - prevents finalization race with parent PDF close + if not output_folder: return list(images.values()) else: