diff --git a/CHANGELOG.md b/CHANGELOG.md
index 3cb7044e40..1d7e9988fc 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,3 +1,7 @@
+## 0.22.2
+
+- Store routing in ElementMetadata
+
 ## 0.22.1
 
 ### Fixes
diff --git a/unstructured/__version__.py b/unstructured/__version__.py
index 55823cfd96..31dba6e8f3 100644
--- a/unstructured/__version__.py
+++ b/unstructured/__version__.py
@@ -1 +1 @@
-__version__ = "0.22.1"  # pragma: no cover
+__version__ = "0.22.2"  # pragma: no cover
diff --git a/unstructured/documents/elements.py b/unstructured/documents/elements.py
index 4ead6617f4..af52e8cd5f 100644
--- a/unstructured/documents/elements.py
+++ b/unstructured/documents/elements.py
@@ -195,6 +195,10 @@ class ElementMetadata:
     page_number: Optional[int]
     parent_id: Optional[str]
 
+    # -- routing decision (page-level) --
+    routing: Optional[str]
+    routing_score: Optional[float]
+
     # -- e-mail specific metadata fields --
     bcc_recipient: Optional[list[str]]
     cc_recipient: Optional[list[str]]
@@ -250,6 +254,8 @@ def __init__(
         page_name: Optional[str] = None,
         page_number: Optional[int] = None,
         parent_id: Optional[str] = None,
+        routing: Optional[str] = None,
+        routing_score: Optional[float] = None,
         sent_from: Optional[list[str]] = None,
         sent_to: Optional[list[str]] = None,
         signature: Optional[str] = None,
@@ -297,6 +303,8 @@ def __init__(
         self.page_name = page_name
         self.page_number = page_number
         self.parent_id = parent_id
+        self.routing = routing
+        self.routing_score = routing_score
         self.sent_from = sent_from
         self.sent_to = sent_to
         self.signature = signature
@@ -520,6 +528,8 @@ def field_consolidation_strategies(cls) -> dict[str, ConsolidationStrategy]:
             "page_name": cls.FIRST,
             "page_number": cls.FIRST,
             "parent_id": cls.DROP,
+            "routing": cls.DROP,
+            "routing_score": cls.DROP,
             "sent_from": cls.FIRST,
             "sent_to": cls.FIRST,
             "signature": cls.FIRST,