Skip to content

Commit 54ed8ae

Browse files
authored
parametrize edge config (#431)
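This PR parametrizes the edge-size configuration (`shortest_edge` and `longest_edge`) of the `DetrImageProcessor` used by the table transformer model, so these values can be set through environment variables instead of being hard-coded to 800 and 1333.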
1 parent 8407827 commit 54ed8ae

File tree

4 files changed

+17
-3
lines changed

4 files changed

+17
-3
lines changed

CHANGELOG.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,7 @@
1+
## 1.0.5-dev0
2+
3+
* feat: parametrize edge config for `DetrImageProcessor` with env variables
4+
15
## 1.0.4
26

37
* feat: use singleton instead of `global` to store shared variables

unstructured_inference/__version__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
__version__ = "1.0.4" # pragma: no cover
1+
__version__ = "1.0.5-dev0" # pragma: no cover

unstructured_inference/config.py

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -106,5 +106,15 @@ def ELEMENTS_V_PADDING_COEF(self) -> float:
106106
"""Same as ELEMENTS_H_PADDING_COEF but the vertical extension."""
107107
return self._get_float("ELEMENTS_V_PADDING_COEF", 0.3)
108108

109+
@property
110+
def IMG_PROCESSOR_LONGEST_EDGE(self) -> int:
111+
"""configuration for DetrImageProcessor to scale images"""
112+
return self._get_int("IMG_PROCESSOR_LONGEST_EDGE", 1333)
113+
114+
@property
115+
def IMG_PROCESSOR_SHORTEST_EDGE(self) -> int:
116+
"""configuration for DetrImageProcessor to scale images"""
117+
return self._get_int("IMG_PROCESSOR_SHORTEST_EDGE", 800)
118+
109119

110120
inference_config = InferenceConfig()

unstructured_inference/models/tables.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -73,8 +73,8 @@ def initialize(
7373
self.feature_extractor = DetrImageProcessor.from_pretrained(model)
7474
# value not set in the configuration and needed for newer models
7575
# https://huggingface.co/microsoft/table-transformer-structure-recognition-v1.1-all/discussions/1
76-
self.feature_extractor.size["shortest_edge"] = 800
77-
self.feature_extractor.size["longest_edge"] = 1333
76+
self.feature_extractor.size["shortest_edge"] = inference_config.IMG_PROCESSOR_SHORTEST_EDGE
77+
self.feature_extractor.size["longest_edge"] = inference_config.IMG_PROCESSOR_LONGEST_EDGE
7878

7979
try:
8080
logger.info("Loading the table structure model ...")

0 commit comments

Comments
 (0)