MCPcopy
hub / github.com/impira/docquery / ImageDocument

Class ImageDocument

src/docquery/document.py:167–181  ·  view source on GitHub ↗

Source from the content-addressed store, hash-verified

165
166
167class ImageDocument(Document):
168 def __init__(self, b, ocr_reader, **kwargs):
169 self.b = b
170 self.ocr_reader = ocr_reader
171
172 super().__init__(**kwargs)
173
174 @cached_property
175 def preview(self) -> "Image":
176 return [self.b.convert("RGB")]
177
178 @cached_property
179 def context(self) -> Dict[str, List[Tuple["Image.Image", List[Any]]]]:
180 words, boxes = self.ocr_reader.apply_ocr(self.b)
181 return self._generate_document_output([self.b], [words], [boxes], [(self.b.width, self.b.height)])
182
183
184class WebDocument(Document):

Callers 1

load_documentFunction · 0.85

Calls

no outgoing calls

Tested by

no test coverage detected