| 165 | |
| 166 | |
| 167 | class ImageDocument(Document): |
| 168 | def __init__(self, b, ocr_reader, **kwargs): |
| 169 | self.b = b |
| 170 | self.ocr_reader = ocr_reader |
| 171 | |
| 172 | super().__init__(**kwargs) |
| 173 | |
| 174 | @cached_property |
| 175 | def preview(self) -> "Image": |
| 176 | return [self.b.convert("RGB")] |
| 177 | |
| 178 | @cached_property |
| 179 | def context(self) -> Dict[str, List[Tuple["Image.Image", List[Any]]]]: |
| 180 | words, boxes = self.ocr_reader.apply_ocr(self.b) |
| 181 | return self._generate_document_output([self.b], [words], [boxes], [(self.b.width, self.b.height)]) |
| 182 | |
| 183 | |
| 184 | class WebDocument(Document): |