| self._file_cache_key = file_cache_key | self._file_cache_key = file_cache_key | ||||
| def extract(self) -> list[Document]: | def extract(self) -> list[Document]: | ||||
| plaintext_file_key = "" | |||||
| plaintext_file_exists = False | plaintext_file_exists = False | ||||
| if self._file_cache_key: | if self._file_cache_key: | ||||
| try: | try: | ||||
| text = "\n\n".join(text_list) | text = "\n\n".join(text_list) | ||||
| # save plaintext file for caching | # save plaintext file for caching | ||||
| if not plaintext_file_exists and plaintext_file_key: | |||||
| storage.save(plaintext_file_key, text.encode("utf-8")) | |||||
| if not plaintext_file_exists and self._file_cache_key: | |||||
| storage.save(self._file_cache_key, text.encode("utf-8")) | |||||
| return documents | return documents | ||||