| import datetime | import datetime | ||||
| import hashlib | import hashlib | ||||
| import tempfile | import tempfile | ||||
| import chardet | |||||
| import time | import time | ||||
| import uuid | import uuid | ||||
| from pathlib import Path | from pathlib import Path | ||||
| # ['txt', 'markdown', 'md'] | # ['txt', 'markdown', 'md'] | ||||
| with open(filepath, "rb") as fp: | with open(filepath, "rb") as fp: | ||||
| data = fp.read() | data = fp.read() | ||||
| text = data.decode(encoding='utf-8').strip() if data else '' | |||||
| encoding = chardet.detect(data)['encoding'] | |||||
| text = data.decode(encoding=encoding).strip() if data else '' | |||||
| text = text[0:PREVIEW_WORDS_LIMIT] if text else '' | text = text[0:PREVIEW_WORDS_LIMIT] if text else '' | ||||
| return {'content': text} | return {'content': text} |