| def _extract_text_by_file_extension(*, file_content: bytes, file_extension: str) -> str: | def _extract_text_by_file_extension(*, file_content: bytes, file_extension: str) -> str: | ||||
| """Extract text from a file based on its file extension.""" | """Extract text from a file based on its file extension.""" | ||||
| match file_extension: | match file_extension: | ||||
| case ".txt" | ".markdown" | ".md" | ".html" | ".htm" | ".xml": | |||||
| case ".txt" | ".markdown" | ".md" | ".html" | ".htm" | ".xml" | ".vtt": | |||||
| return _extract_text_from_plain_text(file_content) | return _extract_text_from_plain_text(file_content) | ||||
| case ".json": | case ".json": | ||||
| return _extract_text_from_json(file_content) | return _extract_text_from_json(file_content) |