|
@@ -113,7 +113,7 @@ def _extract_text_by_mime_type(*, file_content: bytes, mime_type: str) -> str:
|
|
|
def _extract_text_by_file_extension(*, file_content: bytes, file_extension: str) -> str:
|
|
|
"""Extract text from a file based on its file extension."""
|
|
|
match file_extension:
|
|
|
- case ".txt" | ".markdown" | ".md" | ".html" | ".htm" | ".xml":
|
|
|
+ case ".txt" | ".markdown" | ".md" | ".html" | ".htm" | ".xml" | ".vtt":
|
|
|
return _extract_text_from_plain_text(file_content)
|
|
|
case ".json":
|
|
|
return _extract_text_from_json(file_content)
|