del doc support (#2494)

Co-authored-by: jyong <jyong@dify.ai>

del doc support (#2494)
Co-authored-by: jyong <jyong@dify.ai>
20b932da · Jyong · GitHub · 207080ba · 20b932da · 20b932da
Unverified commit 20b932da, authored Feb 20, 2024 by Jyong; committed by GitHub on Feb 20, 2024.
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 5 additions and 5 deletions

file_extractor.py api/core/data_loader/file_extractor.py +2 -2

file_service.py api/services/file_service.py +3 -3

No files found.
--- a/api/core/data_loader/file_extractor.py
+++ b/api/core/data_loader/file_extractor.py
@@ -69,7 +69,7 @@ class FileExtractor:
                    else MarkdownLoader(file_path, autodetect_encoding=True)
            elif file_extension in ['.htm', '.html']:
                loader = HTMLLoader(file_path)
-            elif file_extension in ['.docx', '.doc']:
+            elif file_extension in ['.docx']:
                loader = Docx2txtLoader(file_path)
            elif file_extension == '.csv':
                loader = CSVLoader(file_path, autodetect_encoding=True)
@@ -96,7 +96,7 @@ class FileExtractor:
                loader = MarkdownLoader(file_path, autodetect_encoding=True)
            elif file_extension in ['.htm', '.html']:
                loader = HTMLLoader(file_path)
-            elif file_extension in ['.docx', '.doc']:
+            elif file_extension in ['.docx']:
                loader = Docx2txtLoader(file_path)
            elif file_extension == '.csv':
                loader = CSVLoader(file_path, autodetect_encoding=True)

--- a/api/services/file_service.py
+++ b/api/services/file_service.py
@@ -20,9 +20,9 @@ from services.errors.file import FileTooLargeError, UnsupportedFileTypeError
 IMAGE_EXTENSIONS = ['jpg', 'jpeg', 'png', 'webp', 'gif', 'svg']
 IMAGE_EXTENSIONS.extend([ext.upper() for ext in IMAGE_EXTENSIONS])
-ALLOWED_EXTENSIONS = ['txt', 'markdown', 'md', 'pdf', 'html', 'htm', 'xlsx', 'docx', 'doc', 'csv'] + IMAGE_EXTENSIONS
+ALLOWED_EXTENSIONS = ['txt', 'markdown', 'md', 'pdf', 'html', 'htm', 'xlsx', 'docx', 'csv'] + IMAGE_EXTENSIONS
 UNSTRUSTURED_ALLOWED_EXTENSIONS = ['txt', 'markdown', 'md', 'pdf', 'html', 'htm', 'xlsx',
-                                      'docx', 'doc', 'csv', 'eml', 'msg', 'pptx', 'ppt', 'xml'] + IMAGE_EXTENSIONS
+                                   'docx', 'csv', 'eml', 'msg', 'pptx', 'ppt', 'xml'] + IMAGE_EXTENSIONS
 PREVIEW_WORDS_LIMIT = 3000
@@ -162,7 +162,7 @@ class FileService:
        generator = storage.load(upload_file.key, stream=True)
        return generator, upload_file.mime_type
    @staticmethod
    def get_public_image_preview(file_id: str) -> str:
        upload_file = db.session.query(UploadFile) \