Unverified commit fa7ba30b, authored by Charlie.Wei, committed by GitHub

Fix rebuild index&csv parsing (#2705)

Co-authored-by: luowei <glpat-EjySCyNjWiLqAED-YmwM>
Co-authored-by: crazywoola <427733928@qq.com>
Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
parent 1cf5f510
...@@ -186,7 +186,7 @@ class IndexingRunner: ...@@ -186,7 +186,7 @@ class IndexingRunner:
first() first()
index_type = dataset_document.doc_form index_type = dataset_document.doc_form
index_processor = IndexProcessorFactory(index_type, processing_rule.to_dict()).init_index_processor() index_processor = IndexProcessorFactory(index_type).init_index_processor()
self._load( self._load(
index_processor=index_processor, index_processor=index_processor,
dataset=dataset, dataset=dataset,
......
...@@ -3,6 +3,7 @@ import csv ...@@ -3,6 +3,7 @@ import csv
from typing import Optional from typing import Optional
from core.rag.extractor.extractor_base import BaseExtractor from core.rag.extractor.extractor_base import BaseExtractor
from core.rag.extractor.helpers import detect_file_encodings
from core.rag.models.document import Document from core.rag.models.document import Document
...@@ -36,7 +37,7 @@ class CSVExtractor(BaseExtractor): ...@@ -36,7 +37,7 @@ class CSVExtractor(BaseExtractor):
docs = self._read_from_file(csvfile) docs = self._read_from_file(csvfile)
except UnicodeDecodeError as e: except UnicodeDecodeError as e:
if self._autodetect_encoding: if self._autodetect_encoding:
detected_encodings = detect_filze_encodings(self._file_path) detected_encodings = detect_file_encodings(self._file_path)
for encoding in detected_encodings: for encoding in detected_encodings:
try: try:
with open(self._file_path, newline="", encoding=encoding.encoding) as csvfile: with open(self._file_path, newline="", encoding=encoding.encoding) as csvfile:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment