瀏覽代碼

Fix rebuild index&csv parsing (#2705)

Co-authored-by: luowei <redacted: access token was exposed here in place of an email address>
Co-authored-by: crazywoola <427733928@qq.com>
Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
tags/0.5.9
Charlie.Wei 1 年之前
父節點
當前提交
fa7ba30ba3
沒有連結到貢獻者的電子郵件帳戶。
共有 2 個檔案被更改,包括 3 行新增和 2 行刪除
  1. 1
    1
      api/core/indexing_runner.py
  2. 2
    1
      api/core/rag/extractor/csv_extractor.py

+ 1
- 1
api/core/indexing_runner.py 查看文件

first() first()


index_type = dataset_document.doc_form index_type = dataset_document.doc_form
index_processor = IndexProcessorFactory(index_type, processing_rule.to_dict()).init_index_processor()
index_processor = IndexProcessorFactory(index_type).init_index_processor()
self._load( self._load(
index_processor=index_processor, index_processor=index_processor,
dataset=dataset, dataset=dataset,

+ 2
- 1
api/core/rag/extractor/csv_extractor.py 查看文件

from typing import Optional from typing import Optional


from core.rag.extractor.extractor_base import BaseExtractor from core.rag.extractor.extractor_base import BaseExtractor
from core.rag.extractor.helpers import detect_file_encodings
from core.rag.models.document import Document from core.rag.models.document import Document




docs = self._read_from_file(csvfile) docs = self._read_from_file(csvfile)
except UnicodeDecodeError as e: except UnicodeDecodeError as e:
if self._autodetect_encoding: if self._autodetect_encoding:
detected_encodings = detect_filze_encodings(self._file_path)
detected_encodings = detect_file_encodings(self._file_path)
for encoding in detected_encodings: for encoding in detected_encodings:
try: try:
with open(self._file_path, newline="", encoding=encoding.encoding) as csvfile: with open(self._file_path, newline="", encoding=encoding.encoding) as csvfile:

Loading…
取消
儲存