Browse Source

fix nltk averaged_perceptron_tagger download and fix score limit is none (#7582)

Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
tags/0.7.2
Jyong 1 year ago
parent
commit
7ae728a9a3
No account linked to committer's email address
3 changed files with 3 additions and 1 deletion
  1. 1
    0
      api/.idea/vcs.xml
  2. 1
    1
      api/Dockerfile
  3. 1
    0
      api/core/rag/retrieval/dataset_retrieval.py

+ 1
- 0
api/.idea/vcs.xml View File

  </component>
  <component name="VcsDirectoryMappings">
  <mapping directory="" vcs="Git" />
+ <mapping directory="$PROJECT_DIR$/.." vcs="Git" />
  </component>
  </project>

+ 1
- 1
api/Dockerfile View File

  ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"


  # Download nltk data
- RUN python -c "import nltk; nltk.download('punkt')"
+ RUN python -c "import nltk; nltk.download('punkt'); nltk.download('averaged_perceptron_tagger')"


  # Copy source code
  COPY . /app/api/

+ 1
- 0
api/core/rag/retrieval/dataset_retrieval.py View File

for document in all_documents:
    if score_threshold is None or document.metadata['score'] >= score_threshold:
        filter_documents.append(document)

if not filter_documents:
    return []
filter_documents = sorted(filter_documents, key=lambda x: x.metadata['score'], reverse=True)

Loading…
Cancel
Save