|
|
|
@@ -138,7 +138,7 @@ export default { |
|
|
|
fromMessage: 'Missing start page number', |
|
|
|
toPlaceholder: 'to', |
|
|
|
toMessage: 'Missing end page number (excluded)', |
|
|
|
layoutRecognize: 'Document parser', |
|
|
|
layoutRecognize: 'PDF parser', |
|
|
|
layoutRecognizeTip: |
|
|
|
'Use a visual model for PDF layout analysis to effectively locate document titles, text blocks, images, and tables. If the naive option is chosen, only the plain text in the PDF will be retrieved. Please note that this option currently works ONLY for PDF documents.', |
|
|
|
taskPageSize: 'Task page size', |
|
|
|
@@ -161,7 +161,7 @@ export default { |
|
|
|
rerankTip: `If left empty, RAGFlow will use a combination of weighted keyword similarity and weighted vector cosine similarity; if a rerank model is selected, a weighted reranking score will replace the weighted vector cosine similarity. Please be aware that using a rerank model will significantly increase the system's response time.`, |
|
|
|
topK: 'Top-K', |
|
|
|
topKTip: `K chunks will be sent into the rerank model.`, |
|
|
|
delimiter: `Delimiters`, |
|
|
|
delimiter: `Delimiter for text`, |
|
|
|
delimiterTip: |
|
|
|
'A delimiter or separator can consist of one or multiple special characters. If it is multiple characters, ensure they are enclosed in backticks( ``). For example, if you configure your delimiters like this: \n`##`;, then your texts will be separated at line breaks, double hash symbols (##), or semicolons.', |
|
|
|
html4excel: 'Excel to HTML', |
|
|
|
@@ -209,8 +209,8 @@ export default { |
|
|
|
languagePlaceholder: 'Please input your language!', |
|
|
|
permissions: 'Permissions', |
|
|
|
embeddingModel: 'Embedding model', |
|
|
|
chunkTokenNumber: 'Chunk token number', |
|
|
|
chunkTokenNumberMessage: 'Chunk token number is required', |
|
|
|
chunkTokenNumber: 'Chunk token number for text', |
|
|
|
chunkTokenNumberMessage: 'Chunk token number for text is required', |
|
|
|
embeddingModelTip: |
|
|
|
'The model that converts chunks into embeddings. It cannot be changed once the knowledge base has chunks. To switch to a different embedding model, you must delete all existing chunks in the knowledge base.', |
|
|
|
permissionsTip: |
|
|
|
@@ -250,7 +250,7 @@ export default { |
|
|
|
<p>This method chunks files using a 'naive' method: </p> |
|
|
|
<p> |
|
|
|
<li>Use vision detection model to split the texts into smaller segments.</li> |
|
|
|
<li>Then, combine adjacent segments until the token count exceeds the threshold specified by 'Chunk token number', at which point a chunk is created.</li></p>`, |
|
|
|
<li>Then, combine adjacent segments until the token count exceeds the threshold specified by 'Chunk token number for text', at which point a chunk is created.</li></p>`, |
|
|
|
paper: `<p>Only <b>PDF</b> file is supported.</p><p> |
|
|
|
Papers will be split by section, such as <i>abstract, 1.1, 1.2</i>. </p><p> |
|
|
|
This approach enables the LLM to summarize the paper more effectively and to provide more comprehensive, understandable responses. |
|
|
|
@@ -312,7 +312,7 @@ export default { |
|
|
|
</p>`, |
|
|
|
knowledgeGraph: `<p>Supported file formats are <b>DOCX, EXCEL, PPT, IMAGE, PDF, TXT, MD, JSON, EML</b> |
|
|
|
|
|
|
|
<p>This approach chunks files using the 'naive'/'General' method. It splits a document into segments and then combines adjacent segments until the token count exceeds the threshold specified by 'Chunk token number', at which point a chunk is created.</p> |
|
|
|
<p>This approach chunks files using the 'naive'/'General' method. It splits a document into segments and then combines adjacent segments until the token count exceeds the threshold specified by 'Chunk token number for text', at which point a chunk is created.</p> |
|
|
|
<p>The chunks are then fed to the LLM to extract entities and relationships for a knowledge graph and a mind map.</p> |
|
|
|
<p>Ensure that you set the <b>Entity types</b>.</p>`, |
|
|
|
tag: `<p>Knowledge base using 'Tag' as a chunking method is supposed to be used by other knowledge bases to add tags to their chunks, queries to which will also be with tags too.</p> |