Nevar pievienot vairāk kā 25 tēmas. Tēmai ir jāsākas ar burtu vai ciparu, tā var saturēt domu zīmes ('-') un var būt līdz 35 simboliem gara.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225
  1. import React, { useEffect, useMemo, useState } from 'react'
  2. import { useRouter } from 'next/navigation'
  3. import { useTranslation } from 'react-i18next'
  4. import { ArrowRightIcon } from '@heroicons/react/24/solid'
  5. import {
  6. RiCheckboxCircleFill,
  7. RiErrorWarningFill,
  8. RiLoader2Fill,
  9. RiTerminalBoxLine,
  10. } from '@remixicon/react'
  11. import cn from '@/utils/classnames'
  12. import Button from '@/app/components/base/button'
  13. import type { IndexingStatusResponse } from '@/models/datasets'
  14. import NotionIcon from '@/app/components/base/notion-icon'
  15. import PriorityLabel from '@/app/components/billing/priority-label'
  16. import { Plan } from '@/app/components/billing/type'
  17. import { ZapFast } from '@/app/components/base/icons/src/vender/solid/general'
  18. import UpgradeBtn from '@/app/components/billing/upgrade-btn'
  19. import { useProviderContext } from '@/context/provider-context'
  20. import Tooltip from '@/app/components/base/tooltip'
  21. import { useInvalidDocumentList } from '@/service/knowledge/use-document'
  22. import DocumentFileIcon from '@/app/components/datasets/common/document-file-icon'
  23. import RuleDetail from './rule-detail'
  24. import type { IndexingType } from '@/app/components/datasets/create/step-two'
  25. import type { RETRIEVE_METHOD } from '@/types/app'
  26. import { DatasourceType, type InitialDocumentDetail } from '@/models/pipeline'
  27. import { useIndexingStatusBatch, useProcessRule } from '@/service/knowledge/use-dataset'
  28. type EmbeddingProcessProps = {
  29. datasetId: string
  30. batchId: string
  31. documents?: InitialDocumentDetail[]
  32. indexingType?: IndexingType
  33. retrievalMethod?: RETRIEVE_METHOD
  34. }
  35. const EmbeddingProcess = ({
  36. datasetId,
  37. batchId,
  38. documents = [],
  39. indexingType,
  40. retrievalMethod,
  41. }: EmbeddingProcessProps) => {
  42. const { t } = useTranslation()
  43. const router = useRouter()
  44. const { enableBilling, plan } = useProviderContext()
  45. const [indexingStatusBatchDetail, setIndexingStatusDetail] = useState<IndexingStatusResponse[]>([])
  46. const [shouldPoll, setShouldPoll] = useState(true)
  47. const { mutateAsync: fetchIndexingStatus } = useIndexingStatusBatch({ datasetId, batchId })
  48. useEffect(() => {
  49. let timeoutId: ReturnType<typeof setTimeout>
  50. const fetchData = async () => {
  51. await fetchIndexingStatus(undefined, {
  52. onSuccess: (res) => {
  53. const indexingStatusDetailList = res.data
  54. setIndexingStatusDetail(indexingStatusDetailList)
  55. const isCompleted = indexingStatusDetailList.every(indexingStatusDetail => ['completed', 'error', 'paused'].includes(indexingStatusDetail.indexing_status))
  56. if (isCompleted)
  57. setShouldPoll(false)
  58. },
  59. onSettled: () => {
  60. if (shouldPoll)
  61. timeoutId = setTimeout(fetchData, 2500)
  62. },
  63. })
  64. }
  65. fetchData()
  66. return () => {
  67. clearTimeout(timeoutId)
  68. }
  69. // eslint-disable-next-line react-hooks/exhaustive-deps
  70. }, [shouldPoll])
  71. // get rule
  72. const firstDocument = documents[0]
  73. const { data: ruleDetail } = useProcessRule(firstDocument.id)
  74. const invalidDocumentList = useInvalidDocumentList()
  75. const navToDocumentList = () => {
  76. invalidDocumentList()
  77. router.push(`/datasets/${datasetId}/documents`)
  78. }
  79. const navToApiDocs = () => {
  80. router.push('/datasets?category=api')
  81. }
  82. const isEmbedding = useMemo(() => {
  83. return indexingStatusBatchDetail.some(indexingStatusDetail => ['indexing', 'splitting', 'parsing', 'cleaning'].includes(indexingStatusDetail?.indexing_status || ''))
  84. }, [indexingStatusBatchDetail])
  85. const isEmbeddingCompleted = useMemo(() => {
  86. return indexingStatusBatchDetail.every(indexingStatusDetail => ['completed', 'error', 'paused'].includes(indexingStatusDetail?.indexing_status || ''))
  87. }, [indexingStatusBatchDetail])
  88. const getSourceName = (id: string) => {
  89. const doc = documents.find(document => document.id === id)
  90. return doc?.name
  91. }
  92. const getFileType = (name?: string) => name?.split('.').pop() || 'txt'
  93. const getSourcePercent = (detail: IndexingStatusResponse) => {
  94. const completedCount = detail.completed_segments || 0
  95. const totalCount = detail.total_segments || 0
  96. if (totalCount === 0)
  97. return 0
  98. const percent = Math.round(completedCount * 100 / totalCount)
  99. return percent > 100 ? 100 : percent
  100. }
  101. const getSourceType = (id: string) => {
  102. const doc = documents.find(document => document.id === id)
  103. return doc?.data_source_type
  104. }
  105. const getIcon = (id: string) => {
  106. const doc = documents.find(document => document.id === id)
  107. return doc?.data_source_info.notion_page_icon
  108. }
  109. const isSourceEmbedding = (detail: IndexingStatusResponse) =>
  110. ['indexing', 'splitting', 'parsing', 'cleaning', 'waiting'].includes(detail.indexing_status || '')
  111. return (
  112. <>
  113. <div className='mb-3 flex h-5 items-center'>
  114. <div className='mr-2 flex items-center justify-between text-sm font-medium text-text-secondary'>
  115. {isEmbedding && <div className='flex items-center'>
  116. <RiLoader2Fill className='mr-1 size-4 animate-spin text-text-secondary' />
  117. {t('datasetDocuments.embedding.processing')}
  118. </div>}
  119. {isEmbeddingCompleted && t('datasetDocuments.embedding.completed')}
  120. </div>
  121. </div>
  122. {
  123. enableBilling && plan.type !== Plan.team && (
  124. <div className='mb-3 flex h-14 items-center rounded-xl border-[0.5px] border-black/5 bg-white p-3 shadow-md'>
  125. <div className='flex h-8 w-8 shrink-0 items-center justify-center rounded-lg bg-[#FFF6ED]'>
  126. <ZapFast className='h-4 w-4 text-[#FB6514]' />
  127. </div>
  128. <div className='mx-3 grow text-[13px] font-medium text-gray-700'>
  129. {t('billing.plansCommon.documentProcessingPriorityUpgrade')}
  130. </div>
  131. <UpgradeBtn loc='knowledge-speed-up' />
  132. </div>
  133. )
  134. }
  135. <div className='flex flex-col gap-0.5 pb-2'>
  136. {indexingStatusBatchDetail.map(indexingStatusDetail => (
  137. <div key={indexingStatusDetail.id} className={cn(
  138. 'relative h-[26px] overflow-hidden rounded-md bg-components-progress-bar-bg',
  139. indexingStatusDetail.indexing_status === 'error' && 'bg-state-destructive-hover-alt',
  140. )}>
  141. {isSourceEmbedding(indexingStatusDetail) && (
  142. <div
  143. className='absolute left-0 top-0 h-full min-w-0.5 border-r-[2px] border-r-components-progress-bar-progress-highlight bg-components-progress-bar-progress'
  144. style={{ width: `${getSourcePercent(indexingStatusDetail)}%` }}
  145. />
  146. )}
  147. <div className='z-[1] flex h-full items-center gap-1 pl-[6px] pr-2'>
  148. {getSourceType(indexingStatusDetail.id) === DatasourceType.localFile && (
  149. <DocumentFileIcon
  150. className='size-4 shrink-0'
  151. name={getSourceName(indexingStatusDetail.id)}
  152. extension={getFileType(getSourceName(indexingStatusDetail.id))}
  153. />
  154. )}
  155. {getSourceType(indexingStatusDetail.id) === DatasourceType.onlineDocument && (
  156. <NotionIcon
  157. className='shrink-0'
  158. type='page'
  159. src={getIcon(indexingStatusDetail.id)}
  160. />
  161. )}
  162. <div className='flex w-0 grow items-center gap-1' title={getSourceName(indexingStatusDetail.id)}>
  163. <div className='system-xs-medium truncate text-text-secondary'>
  164. {getSourceName(indexingStatusDetail.id)}
  165. </div>
  166. {
  167. enableBilling && (
  168. <PriorityLabel className='ml-0' />
  169. )
  170. }
  171. </div>
  172. {isSourceEmbedding(indexingStatusDetail) && (
  173. <div className='shrink-0 text-xs text-text-secondary'>{`${getSourcePercent(indexingStatusDetail)}%`}</div>
  174. )}
  175. {indexingStatusDetail.indexing_status === 'error' && (
  176. <Tooltip
  177. popupClassName='px-4 py-[14px] max-w-60 text-sm leading-4 text-text-secondary border-[0.5px] border-components-panel-border rounded-xl'
  178. offset={4}
  179. popupContent={indexingStatusDetail.error}
  180. >
  181. <span>
  182. <RiErrorWarningFill className='size-4 shrink-0 text-text-destructive' />
  183. </span>
  184. </Tooltip>
  185. )}
  186. {indexingStatusDetail.indexing_status === 'completed' && (
  187. <RiCheckboxCircleFill className='size-4 shrink-0 text-text-success' />
  188. )}
  189. </div>
  190. </div>
  191. ))}
  192. </div>
  193. <hr className='my-3 h-[1px] border-0 bg-divider-subtle' />
  194. <RuleDetail
  195. sourceData={ruleDetail}
  196. indexingType={indexingType}
  197. retrievalMethod={retrievalMethod}
  198. />
  199. <div className='my-10 flex items-center gap-2'>
  200. <Button className='w-fit' onClick={navToApiDocs}>
  201. <RiTerminalBoxLine className='mr-2 size-4' />
  202. <span>Access the API</span>
  203. </Button>
  204. <Button className='w-fit' variant='primary' onClick={navToDocumentList}>
  205. <span>{t('datasetCreation.stepThree.navTo')}</span>
  206. <ArrowRightIcon className='ml-2 size-4 stroke-current stroke-1' />
  207. </Button>
  208. </div>
  209. </>
  210. )
  211. }
  212. export default EmbeddingProcess