You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251
  1. import React, { useEffect, useMemo, useState } from 'react'
  2. import { useRouter } from 'next/navigation'
  3. import { useTranslation } from 'react-i18next'
  4. import {
  5. RiAedFill,
  6. RiArrowRightLine,
  7. RiCheckboxCircleFill,
  8. RiErrorWarningFill,
  9. RiLoader2Fill,
  10. RiTerminalBoxLine,
  11. } from '@remixicon/react'
  12. import cn from '@/utils/classnames'
  13. import Button from '@/app/components/base/button'
  14. import type { IndexingStatusResponse } from '@/models/datasets'
  15. import NotionIcon from '@/app/components/base/notion-icon'
  16. import PriorityLabel from '@/app/components/billing/priority-label'
  17. import { Plan } from '@/app/components/billing/type'
  18. import UpgradeBtn from '@/app/components/billing/upgrade-btn'
  19. import { useProviderContext } from '@/context/provider-context'
  20. import Tooltip from '@/app/components/base/tooltip'
  21. import { useInvalidDocumentList } from '@/service/knowledge/use-document'
  22. import DocumentFileIcon from '@/app/components/datasets/common/document-file-icon'
  23. import RuleDetail from './rule-detail'
  24. import type { IndexingType } from '@/app/components/datasets/create/step-two'
  25. import type { RETRIEVE_METHOD } from '@/types/app'
  26. import { DatasourceType, type InitialDocumentDetail } from '@/models/pipeline'
  27. import { useIndexingStatusBatch, useProcessRule } from '@/service/knowledge/use-dataset'
  28. import Divider from '@/app/components/base/divider'
  29. import { useDatasetApiAccessUrl } from '@/hooks/use-api-access-url'
  30. import Link from 'next/link'
  /** Props accepted by the EmbeddingProcess component. */
  type EmbeddingProcessProps = {
    /** Dataset id; used for the indexing-status request and the documents page URL. */
    datasetId: string
    /** Batch id passed to the indexing-status request. */
    batchId: string
    /** Documents of the batch; looked up by id for display name, source type and icon. */
    documents?: InitialDocumentDetail[]
    /** Forwarded unchanged to RuleDetail. */
    indexingType?: IndexingType
    /** Forwarded unchanged to RuleDetail. */
    retrievalMethod?: RETRIEVE_METHOD
  }
  /** Statuses treated as finished: once every document reports one of these, polling stops. */
  const EMBEDDING_FINISHED_STATUSES = ['completed', 'error', 'paused']
  /** Statuses that mean a document is actively being processed. */
  const EMBEDDING_ACTIVE_STATUSES = ['indexing', 'splitting', 'parsing', 'cleaning']
  /** Delay between two consecutive indexing-status requests. */
  const EMBEDDING_POLL_INTERVAL_MS = 2500

  /**
   * Shows the embedding progress of a batch of documents.
   *
   * The component polls the batch indexing status every 2.5 seconds until every
   * document reports `completed`, `error` or `paused`, renders one progress row
   * per document, shows the processing rule of the first document, and offers
   * links to the API reference and to the dataset's document list.
   *
   * @param datasetId - Dataset id used for the status request and navigation.
   * @param batchId - Batch id used for the status request.
   * @param documents - Documents of the batch; defaults to an empty list.
   * @param indexingType - Forwarded to RuleDetail.
   * @param retrievalMethod - Forwarded to RuleDetail.
   */
  const EmbeddingProcess = ({
    datasetId,
    batchId,
    documents = [],
    indexingType,
    retrievalMethod,
  }: EmbeddingProcessProps) => {
    const { t } = useTranslation()
    const router = useRouter()
    const { enableBilling, plan } = useProviderContext()
    const [indexingStatusBatchDetail, setIndexingStatusDetail] = useState<IndexingStatusResponse[]>([])
    const [shouldPoll, setShouldPoll] = useState(true)
    const { mutateAsync: fetchIndexingStatus } = useIndexingStatusBatch({ datasetId, batchId })

    useEffect(() => {
      let timeoutId: ReturnType<typeof setTimeout> | undefined
      // Set by the cleanup so an in-flight request neither updates state nor re-arms the timer.
      let cancelled = false

      const fetchData = async () => {
        // Decided from the fresh response rather than from the `shouldPoll` value
        // captured by this closure, which would be stale right after completion.
        let finished = false
        try {
          const res = await fetchIndexingStatus(undefined)
          if (cancelled)
            return
          const indexingStatusDetailList = res.data
          setIndexingStatusDetail(indexingStatusDetailList)
          finished = indexingStatusDetailList.every(detail => EMBEDDING_FINISHED_STATUSES.includes(detail.indexing_status))
          if (finished)
            setShouldPoll(false)
        }
        catch {
          // A failed request must not reject this fire-and-forget call; the next
          // poll below simply retries.
        }
        if (!cancelled && !finished)
          timeoutId = setTimeout(fetchData, EMBEDDING_POLL_INTERVAL_MS)
      }

      // Once polling has been switched off, do not issue another request.
      if (shouldPoll)
        fetchData()

      return () => {
        cancelled = true
        clearTimeout(timeoutId)
      }
    }, [shouldPoll])

    // get rule
    // `documents` may be empty (it defaults to []), so the first entry can be missing.
    // NOTE(review): confirm useProcessRule skips its request when the id is undefined.
    const firstDocument = documents[0]
    const { data: ruleDetail } = useProcessRule(firstDocument?.id)

    const invalidDocumentList = useInvalidDocumentList()
    const navToDocumentList = () => {
      invalidDocumentList()
      router.push(`/datasets/${datasetId}/documents`)
    }
    const apiReferenceUrl = useDatasetApiAccessUrl()

    // Batch-level flags; all of them are false until the first status response arrives.
    const isEmbeddingWaiting = useMemo(() => {
      if (!indexingStatusBatchDetail.length) return false
      return indexingStatusBatchDetail.every(detail => (detail?.indexing_status || '') === 'waiting')
    }, [indexingStatusBatchDetail])
    const isEmbedding = useMemo(() => {
      if (!indexingStatusBatchDetail.length) return false
      return indexingStatusBatchDetail.some(detail => EMBEDDING_ACTIVE_STATUSES.includes(detail?.indexing_status || ''))
    }, [indexingStatusBatchDetail])
    const isEmbeddingCompleted = useMemo(() => {
      if (!indexingStatusBatchDetail.length) return false
      return indexingStatusBatchDetail.every(detail => EMBEDDING_FINISHED_STATUSES.includes(detail?.indexing_status || ''))
    }, [indexingStatusBatchDetail])

    // Shared lookup for the per-document getters below.
    const findDocument = (id: string) => documents.find(document => document.id === id)
    const getSourceName = (id: string) => findDocument(id)?.name
    const getSourceType = (id: string) => findDocument(id)?.data_source_type
    const getIcon = (id: string) => findDocument(id)?.data_source_info.notion_page_icon
    // Falls back to 'txt' when there is no name or the last dot-separated part is empty.
    const getFileType = (name?: string) => name?.split('.').pop() || 'txt'

    // Completed share of segments as a whole number, capped at 100; 0 when the total is unknown.
    const getSourcePercent = (detail: IndexingStatusResponse) => {
      const completedCount = detail.completed_segments || 0
      const totalCount = detail.total_segments || 0
      if (totalCount === 0)
        return 0
      return Math.min(Math.round(completedCount * 100 / totalCount), 100)
    }

    // A row shows its progress bar while the document is waiting or actively processed.
    const isSourceEmbedding = (detail: IndexingStatusResponse) => {
      const status = detail.indexing_status || ''
      return status === 'waiting' || EMBEDDING_ACTIVE_STATUSES.includes(status)
    }

    return (
      <>
        <div className='flex flex-col gap-y-3'>
          <div className='system-md-semibold-uppercase flex items-center gap-x-1 text-text-secondary'>
            {(isEmbeddingWaiting || isEmbedding) && (
              <>
                <RiLoader2Fill className='size-4 animate-spin' />
                <span>
                  {isEmbeddingWaiting ? t('datasetDocuments.embedding.waiting') : t('datasetDocuments.embedding.processing')}
                </span>
              </>
            )}
            {isEmbeddingCompleted && t('datasetDocuments.embedding.completed')}
          </div>
          {
            enableBilling && plan.type !== Plan.team && (
              <div className='flex h-[52px] items-center gap-x-2 rounded-xl border-[0.5px] border-components-panel-border-subtle bg-components-panel-on-panel-item-bg p-2.5 pl-3 shadow-xs shadow-shadow-shadow-3'>
                <div className='flex shrink-0 items-center justify-center rounded-lg border-[0.5px] border-divider-subtle bg-util-colors-blue-brand-blue-brand-500 shadow-md shadow-shadow-shadow-5'>
                  <RiAedFill className='size-4 text-text-primary-on-surface' />
                </div>
                <div className='system-md-medium grow text-text-primary'>
                  {t('billing.plansCommon.documentProcessingPriorityUpgrade')}
                </div>
                <UpgradeBtn loc='knowledge-speed-up' />
              </div>
            )
          }
          <div className='flex flex-col gap-0.5 pb-2'>
            {indexingStatusBatchDetail.map((detail) => {
              const sourceName = getSourceName(detail.id)
              const sourceType = getSourceType(detail.id)
              const embedding = isSourceEmbedding(detail)
              const percent = getSourcePercent(detail)
              return (
                <div
                  key={detail.id}
                  className={cn(
                    'relative h-[26px] overflow-hidden rounded-md bg-components-progress-bar-bg',
                    detail.indexing_status === 'error' && 'bg-state-destructive-hover-alt',
                  )}
                >
                  {embedding && (
                    <div
                      className='absolute left-0 top-0 h-full min-w-0.5 border-r-[2px] border-r-components-progress-bar-progress-highlight bg-components-progress-bar-progress'
                      style={{ width: `${percent}%` }}
                    />
                  )}
                  <div className='z-[1] flex h-full items-center gap-1 pl-[6px] pr-2'>
                    {sourceType === DatasourceType.localFile && (
                      <DocumentFileIcon
                        size='sm'
                        className='shrink-0'
                        name={sourceName}
                        extension={getFileType(sourceName)}
                      />
                    )}
                    {sourceType === DatasourceType.onlineDocument && (
                      <NotionIcon
                        className='shrink-0'
                        type='page'
                        src={getIcon(detail.id)}
                      />
                    )}
                    <div className='flex w-0 grow items-center gap-1' title={sourceName}>
                      <div className='system-xs-medium truncate text-text-secondary'>
                        {sourceName}
                      </div>
                      {
                        enableBilling && (
                          <PriorityLabel className='ml-0' />
                        )
                      }
                    </div>
                    {embedding && (
                      <div className='shrink-0 text-xs text-text-secondary'>{`${percent}%`}</div>
                    )}
                    {detail.indexing_status === 'error' && (
                      <Tooltip
                        popupClassName='px-4 py-[14px] max-w-60 body-xs-regular text-text-secondary border-[0.5px] border-components-panel-border rounded-xl'
                        offset={4}
                        popupContent={detail.error}
                      >
                        <span>
                          <RiErrorWarningFill className='size-4 shrink-0 text-text-destructive' />
                        </span>
                      </Tooltip>
                    )}
                    {detail.indexing_status === 'completed' && (
                      <RiCheckboxCircleFill className='size-4 shrink-0 text-text-success' />
                    )}
                  </div>
                </div>
              )
            })}
          </div>
          <Divider type='horizontal' className='my-0 bg-divider-subtle' />
          <RuleDetail
            sourceData={ruleDetail}
            indexingType={indexingType}
            retrievalMethod={retrievalMethod}
          />
        </div>
        <div className='mt-6 flex items-center gap-x-2 py-2'>
          <Link
            href={apiReferenceUrl}
            target='_blank'
            rel='noopener noreferrer'
          >
            <Button
              className='w-fit gap-x-0.5 px-3'
            >
              <RiTerminalBoxLine className='size-4' />
              <span className='px-0.5'>Access the API</span>
            </Button>
          </Link>
          <Button
            className='w-fit gap-x-0.5 px-3'
            variant='primary'
            onClick={navToDocumentList}
          >
            <span className='px-0.5'>{t('datasetCreation.stepThree.navTo')}</span>
            <RiArrowRightLine className='size-4 stroke-current stroke-1' />
          </Button>
        </div>
      </>
    )
  }
  export default EmbeddingProcess