index.tsx 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172
  1. 'use client'
  2. import React, { useCallback, useEffect, useState } from 'react'
  3. import { useTranslation } from 'react-i18next'
  4. import AppUnavailable from '../../base/app-unavailable'
  5. import { ModelTypeEnum } from '../../header/account-setting/model-provider-page/declarations'
  6. import StepsNavBar from './steps-nav-bar'
  7. import StepOne from './step-one'
  8. import StepTwo from './step-two'
  9. import StepThree from './step-three'
  10. import { DataSourceType } from '@/models/datasets'
  11. import type { CrawlOptions, CrawlResultItem, DataSet, FileItem, createDocumentResponse } from '@/models/datasets'
  12. import { fetchDataSource } from '@/service/common'
  13. import { fetchDatasetDetail } from '@/service/datasets'
  14. import type { NotionPage } from '@/models/common'
  15. import { useModalContext } from '@/context/modal-context'
  16. import { useDefaultModel } from '@/app/components/header/account-setting/model-provider-page/hooks'
  17. type DatasetUpdateFormProps = {
  18. datasetId?: string
  19. }
  20. const DEFAULT_CRAWL_OPTIONS: CrawlOptions = {
  21. crawl_sub_pages: true,
  22. only_main_content: true,
  23. includes: '',
  24. excludes: '',
  25. limit: 10,
  26. max_depth: '',
  27. }
  28. const DatasetUpdateForm = ({ datasetId }: DatasetUpdateFormProps) => {
  29. const { t } = useTranslation()
  30. const { setShowAccountSettingModal } = useModalContext()
  31. const [hasConnection, setHasConnection] = useState(true)
  32. const [dataSourceType, setDataSourceType] = useState<DataSourceType>(DataSourceType.FILE)
  33. const [step, setStep] = useState(1)
  34. const [indexingTypeCache, setIndexTypeCache] = useState('')
  35. const [fileList, setFiles] = useState<FileItem[]>([])
  36. const [result, setResult] = useState<createDocumentResponse | undefined>()
  37. const [hasError, setHasError] = useState(false)
  38. const { data: embeddingsDefaultModel } = useDefaultModel(ModelTypeEnum.textEmbedding)
  39. const [notionPages, setNotionPages] = useState<NotionPage[]>([])
  40. const updateNotionPages = (value: NotionPage[]) => {
  41. setNotionPages(value)
  42. }
  43. const [websitePages, setWebsitePages] = useState<CrawlResultItem[]>([])
  44. const [crawlOptions, setCrawlOptions] = useState<CrawlOptions>(DEFAULT_CRAWL_OPTIONS)
  45. const updateFileList = (preparedFiles: FileItem[]) => {
  46. setFiles(preparedFiles)
  47. }
  48. const [fireCrawlJobId, setFireCrawlJobId] = useState('')
  49. const updateFile = (fileItem: FileItem, progress: number, list: FileItem[]) => {
  50. const targetIndex = list.findIndex(file => file.fileID === fileItem.fileID)
  51. list[targetIndex] = {
  52. ...list[targetIndex],
  53. progress,
  54. }
  55. setFiles([...list])
  56. // use follow code would cause dirty list update problem
  57. // const newList = list.map((file) => {
  58. // if (file.fileID === fileItem.fileID) {
  59. // return {
  60. // ...fileItem,
  61. // progress,
  62. // }
  63. // }
  64. // return file
  65. // })
  66. // setFiles(newList)
  67. }
  68. const updateIndexingTypeCache = (type: string) => {
  69. setIndexTypeCache(type)
  70. }
  71. const updateResultCache = (res?: createDocumentResponse) => {
  72. setResult(res)
  73. }
  74. const nextStep = useCallback(() => {
  75. setStep(step + 1)
  76. }, [step, setStep])
  77. const changeStep = useCallback((delta: number) => {
  78. setStep(step + delta)
  79. }, [step, setStep])
  80. const checkNotionConnection = async () => {
  81. const { data } = await fetchDataSource({ url: '/data-source/integrates' })
  82. const hasConnection = data.filter(item => item.provider === 'notion') || []
  83. setHasConnection(hasConnection.length > 0)
  84. }
  85. useEffect(() => {
  86. checkNotionConnection()
  87. }, [])
  88. const [detail, setDetail] = useState<DataSet | null>(null)
  89. useEffect(() => {
  90. (async () => {
  91. if (datasetId) {
  92. try {
  93. const detail = await fetchDatasetDetail(datasetId)
  94. setDetail(detail)
  95. }
  96. catch (e) {
  97. setHasError(true)
  98. }
  99. }
  100. })()
  101. }, [datasetId])
  102. if (hasError)
  103. return <AppUnavailable code={500} unknownReason={t('datasetCreation.error.unavailable') as string} />
  104. return (
  105. <div className='flex' style={{ height: 'calc(100vh - 56px)' }}>
  106. <div className="flex flex-col w-11 sm:w-56 overflow-y-auto bg-white border-r border-gray-200 shrink-0">
  107. <StepsNavBar step={step} datasetId={datasetId} />
  108. </div>
  109. <div className="grow bg-white">
  110. <div className={step === 1 ? 'block h-full' : 'hidden'}>
  111. <StepOne
  112. hasConnection={hasConnection}
  113. onSetting={() => setShowAccountSettingModal({ payload: 'data-source' })}
  114. datasetId={datasetId}
  115. dataSourceType={dataSourceType}
  116. dataSourceTypeDisable={!!detail?.data_source_type}
  117. changeType={setDataSourceType}
  118. files={fileList}
  119. updateFile={updateFile}
  120. updateFileList={updateFileList}
  121. notionPages={notionPages}
  122. updateNotionPages={updateNotionPages}
  123. onStepChange={nextStep}
  124. websitePages={websitePages}
  125. updateWebsitePages={setWebsitePages}
  126. onFireCrawlJobIdChange={setFireCrawlJobId}
  127. crawlOptions={crawlOptions}
  128. onCrawlOptionsChange={setCrawlOptions}
  129. />
  130. </div>
  131. {(step === 2 && (!datasetId || (datasetId && !!detail))) && <StepTwo
  132. isAPIKeySet={!!embeddingsDefaultModel}
  133. onSetting={() => setShowAccountSettingModal({ payload: 'provider' })}
  134. indexingType={detail?.indexing_technique}
  135. datasetId={datasetId}
  136. dataSourceType={dataSourceType}
  137. files={fileList.map(file => file.file)}
  138. notionPages={notionPages}
  139. websitePages={websitePages}
  140. fireCrawlJobId={fireCrawlJobId}
  141. onStepChange={changeStep}
  142. updateIndexingTypeCache={updateIndexingTypeCache}
  143. updateResultCache={updateResultCache}
  144. crawlOptions={crawlOptions}
  145. />}
  146. {step === 3 && <StepThree
  147. datasetId={datasetId}
  148. datasetName={detail?.name}
  149. indexingType={detail?.indexing_technique || indexingTypeCache}
  150. creationCache={result}
  151. />}
  152. </div>
  153. </div>
  154. )
  155. }
  156. export default DatasetUpdateForm