// datasets.ts — request helpers for datasets, documents, segments, hit testing and data sources
  import type { Fetcher } from 'swr'
  import qs from 'qs'
  import { del, get, patch, post, put } from './base'
  import type {
    CreateDocumentReq,
    DataSet,
    DataSetListResponse,
    DocumentDetailResponse,
    DocumentListResponse,
    ErrorDocsResponse,
    ExternalAPIDeleteResponse,
    ExternalAPIItem,
    ExternalAPIListResponse,
    ExternalAPIUsage,
    ExternalKnowledgeBaseHitTestingResponse,
    ExternalKnowledgeItem,
    FileIndexingEstimateResponse,
    HitTestingRecordsResponse,
    HitTestingResponse,
    IndexingEstimateParams,
    IndexingEstimateResponse,
    IndexingStatusBatchResponse,
    IndexingStatusResponse,
    ProcessRuleResponse,
    RelatedAppResponse,
    SegmentDetailModel,
    SegmentUpdater,
    SegmentsQuery,
    SegmentsResponse,
    createDocumentResponse,
  } from '@/models/datasets'
  import type { CreateKnowledgeBaseReq } from '@/app/components/datasets/external-knowledge-base/create/declarations'
  import type { CreateExternalAPIReq } from '@/app/components/datasets/external-api/declarations.ts'
  import type { CommonResponse, DataSourceNotionWorkspace } from '@/models/common'
  // Value import (not `import type`): the crawl helpers read enum members at runtime.
  import { DataSourceProvider } from '@/models/common'
  import type {
    ApiKeysListResponse,
    CreateApiKeyResponse,
  } from '@/models/app'
  import type { RetrievalConfig } from '@/types/app'
  // APIs for documents in a dataset
  /** Request fields shared by per-document endpoints: the owning dataset id and the document id. */
  type CommonDocReq = Record<'datasetId' | 'documentId', string>
  /** Request fields shared by per-batch endpoints: the owning dataset id and the batch id. */
  type BatchReq = Record<'datasetId' | 'batchId', string>
  /** Base fields a document list can be sorted by. */
  type SortField = 'created_at' | 'hit_count'
  /**
   * Sort keys accepted by `fetchDocuments`: each field, plain or prefixed with `-`.
   * NOTE(review): the `-` prefix presumably means descending order — confirm against the API.
   */
  export type SortType = SortField | `-${SortField}`
  /** Allowed values of the optional `metadata` query parameter of `fetchDocumentDetail`. */
  export type MetadataType =
    | 'all'
    | 'only'
    | 'without'
  /**
   * Loads a single dataset through the `get` helper.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}`.
   * @returns The result of `get<DataSet>`.
   */
  export const fetchDatasetDetail: Fetcher<DataSet, string> = (datasetId: string) =>
    get<DataSet>(`/datasets/${datasetId}`)
  /**
   * Patches a dataset's settings through the `patch` helper.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}`.
   * @param body - Any subset of the `DataSet` fields listed in the type; forwarded as the request body.
   * @returns The result of `patch<DataSet>`.
   */
  export const updateDatasetSetting: Fetcher<DataSet, {
    datasetId: string
    body: Partial<Pick<DataSet,
      | 'name'
      | 'description'
      | 'permission'
      | 'partial_member_list'
      | 'indexing_technique'
      | 'retrieval_model'
      | 'embedding_model'
      | 'embedding_model_provider'
    >>
  }> = ({ datasetId, body }) => patch<DataSet>(`/datasets/${datasetId}`, { body })
  /**
   * Loads the apps related to a dataset through the `get` helper.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/related-apps`.
   * @returns The result of `get<RelatedAppResponse>`.
   */
  export const fetchDatasetRelatedApps: Fetcher<RelatedAppResponse, string> = (datasetId: string) =>
    get<RelatedAppResponse>(`/datasets/${datasetId}/related-apps`)
  /**
   * Loads a page of datasets from a caller-supplied URL.
   *
   * The query string is built with `qs.stringify` using `indices: false`, so an
   * `ids` array is serialized as repeated `ids=` keys rather than `ids[0]=…`.
   *
   * @param url - Endpoint to call; the serialized `params` are appended after `?`.
   * @param params - `page`, plus optional `ids` and `limit`.
   * @returns The result of `get<DataSetListResponse>`.
   */
  export const fetchDatasets: Fetcher<DataSetListResponse, { url: string; params: { page: number; ids?: string[]; limit?: number } }> = ({ url, params }) =>
    get<DataSetListResponse>(`${url}?${qs.stringify(params, { indices: false })}`)
  /**
   * Creates a dataset by posting `{ name }` to `/datasets`.
   *
   * @param name - Name placed in the request body.
   * @returns The result of `post<DataSet>`.
   */
  export const createEmptyDataset: Fetcher<DataSet, { name: string }> = ({ name }) => {
    const payload = { name }
    return post<DataSet>('/datasets', { body: payload })
  }
  /**
   * Queries `/datasets/{id}/use-check` for whether the dataset is in use.
   *
   * The request is sent with `silent: true` as the third argument to `get`.
   * NOTE(review): presumably this suppresses the helper's error notification — confirm in `./base`.
   *
   * @param id - Dataset id interpolated into the path.
   * @returns The result of `get`, typed as `{ is_using: boolean }`.
   */
  export const checkIsUsedInApp: Fetcher<{ is_using: boolean }, string> = id =>
    get<{ is_using: boolean }>(`/datasets/${id}/use-check`, {}, { silent: true })
  /**
   * Deletes a dataset through the `del` helper.
   *
   * @param datasetID - Id interpolated into `/datasets/{datasetID}`.
   * @returns The result of `del<DataSet>`.
   */
  export const deleteDataset: Fetcher<DataSet, string> = datasetID =>
    del<DataSet>(`/datasets/${datasetID}`)
  /**
   * Loads the external API list from a caller-supplied URL.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @returns The result of `get<ExternalAPIListResponse>`.
   */
  export const fetchExternalAPIList: Fetcher<ExternalAPIListResponse, { url: string }> = ({ url }) =>
    get<ExternalAPIListResponse>(url)
  /**
   * Loads one external knowledge API entry.
   *
   * @param apiTemplateId - Id interpolated into `/datasets/external-knowledge-api/{apiTemplateId}`.
   * @returns The result of `get<ExternalAPIItem>`.
   */
  export const fetchExternalAPI: Fetcher<ExternalAPIItem, { apiTemplateId: string }> = ({ apiTemplateId }) =>
    get<ExternalAPIItem>(`/datasets/external-knowledge-api/${apiTemplateId}`)
  /**
   * Patches an external knowledge API entry.
   *
   * @param apiTemplateId - Id interpolated into `/datasets/external-knowledge-api/{apiTemplateId}`.
   * @param body - Full `ExternalAPIItem` forwarded as the request body.
   * @returns The result of `patch<ExternalAPIItem>`.
   */
  export const updateExternalAPI: Fetcher<ExternalAPIItem, { apiTemplateId: string; body: ExternalAPIItem }> = ({ apiTemplateId, body }) => {
    const endpoint = `/datasets/external-knowledge-api/${apiTemplateId}`
    return patch<ExternalAPIItem>(endpoint, { body })
  }
  /**
   * Deletes an external knowledge API entry.
   *
   * @param apiTemplateId - Id interpolated into `/datasets/external-knowledge-api/{apiTemplateId}`.
   * @returns The result of `del<ExternalAPIDeleteResponse>`.
   */
  export const deleteExternalAPI: Fetcher<ExternalAPIDeleteResponse, { apiTemplateId: string }> = ({ apiTemplateId }) =>
    del<ExternalAPIDeleteResponse>(`/datasets/external-knowledge-api/${apiTemplateId}`)
  /**
   * Queries the use-check endpoint of an external knowledge API entry.
   *
   * @param apiTemplateId - Id interpolated into `/datasets/external-knowledge-api/{apiTemplateId}/use-check`.
   * @returns The result of `get<ExternalAPIUsage>`.
   */
  export const checkUsageExternalAPI: Fetcher<ExternalAPIUsage, { apiTemplateId: string }> = ({ apiTemplateId }) =>
    get<ExternalAPIUsage>(`/datasets/external-knowledge-api/${apiTemplateId}/use-check`)
  /**
   * Creates an external knowledge API entry by posting to `/datasets/external-knowledge-api`.
   *
   * @param body - `CreateExternalAPIReq` forwarded as the request body.
   * @returns The result of `post<ExternalAPIItem>`.
   */
  export const createExternalAPI: Fetcher<ExternalAPIItem, { body: CreateExternalAPIReq }> = ({ body }) =>
    post<ExternalAPIItem>('/datasets/external-knowledge-api', { body })
  /**
   * Creates an external knowledge base by posting to `/datasets/external`.
   *
   * @param body - `CreateKnowledgeBaseReq` forwarded as the request body.
   * @returns The result of `post<ExternalKnowledgeItem>`.
   */
  export const createExternalKnowledgeBase: Fetcher<ExternalKnowledgeItem, { body: CreateKnowledgeBaseReq }> = ({ body }) =>
    post<ExternalKnowledgeItem>('/datasets/external', { body })
  /**
   * Loads the default process rule from a caller-supplied URL.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @returns The result of `get<ProcessRuleResponse>`.
   */
  export const fetchDefaultProcessRule: Fetcher<ProcessRuleResponse, { url: string }> = ({ url }) =>
    get<ProcessRuleResponse>(url)
  /**
   * Loads the process rule of a document from `/datasets/process-rule`.
   *
   * @param params - Wrapper whose `documentId` is sent as the `document_id` query parameter.
   * @returns The result of `get<ProcessRuleResponse>`.
   */
  export const fetchProcessRule: Fetcher<ProcessRuleResponse, { params: { documentId: string } }> = ({ params: { documentId } }) => {
    // The backend parameter is snake_case, so the key is renamed here.
    const query = { document_id: documentId }
    return get<ProcessRuleResponse>('/datasets/process-rule', { params: query })
  }
  /**
   * Loads a page of documents in a dataset.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/documents`.
   * @param params - `keyword`, `page`, `limit` and optional `sort`, forwarded as query parameters.
   * @returns The result of `get<DocumentListResponse>`.
   */
  export const fetchDocuments: Fetcher<DocumentListResponse, { datasetId: string; params: { keyword: string; page: number; limit: number; sort?: SortType } }> = ({ datasetId, params }) =>
    get<DocumentListResponse>(`/datasets/${datasetId}/documents`, { params })
  /**
   * Posts a document-creation request to `/datasets/init` (no dataset id in the path).
   *
   * @param body - `CreateDocumentReq` forwarded as the request body.
   * @returns The result of `post<createDocumentResponse>`.
   */
  export const createFirstDocument: Fetcher<createDocumentResponse, { body: CreateDocumentReq }> = ({ body }) =>
    post<createDocumentResponse>('/datasets/init', { body })
  /**
   * Posts a document-creation request for an existing dataset.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/documents`.
   * @param body - `CreateDocumentReq` forwarded as the request body.
   * @returns The result of `post<createDocumentResponse>`.
   */
  export const createDocument: Fetcher<createDocumentResponse, { datasetId: string; body: CreateDocumentReq }> = ({ datasetId, body }) =>
    post<createDocumentResponse>(`/datasets/${datasetId}/documents`, { body })
  /**
   * Loads the indexing estimate of one document.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `get<IndexingEstimateResponse>`, called with an empty options object.
   */
  export const fetchIndexingEstimate: Fetcher<IndexingEstimateResponse, CommonDocReq> = ({ datasetId, documentId }) => {
    const endpoint = `/datasets/${datasetId}/documents/${documentId}/indexing-estimate`
    return get<IndexingEstimateResponse>(endpoint, {})
  }
  /**
   * Loads the indexing estimate of a batch.
   *
   * @param datasetId - Dataset id used in the path.
   * @param batchId - Batch id used in the path.
   * @returns The result of `get<IndexingEstimateResponse>`, called with an empty options object.
   */
  export const fetchIndexingEstimateBatch: Fetcher<IndexingEstimateResponse, BatchReq> = ({ datasetId, batchId }) => {
    const endpoint = `/datasets/${datasetId}/batch/${batchId}/indexing-estimate`
    return get<IndexingEstimateResponse>(endpoint, {})
  }
  /**
   * Loads the indexing status of one document.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `get<IndexingStatusResponse>`, called with an empty options object.
   */
  export const fetchIndexingStatus: Fetcher<IndexingStatusResponse, CommonDocReq> = ({ datasetId, documentId }) => {
    const endpoint = `/datasets/${datasetId}/documents/${documentId}/indexing-status`
    return get<IndexingStatusResponse>(endpoint, {})
  }
  /**
   * Loads the indexing status of a batch.
   *
   * @param datasetId - Dataset id used in the path.
   * @param batchId - Batch id used in the path.
   * @returns The result of `get<IndexingStatusBatchResponse>`, called with an empty options object.
   */
  export const fetchIndexingStatusBatch: Fetcher<IndexingStatusBatchResponse, BatchReq> = ({ datasetId, batchId }) => {
    const endpoint = `/datasets/${datasetId}/batch/${batchId}/indexing-status`
    return get<IndexingStatusBatchResponse>(endpoint, {})
  }
  /**
   * Loads the detail of one document.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param params - Query parameters; may carry an optional `metadata` selector.
   * @returns The result of `get<DocumentDetailResponse>`.
   */
  export const fetchDocumentDetail: Fetcher<DocumentDetailResponse, CommonDocReq & { params: { metadata?: MetadataType } }> = ({ datasetId, documentId, params }) =>
    get<DocumentDetailResponse>(`/datasets/${datasetId}/documents/${documentId}`, { params })
  /**
   * Renames a document by posting `{ name }` to its `rename` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param name - New name placed in the request body.
   * @returns The result of `post<CommonResponse>`.
   */
  export const renameDocumentName: Fetcher<CommonResponse, CommonDocReq & { name: string }> = ({ datasetId, documentId, name }) =>
    post<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/rename`, { body: { name } })
  /**
   * Calls `patch` on the document's `processing/pause` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const pauseDocIndexing: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/processing/pause`)
  /**
   * Calls `patch` on the document's `processing/resume` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const resumeDocIndexing: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/processing/resume`)
  /**
   * Deletes a document through the `del` helper.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `del<CommonResponse>`.
   */
  export const deleteDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    del<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}`)
  /**
   * Calls `patch` on the document's `status/archive` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const archiveDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/status/archive`)
  /**
   * Calls `patch` on the document's `status/un_archive` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const unArchiveDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/status/un_archive`)
  /**
   * Calls `patch` on the document's `status/enable` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const enableDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/status/enable`)
  /**
   * Calls `patch` on the document's `status/disable` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const disableDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/status/disable`)
  /**
   * Calls `get` on the document's `notion/sync` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `get<CommonResponse>`.
   */
  export const syncDocument: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    get<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/notion/sync`)
  /**
   * Calls `get` on the document's `website-sync` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @returns The result of `get<CommonResponse>`.
   */
  export const syncWebsite: Fetcher<CommonResponse, CommonDocReq> = ({ datasetId, documentId }) =>
    get<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/website-sync`)
  /**
   * Loads Notion workspace info from a caller-supplied URL.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @param datasetId - Optional id sent as the `dataset_id` query parameter (passed as `undefined` when omitted).
   * @returns The result of `get`, typed as `{ notion_info: DataSourceNotionWorkspace[] }`.
   */
  export const preImportNotionPages: Fetcher<{ notion_info: DataSourceNotionWorkspace[] }, { url: string; datasetId?: string }> = ({ url, datasetId }) => {
    const query = { dataset_id: datasetId }
    return get<{ notion_info: DataSourceNotionWorkspace[] }>(url, { params: query })
  }
  /**
   * Replaces a document's metadata through the `put` helper.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param body - `doc_type` and `doc_metadata`, forwarded as the request body.
   * @returns The result of `put<CommonResponse>`.
   */
  export const modifyDocMetadata: Fetcher<CommonResponse, CommonDocReq & { body: { doc_type: string; doc_metadata: Record<string, any> } }> = ({ datasetId, documentId, body }) =>
    put<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/metadata`, { body })
  // APIs for segments in a document
  /**
   * Loads the segments of a document.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param params - `SegmentsQuery` forwarded as query parameters.
   * @returns The result of `get<SegmentsResponse>`.
   */
  export const fetchSegments: Fetcher<SegmentsResponse, CommonDocReq & { params: SegmentsQuery }> = ({ datasetId, documentId, params }) =>
    get<SegmentsResponse>(`/datasets/${datasetId}/documents/${documentId}/segments`, { params })
  /**
   * Calls `patch` on the segment's `enable` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param segmentId - Segment id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const enableSegment: Fetcher<CommonResponse, { datasetId: string; segmentId: string }> = ({ datasetId, segmentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/segments/${segmentId}/enable`)
  /**
   * Calls `patch` on the segment's `disable` endpoint.
   *
   * @param datasetId - Dataset id used in the path.
   * @param segmentId - Segment id used in the path.
   * @returns The result of `patch<CommonResponse>`.
   */
  export const disableSegment: Fetcher<CommonResponse, { datasetId: string; segmentId: string }> = ({ datasetId, segmentId }) =>
    patch<CommonResponse>(`/datasets/${datasetId}/segments/${segmentId}/disable`)
  /**
   * Patches one segment of a document.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param segmentId - Segment id used in the path.
   * @param body - `SegmentUpdater` forwarded as the request body.
   * @returns The result of `patch`, typed as `{ data: SegmentDetailModel; doc_form: string }`.
   */
  export const updateSegment: Fetcher<{ data: SegmentDetailModel; doc_form: string }, { datasetId: string; documentId: string; segmentId: string; body: SegmentUpdater }> = ({ datasetId, documentId, segmentId, body }) => {
    const endpoint = `/datasets/${datasetId}/documents/${documentId}/segments/${segmentId}`
    return patch<{ data: SegmentDetailModel; doc_form: string }>(endpoint, { body })
  }
  /**
   * Adds a segment to a document. Note the singular `segment` in the path.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param body - `SegmentUpdater` forwarded as the request body.
   * @returns The result of `post`, typed as `{ data: SegmentDetailModel; doc_form: string }`.
   */
  export const addSegment: Fetcher<{ data: SegmentDetailModel; doc_form: string }, { datasetId: string; documentId: string; body: SegmentUpdater }> = ({ datasetId, documentId, body }) => {
    const endpoint = `/datasets/${datasetId}/documents/${documentId}/segment`
    return post<{ data: SegmentDetailModel; doc_form: string }>(endpoint, { body })
  }
  /**
   * Deletes one segment of a document through the `del` helper.
   *
   * @param datasetId - Dataset id used in the path.
   * @param documentId - Document id used in the path.
   * @param segmentId - Segment id used in the path.
   * @returns The result of `del<CommonResponse>`.
   */
  export const deleteSegment: Fetcher<CommonResponse, { datasetId: string; documentId: string; segmentId: string }> = ({ datasetId, documentId, segmentId }) =>
    del<CommonResponse>(`/datasets/${datasetId}/documents/${documentId}/segments/${segmentId}`)
  /**
   * Posts a `FormData` payload to a caller-supplied URL to start a segment batch import.
   *
   * The helper is called with `bodyStringify: false` and `deleteContentType: true`.
   * NOTE(review): presumably so the FormData is sent as-is and the runtime sets the
   * multipart Content-Type itself — confirm against `./base`.
   *
   * @param url - Endpoint passed unchanged to `post`.
   * @param body - `FormData` forwarded as the request body.
   * @returns The result of `post`, typed as `{ job_id: string; job_status: string }`.
   */
  export const segmentBatchImport: Fetcher<{ job_id: string; job_status: string }, { url: string; body: FormData }> = ({ url, body }) => {
    const uploadOptions = { bodyStringify: false, deleteContentType: true }
    return post<{ job_id: string; job_status: string }>(url, { body }, uploadOptions)
  }
  /**
   * Loads the status of a segment batch-import job.
   *
   * @param jobID - Job id interpolated into `/datasets/batch_import_status/{jobID}`.
   * @returns The result of `get`, typed as `{ job_id: string; job_status: string }`.
   */
  export const checkSegmentBatchImportProgress: Fetcher<{ job_id: string; job_status: string }, { jobID: string }> = ({ jobID }) =>
    get<{ job_id: string; job_status: string }>(`/datasets/batch_import_status/${jobID}`)
  // APIs for hit testing
  /**
   * Runs a hit test against a dataset.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/hit-testing`.
   * @param queryText - Sent in the body under the key `query`.
   * @param retrieval_model - `RetrievalConfig` sent in the body under the same key.
   * @returns The result of `post<HitTestingResponse>`.
   */
  export const hitTesting: Fetcher<HitTestingResponse, { datasetId: string; queryText: string; retrieval_model: RetrievalConfig }> = ({ datasetId, queryText, retrieval_model }) => {
    const payload = { query: queryText, retrieval_model }
    return post<HitTestingResponse>(`/datasets/${datasetId}/hit-testing`, { body: payload })
  }
  /**
   * Runs a hit test against an external knowledge base.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/external-hit-testing`.
   * @param query - Query text sent in the body.
   * @param external_retrieval_model - `top_k`, `score_threshold` and `score_threshold_enabled`, sent in the body.
   * @returns The result of `post<ExternalKnowledgeBaseHitTestingResponse>`.
   */
  export const externalKnowledgeBaseHitTesting: Fetcher<ExternalKnowledgeBaseHitTestingResponse, { datasetId: string; query: string; external_retrieval_model: { top_k: number; score_threshold: number; score_threshold_enabled: boolean } }> = ({ datasetId, query, external_retrieval_model }) => {
    const payload = { query, external_retrieval_model }
    return post<ExternalKnowledgeBaseHitTestingResponse>(`/datasets/${datasetId}/external-hit-testing`, { body: payload })
  }
  /**
   * Loads a page of hit-testing records from the dataset's `queries` endpoint.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/queries`.
   * @param params - `page` and `limit`, forwarded as query parameters.
   * @returns The result of `get<HitTestingRecordsResponse>`.
   */
  export const fetchTestingRecords: Fetcher<HitTestingRecordsResponse, { datasetId: string; params: { page: number; limit: number } }> = ({ datasetId, params }) =>
    get<HitTestingRecordsResponse>(`/datasets/${datasetId}/queries`, { params })
  /**
   * Requests an indexing estimate by posting to `/datasets/indexing-estimate`.
   *
   * @param body - `IndexingEstimateParams`; the whole argument is sent as the request body.
   * @returns The result of `post<FileIndexingEstimateResponse>`.
   */
  export const fetchFileIndexingEstimate: Fetcher<FileIndexingEstimateResponse, IndexingEstimateParams> = (body: IndexingEstimateParams) =>
    post<FileIndexingEstimateResponse>('/datasets/indexing-estimate', { body })
  /**
   * Loads the preview content of a Notion page.
   *
   * The path is `notion/workspaces/{workspaceID}/pages/{pageID}/{pageType}/preview`,
   * with no leading slash, unlike the `/datasets/...` paths in this file.
   *
   * @param workspaceID - Workspace id used in the path.
   * @param pageID - Page id used in the path.
   * @param pageType - Page type used in the path.
   * @returns The result of `get`, typed as `{ content: string }`.
   */
  export const fetchNotionPagePreview: Fetcher<{ content: string }, { workspaceID: string; pageID: string; pageType: string }> = ({ workspaceID, pageID, pageType }) => {
    const endpoint = `notion/workspaces/${workspaceID}/pages/${pageID}/${pageType}/preview`
    return get<{ content: string }>(endpoint)
  }
  /**
   * Loads the API key list from a caller-supplied URL.
   *
   * NOTE(review): `params` is handed to `get` as its entire second argument, whereas
   * other fetchers in this file wrap it as `{ params }`. Confirm callers pass an
   * options-shaped object.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @param params - Passed unchanged as the second argument of `get`.
   * @returns The result of `get<ApiKeysListResponse>`.
   */
  export const fetchApiKeysList: Fetcher<ApiKeysListResponse, { url: string; params: Record<string, any> }> = ({ url, params }) =>
    get<ApiKeysListResponse>(url, params)
  /**
   * Deletes an API key at a caller-supplied URL.
   *
   * NOTE(review): `params` is handed to `del` as its entire second argument rather
   * than wrapped as `{ params }`. Confirm callers pass an options-shaped object.
   *
   * @param url - Endpoint passed unchanged to `del`.
   * @param params - Passed unchanged as the second argument of `del`.
   * @returns The result of `del<CommonResponse>`.
   */
  export const delApikey: Fetcher<CommonResponse, { url: string; params: Record<string, any> }> = ({ url, params }) =>
    del<CommonResponse>(url, params)
  /**
   * Creates an API key at a caller-supplied URL.
   *
   * NOTE(review): `body` is handed to `post` as its entire second argument, whereas
   * other creators in this file wrap it as `{ body }`. Confirm callers pass an
   * options-shaped object.
   *
   * @param url - Endpoint passed unchanged to `post`.
   * @param body - Passed unchanged as the second argument of `post`.
   * @returns The result of `post<CreateApiKeyResponse>`.
   */
  export const createApikey: Fetcher<CreateApiKeyResponse, { url: string; body: Record<string, any> }> = ({ url, body }) =>
    post<CreateApiKeyResponse>(url, body)
  /**
   * Loads the dataset API base URL from a caller-supplied endpoint.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @returns The result of `get`, typed as `{ api_base_url: string }`.
   */
  export const fetchDatasetApiBaseUrl: Fetcher<{ api_base_url: string }, string> = url =>
    get<{ api_base_url: string }>(url)
  /**
   * Calls `get` on `api-key-auth/data-source`. Takes no arguments and is not typed as a `Fetcher`.
   *
   * @returns The result of `get<CommonResponse>`.
   */
  export const fetchDataSources = () => get<CommonResponse>('api-key-auth/data-source')
  /**
   * Posts to `api-key-auth/data-source/binding`.
   *
   * @param body - Arbitrary record; the whole argument is sent as the request body.
   * @returns The result of `post<CommonResponse>`.
   */
  export const createDataSourceApiKeyBinding: Fetcher<CommonResponse, Record<string, any>> = body =>
    post<CommonResponse>('api-key-auth/data-source/binding', { body })
  /**
   * Calls `del` on `api-key-auth/data-source/{id}`.
   *
   * @param id - Id interpolated into the path.
   * @returns The result of `del<CommonResponse>`.
   */
  export const removeDataSourceApiKeyBinding: Fetcher<CommonResponse, string> = (id: string) =>
    del<CommonResponse>(`api-key-auth/data-source/${id}`)
  /**
   * Posts a crawl request to `website/crawl` for the Firecrawl provider.
   *
   * @param body - Arbitrary record spread into the request body. `provider` is set
   *   after the spread, so a `provider` key in `body` is overwritten.
   * @returns The result of `post<CommonResponse>`.
   */
  export const createFirecrawlTask: Fetcher<CommonResponse, Record<string, any>> = (body) => {
    const payload = { ...body, provider: DataSourceProvider.fireCrawl }
    return post<CommonResponse>('website/crawl', { body: payload })
  }
  /**
   * Loads the status of a Firecrawl crawl job.
   *
   * The request is sent with `silent: true` as the third argument to `get`.
   * NOTE(review): presumably this suppresses the helper's error notification — confirm in `./base`.
   *
   * @param jobId - Job id interpolated into `website/crawl/status/{jobId}`.
   * @returns The result of `get<CommonResponse>`.
   */
  export const checkFirecrawlTaskStatus: Fetcher<CommonResponse, string> = (jobId: string) => {
    const query = { provider: DataSourceProvider.fireCrawl }
    return get<CommonResponse>(`website/crawl/status/${jobId}`, { params: query }, { silent: true })
  }
  /**
   * Posts a crawl request to `website/crawl` for the Jina Reader provider.
   *
   * @param body - Arbitrary record spread into the request body. `provider` is set
   *   after the spread, so a `provider` key in `body` is overwritten.
   * @returns The result of `post<CommonResponse>`.
   */
  export const createJinaReaderTask: Fetcher<CommonResponse, Record<string, any>> = (body) => {
    const payload = { ...body, provider: DataSourceProvider.jinaReader }
    return post<CommonResponse>('website/crawl', { body: payload })
  }
  /**
   * Loads the status of a Jina Reader crawl job.
   *
   * The provider comes from `DataSourceProvider.jinaReader`, the same enum member
   * `createJinaReaderTask` sends, instead of a separate string literal, so the two
   * requests cannot drift apart.
   * NOTE(review): this assumes `DataSourceProvider.jinaReader === 'jinareader'` — confirm in `@/models/common`.
   *
   * The request is sent with `silent: true` as the third argument to `get`.
   * NOTE(review): presumably this suppresses the helper's error notification — confirm in `./base`.
   *
   * @param jobId - Job id interpolated into `website/crawl/status/{jobId}`.
   * @returns The result of `get<CommonResponse>`.
   */
  export const checkJinaReaderTaskStatus: Fetcher<CommonResponse, string> = (jobId: string) => {
    return get<CommonResponse>(`website/crawl/status/${jobId}`, {
      params: {
        provider: DataSourceProvider.jinaReader,
      },
    }, {
      silent: true,
    })
  }
  /** Response shape of `fetchSupportFileTypes`: a list of allowed file extensions. */
  type FileTypesRes = { allowed_extensions: Array<string> }
  /**
   * Loads the allowed file extensions from a caller-supplied URL.
   *
   * @param url - Endpoint passed unchanged to `get`.
   * @returns The result of `get<FileTypesRes>`.
   */
  export const fetchSupportFileTypes: Fetcher<FileTypesRes, { url: string }> = ({ url }) =>
    get<FileTypesRes>(url)
  /**
   * Loads the dataset's `error-docs` listing.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/error-docs`.
   * @returns The result of `get<ErrorDocsResponse>`.
   */
  export const getErrorDocs: Fetcher<ErrorDocsResponse, { datasetId: string }> = ({ datasetId }) =>
    get<ErrorDocsResponse>(`/datasets/${datasetId}/error-docs`)
  /**
   * Posts a list of document ids to the dataset's `retry` endpoint.
   *
   * @param datasetId - Id interpolated into `/datasets/{datasetId}/retry`.
   * @param document_ids - Document ids sent in the body under the same key.
   * @returns The result of `post<CommonResponse>`.
   */
  export const retryErrorDocs: Fetcher<CommonResponse, { datasetId: string; document_ids: string[] }> = ({ datasetId, document_ids }) => {
    const payload = { document_ids }
    return post<CommonResponse>(`/datasets/${datasetId}/retry`, { body: payload })
  }