Package com.bytedesk.kbase.llm_file
Class FileChunkService
java.lang.Object
com.bytedesk.kbase.llm_file.FileChunkService
-
Field Summary
Fields -
Constructor Summary
Constructors -
Method Summary
Modifier and Type | Method | Description
List<org.springframework.ai.document.Document> | parseFileContent(UploadEntity upload) | https://docs.spring.io/spring-ai/reference/api/etl-pipeline.html
List<org.springframework.ai.document.Document> | readByTika(org.springframework.core.io.Resource resource) |
List<org.springframework.ai.document.Document> | readJson(org.springframework.core.io.Resource resource) |
List<org.springframework.ai.document.Document> | readMarkdown(org.springframework.core.io.Resource resource) |
List<org.springframework.ai.document.Document> | readPdfPage(org.springframework.core.io.Resource resource) |
List<org.springframework.ai.document.Document> | readPdfParagraph(org.springframework.core.io.Resource resource) |
List<org.springframework.ai.document.Document> | readTxt(org.springframework.core.io.Resource resource) |
-
Field Details
-
uploadRestService
-
-
Constructor Details
-
FileChunkService
public FileChunkService()
-
-
Method Details
-
parseFileContent
https://docs.spring.io/spring-ai/reference/api/etl-pipeline.html -
readPdfPage
public List<org.springframework.ai.document.Document> readPdfPage(org.springframework.core.io.Resource resource) -
readPdfParagraph
public List<org.springframework.ai.document.Document> readPdfParagraph(org.springframework.core.io.Resource resource) -
readJson
public List<org.springframework.ai.document.Document> readJson(org.springframework.core.io.Resource resource) -
readMarkdown
public List<org.springframework.ai.document.Document> readMarkdown(org.springframework.core.io.Resource resource) -
readTxt
public List<org.springframework.ai.document.Document> readTxt(org.springframework.core.io.Resource resource) -
readByTika
public List<org.springframework.ai.document.Document> readByTika(org.springframework.core.io.Resource resource)
-