use pdf-parse

This commit is contained in:
Henry
2023-04-13 19:56:48 +01:00
parent 02d8284f58
commit 930449f956
2 changed files with 5 additions and 3 deletions
@@ -66,7 +66,8 @@ class Pdf_DocumentLoaders implements INode {
const blob = new Blob([bf])
if (usage === 'perFile') {
const loader = new PDFLoader(blob, { splitPages: false })
// @ts-ignore
const loader = new PDFLoader(blob, { splitPages: false, pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') })
if (textSplitter) {
const docs = await loader.loadAndSplit(textSplitter)
return docs
@@ -75,7 +76,8 @@ class Pdf_DocumentLoaders implements INode {
return docs
}
} else {
const loader = new PDFLoader(blob)
// @ts-ignore
const loader = new PDFLoader(blob, { pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') })
if (textSplitter) {
const docs = await loader.loadAndSplit(textSplitter)
return docs