diff --git a/packages/components/nodes/documentloaders/Pdf/Pdf.ts b/packages/components/nodes/documentloaders/Pdf/Pdf.ts index 10e12226..936259cb 100644 --- a/packages/components/nodes/documentloaders/Pdf/Pdf.ts +++ b/packages/components/nodes/documentloaders/Pdf/Pdf.ts @@ -66,7 +66,8 @@ class Pdf_DocumentLoaders implements INode { const blob = new Blob([bf]) if (usage === 'perFile') { - const loader = new PDFLoader(blob, { splitPages: false }) + // @ts-ignore + const loader = new PDFLoader(blob, { splitPages: false, pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') }) if (textSplitter) { const docs = await loader.loadAndSplit(textSplitter) return docs @@ -75,7 +76,8 @@ class Pdf_DocumentLoaders implements INode { return docs } } else { - const loader = new PDFLoader(blob) + // @ts-ignore + const loader = new PDFLoader(blob, { pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') }) if (textSplitter) { const docs = await loader.loadAndSplit(textSplitter) return docs diff --git a/packages/components/package.json b/packages/components/package.json index 0a211553..a80c434e 100644 --- a/packages/components/package.json +++ b/packages/components/package.json @@ -27,7 +27,7 @@ "langchain": "^0.0.44", "moment": "^2.29.3", "node-fetch": "2", - "pdfjs-dist": "^3.5.141", + "pdf-parse": "^1.1.1", "ws": "^8.9.0" }, "devDependencies": {