diff --git a/packages/components/nodes/documentloaders/Pdf/Pdf.ts b/packages/components/nodes/documentloaders/Pdf/Pdf.ts index 49b6e52fc..7933e6a04 100644 --- a/packages/components/nodes/documentloaders/Pdf/Pdf.ts +++ b/packages/components/nodes/documentloaders/Pdf/Pdf.ts @@ -63,7 +63,8 @@ class Pdf_DocumentLoaders implements INode { const blob = new Blob([bf]) if (usage === 'perFile') { - const loader = new PDFLoader(blob, { splitPages: false }) + // @ts-ignore + const loader = new PDFLoader(blob, { splitPages: false, pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') }) if (textSplitter) { const docs = await loader.loadAndSplit(textSplitter) return docs @@ -72,7 +73,8 @@ class Pdf_DocumentLoaders implements INode { return docs } } else { - const loader = new PDFLoader(blob) + // @ts-ignore + const loader = new PDFLoader(blob, { pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') }) if (textSplitter) { const docs = await loader.loadAndSplit(textSplitter) return docs diff --git a/packages/components/package.json b/packages/components/package.json index 84c2b9a2a..34da56a15 100644 --- a/packages/components/package.json +++ b/packages/components/package.json @@ -27,7 +27,7 @@ "langchain": "^0.0.53", "moment": "^2.29.3", "node-fetch": "2", - "pdfjs-dist": "^3.5.141", + "pdf-parse": "^1.1.1", "ws": "^8.9.0" }, "devDependencies": {