Skip to content

Commit 11a810c

Browse files
authored
Merge pull request #5 from FlowiseAI/bugfix/PDFLoader
Bugfix/Use pdf-parse
2 parents 9eb9964 + 930449f commit 11a810c

File tree

2 files changed

+5
-3
lines changed

2 files changed

+5
-3
lines changed

packages/components/nodes/documentloaders/Pdf/Pdf.ts

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -63,7 +63,8 @@ class Pdf_DocumentLoaders implements INode {
6363
const blob = new Blob([bf])
6464

6565
if (usage === 'perFile') {
66-
const loader = new PDFLoader(blob, { splitPages: false })
66+
// @ts-ignore
67+
const loader = new PDFLoader(blob, { splitPages: false, pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') })
6768
if (textSplitter) {
6869
const docs = await loader.loadAndSplit(textSplitter)
6970
return docs
@@ -72,7 +73,8 @@ class Pdf_DocumentLoaders implements INode {
7273
return docs
7374
}
7475
} else {
75-
const loader = new PDFLoader(blob)
76+
// @ts-ignore
77+
const loader = new PDFLoader(blob, { pdfjs: () => import('pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js') })
7678
if (textSplitter) {
7779
const docs = await loader.loadAndSplit(textSplitter)
7880
return docs

packages/components/package.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
"langchain": "^0.0.53",
2828
"moment": "^2.29.3",
2929
"node-fetch": "2",
30-
"pdfjs-dist": "^3.5.141",
30+
"pdf-parse": "^1.1.1",
3131
"ws": "^8.9.0"
3232
},
3333
"devDependencies": {

0 commit comments

Comments (0)