Skip to content

Commit

Permalink
fix(pdf): recognise .mjs deps, use Uint8Array
Browse files (browse the repository at this point in the history)
  • Loading branch information
LoneRifle committed May 23, 2024
1 parent e697ec2 commit 767ffcc
Show file tree
Hide file tree
Showing 2 changed files with 7 additions and 3 deletions.
2 changes: 1 addition & 1 deletion lib/pdf2md-cli.js
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,7 @@ async function createMarkdownFiles (filePaths, allOutputPaths) {
const callbacks = allOutputPaths[i] && {}
const pdfBuffer = fs.readFileSync(filePath)
try {
- const text = await pdf2md(pdfBuffer, callbacks)
+ const text = await pdf2md(new Uint8Array(pdfBuffer), callbacks)
const outputFile = allOutputPaths[i] + '.md'
console.log(`Writing to ${outputFile}...`)
fs.writeFileSync(path.resolve(outputFile), text)
Expand Down
8 changes: 6 additions & 2 deletions lib/util/pdf.js
Original file line number Diff line number Diff line change
@@ -1,6 +1,9 @@
const path = require('path')
- const pdfjs = require('pdfjs-dist/legacy/build/pdf')
- pdfjs.GlobalWorkerOptions.workerSrc = `pdfjs-dist/legacy/build/pdf.worker`
+ const pdfjsPromise = import('pdfjs-dist/build/pdf.mjs')
+
+ pdfjsPromise.then((pdfjs) => {
+ pdfjs.GlobalWorkerOptions.workerSrc = `pdfjs-dist/build/pdf.worker.mjs`
+ })

const { findPageNumbers, findFirstPage, removePageNumber } = require('../../lib/util/page-number-functions')
const TextItem = require('../models/TextItem')
Expand All @@ -22,6 +25,7 @@ exports.parse = async function parse (docOptions, callbacks) {
} else if (docOptions instanceof ArrayBuffer || ArrayBuffer.isView(docOptions)) {
docOptions = { data: docOptions };
}
+ const pdfjs = await pdfjsPromise
const pdfDocument = await pdfjs.getDocument(
{
...docOptions,
Expand Down

0 comments on commit 767ffcc

Please sign in to comment.