pdf2json

v3.1.3
PDF file parser that converts PDF binaries to text-based JSON, powered by a fork of PDF.js ported to Node.js
pdf, pdf parser, pdf2json, convert pdf to json, server side PDF parser, port pdf.js to node.js, PDF to text, PDF text extractor, PDF binary to text, and 6 more...

test

jest --config ./jest.config.json && npm run parse-r && npm run parse-fd

build

npm run build:bundle-pdfjs-base && npm run build:rollup

parse

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form

parse-c

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form -s -t -c

parse-e

./bin/pdf2json.js -f ./test/pdf/misc/i43_encrypted.pdf -o ./test/target/misc

parse-m

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form -s -t -c -m

parse-r

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form -t -c -m -r

parse-s

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form -s

parse-t

./bin/pdf2json.js -f ./test/pdf/fd/form/F1040.pdf -o ./test/target/fd/form -s -t

prepare

npm run build

pretest

npm run build

parse-fd

./bin/pdf2json.js -f ./test/pdf/fd/form/ -o ./test/target/fd/form -t -c -m -r

parse-tb

./bin/pdf2json.js -f ./test/pdf/misc/i242_testingWithTable.pdf -o ./test/target/misc

parse-tc

./bin/pdf2json.js -f ./test/pdf/misc/i293_pdfpac.pdf -o ./test/target/misc

test:jest

jest --config ./jest.config.json

test:misc

cd ./test && sh p2j.one.sh misc . "Expected: 12 success, 3 fail exception with stack trace"

test:forms

cd ./test && sh p2j.forms.sh

build:rollup

rollup -c ./rollup.config.js

parse-rectFix

./bin/pdf2json.js -f ./test/pdf/misc/pr298_rect_fix_from_upstream.pdf -o ./test/target/misc

build:bundle-pdfjs-base

node rollup/bundle-pdfjs-base.js

Metadata

Downloads

Maintainers