-
Notifications
You must be signed in to change notification settings - Fork 0
/
reader.js
57 lines (51 loc) · 1.54 KB
/
reader.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
const PFParser = require("pdf2json/pdfparser"); // doc: https://github.com/modesty/pdf2json
/**
 * Collects, for every page of a parsed PDF, the decoded text of the item at
 * position `index` in that page's `Texts` array, then reports the result
 * through an error-first callback.
 *
 * @param {object} pdf - Parsed PDF data; read as `pdf.formImage.Pages[].Texts[].R[0].T`.
 * @param {function(?Error, string[]=): void} handler - Called exactly once:
 *   `handler(null, names)` on success, `handler(error)` if the data could not be read.
 * @param {number} index - Position of the wanted item inside each page's `Texts` array.
 */
function forEachItem(pdf, handler, index) {
  let names;
  try {
    names = pdf.formImage.Pages.map((page, pageNumber) => {
      const item = page.Texts[index];
      if (item === undefined) {
        // Without this guard `item.R` would throw an opaque TypeError.
        throw new RangeError(
          `No text item at index ${index} on page ${pageNumber + 1}`
        );
      }
      // Text runs are stored URI-encoded; decodeURIComponent throws a
      // URIError on malformed escape sequences, which is caught below.
      return decodeURIComponent(item.R[0].T);
    });
  } catch (error) {
    // Report through the callback instead of throwing out of the caller.
    handler(error);
    return;
  }
  // Invoked outside the try block so an exception raised by the handler
  // itself is not mistaken for a parse failure and reported back to it.
  handler(null, names);
}
/**
 * Finds the position, within a page's `Texts` array, of the first text item
 * whose decoded content equals `keyword`. Pages are scanned in order and the
 * search stops at the first page that contains a match.
 *
 * @param {object} pdf - Parsed PDF data; read as `pdf.formImage.Pages[].Texts[].R[0].T`.
 * @param {string} keyword - Exact (decoded) text to look for.
 * @returns {Promise<number>} Resolves with the index of the matching item in
 *   its page's `Texts` array, or `-1` when no page contains the keyword.
 *   Rejects if the data cannot be read (an exception thrown while scanning).
 */
function getIndex(pdf, keyword) {
  // The Promise executor turns any synchronous throw (missing fields,
  // malformed URI escapes) into a rejection.
  return new Promise(resolve => {
    for (const page of pdf.formImage.Pages) {
      const index = page.Texts.findIndex(
        item => decodeURIComponent(item.R[0].T) === keyword
      );
      if (index !== -1) {
        resolve(index);
        return;
      }
    }
    // Always settle: without this, a missing keyword left the promise
    // pending forever and callers would hang.
    resolve(-1);
  });
}
/**
 * Reader: constructor for the object exported by this module. It takes no
 * arguments and stores no state; its methods are attached to Reader.prototype.
 */
function Reader() {}
/**
 * parseBuffer: parses a PDF supplied as a buffer and reports through itemHandler.
 *
 * itemHandler is registered directly as the parser's "pdfParser_dataError"
 * listener, so it receives whatever the parser emits with that event. When
 * the parser emits "pdfParser_dataReady", the parsed data is handed to
 * forEachItem together with itemHandler and index.
 *
 * @param {Buffer} pdfBuffer - PDF file contents.
 * @param {function} itemHandler - Callback receiving the error or the result.
 * @param {number} index - Forwarded unchanged to forEachItem.
 */
Reader.prototype.parseBuffer = (pdfBuffer, itemHandler, index) => {
  const parser = new PFParser();

  const onDataReady = parsedData => {
    forEachItem(parsedData, itemHandler, index);
  };

  parser.on("pdfParser_dataError", itemHandler);
  parser.on("pdfParser_dataReady", onDataReady);

  parser.parseBuffer(pdfBuffer);
};
/**
 * getIndex: parses a PDF supplied as a buffer and looks up `keyword` in the
 * parsed data using the module-level getIndex helper.
 *
 * @param {Buffer} pdfBuffer - PDF file contents.
 * @param {string} keyword - Text to search for; forwarded to the getIndex helper.
 * @returns {Promise<number>} Settles with the outcome of the getIndex helper.
 *   Rejects with Error("pdfParser_dataError") when the parser emits
 *   "pdfParser_dataError"; the emitted payload is attached as `error.cause`.
 */
Reader.prototype.getIndex = (pdfBuffer, keyword) => {
  return new Promise((resolve, reject) => {
    const pdfParser = new PFParser();
    pdfParser.on("pdfParser_dataError", errData => {
      // Throwing inside an event listener never reaches the promise, so the
      // caller would wait forever; reject explicitly instead.
      const error = new Error("pdfParser_dataError");
      error.cause = errData;
      reject(error);
    });
    pdfParser.on("pdfParser_dataReady", pdfData => {
      // Resolving with the helper's promise makes this promise adopt its
      // eventual value or rejection.
      resolve(getIndex(pdfData, keyword));
    });
    pdfParser.parseBuffer(pdfBuffer);
  });
};
module.exports = Reader;