Files
bentopdf/public/workers/pdf-to-json.worker.js

53 lines
1.4 KiB
JavaScript
Raw Normal View History

const baseUrl = self.location.href.substring(0, self.location.href.lastIndexOf('/workers/') + 1);
self.importScripts(baseUrl + 'coherentpdf.browser.min.js');
function convertPDFsToJSONInWorker(fileBuffers, fileNames) {
try {
const jsonFiles = [];
const transferBuffers = [];
for (let i = 0; i < fileBuffers.length; i++) {
const buffer = fileBuffers[i];
const fileName = fileNames[i];
const uint8Array = new Uint8Array(buffer);
const pdf = coherentpdf.fromMemory(uint8Array, '');
//TODO:@ALAM -> add options for users to select these settings
// parse_content: true, no_stream_data: false, decompress_streams: false
const jsonData = coherentpdf.outputJSONMemory(true, false, false, pdf);
const jsonBuffer = jsonData.buffer.slice(0);
jsonFiles.push({
name: fileName,
data: jsonBuffer,
});
transferBuffers.push(jsonBuffer);
coherentpdf.deletePdf(pdf);
}
self.postMessage(
{
status: 'success',
jsonFiles: jsonFiles,
},
transferBuffers
);
} catch (error) {
self.postMessage({
status: 'error',
message:
error instanceof Error
? error.message
: 'Unknown error during PDF to JSON conversion.',
});
}
}
self.onmessage = (e) => {
if (e.data.command === 'convert') {
convertPDFsToJSONInWorker(e.data.fileBuffers, e.data.fileNames);
}
};