From ef7b9d03653b259a12b36add1cae0a0682f537ed Mon Sep 17 00:00:00 2001 From: Shirshendu R Tripathi Date: Sun, 19 Oct 2025 22:12:51 +0530 Subject: [PATCH 1/2] Fix#20 OCR pdf text not selectable --- src/js/logic/ocr-pdf.ts | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/js/logic/ocr-pdf.ts b/src/js/logic/ocr-pdf.ts index 2cf5aec..d74b510 100644 --- a/src/js/logic/ocr-pdf.ts +++ b/src/js/logic/ocr-pdf.ts @@ -144,7 +144,7 @@ async function runOCR() { binarizeCanvas(context); } - const result = await worker.recognize(canvas); + const result = await worker.recognize(canvas, {}, { text: true, hocr: true }); const data = result.data; const newPage = newPdfDoc.addPage([viewport.width, viewport.height]); const pngImageBytes = await new Promise((resolve) => @@ -192,7 +192,7 @@ async function runOCR() { font, size: fontSize, color: rgb(0, 0, 0), - opacity: 0, + opacity: 0.1, }); } catch (error) { // If drawing fails despite sanitization, log and skip this word From 797d8f5b9d9411925915671aa31f40749bb4a670 Mon Sep 17 00:00:00 2001 From: Shirshendu R Tripathi Date: Sun, 19 Oct 2025 22:13:49 +0530 Subject: [PATCH 2/2] Fix#20 OCR pdf text not selectable --- src/js/logic/ocr-pdf.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/js/logic/ocr-pdf.ts b/src/js/logic/ocr-pdf.ts index d74b510..8219dac 100644 --- a/src/js/logic/ocr-pdf.ts +++ b/src/js/logic/ocr-pdf.ts @@ -192,7 +192,7 @@ async function runOCR() { font, size: fontSize, color: rgb(0, 0, 0), - opacity: 0.1, + opacity: 0, }); } catch (error) { // If drawing fails despite sanitization, log and skip this word