From b82bff7236e64db6ecbe4268c7251c19d43cc36f Mon Sep 17 00:00:00 2001
From: sanj <67624670+iodrift@users.noreply.github.com>
Date: Mon, 24 Feb 2025 14:35:49 -0800
Subject: [PATCH] Auto-update: Mon Feb 24 14:35:49 PST 2025

---
 jpgpdfocr | 27 ++++++++++++++++++++++++++-
 1 file changed, 26 insertions(+), 1 deletion(-)

diff --git a/jpgpdfocr b/jpgpdfocr
index 4581e73..58ad319 100755
--- a/jpgpdfocr
+++ b/jpgpdfocr
@@ -1,7 +1,32 @@
 #!/usr/bin/env python3
-import io
+"""
+jpgpdfocr - Convert JPG images to a searchable PDF using OCR.
+
+This script processes a directory of JPG images, runs OCR (Optical Character Recognition)
+on each image using Tesseract, and merges them into a single searchable PDF.
+
+Usage:
+    ./jpgpdfocr --input <directory> [--output <file>] [--lang <language>]
+                [--threads <num>] [--quiet]
+
+Arguments:
+    --input, -i    Directory containing JPG files (required).
+    --output, -o   Output PDF filename (default: <input_folder>_searchable.pdf).
+    --lang, -l     OCR language (default: 'eng').
+    --threads, -t  Number of threads for OCR (default: auto-detect CPU cores).
+    --quiet, -q    Suppress output messages.
+
+Dependencies:
+    - Python 3
+    - Pillow (imported as PIL)
+    - pytesseract (Python wrapper; requires the Tesseract OCR engine to be installed)
+    - PyPDF2
+    - concurrent.futures (standard library)
+"""
+
 import os
 import argparse
+import io
 from PIL import Image
 import pytesseract
 import concurrent.futures