Added OCR PDF, CAD to PDF/image, Animated WebP/GIF

2026-07-01 23:17:37 +08:00 · 2026-04-19 10:53:59 +07:00
parent b329efe6ad
commit a07b480a71
5 changed files with 336 additions and 2 deletions
@@ -1,6 +1,6 @@
 # Your Everyday Tools

-A lightweight, self-hosted web app that bundles 48 everyday utilities into a single interface. Built with Python + Flask, zero JavaScript frameworks, and minimal CSS — no bloat, just tools.
+A lightweight, self-hosted web app that bundles 51 everyday utilities into a single interface. Built with Python + Flask, zero JavaScript frameworks, and minimal CSS — no bloat, just tools.

 ![Python](https://img.shields.io/badge/Python-3.10+-blue)
 ![Flask](https://img.shields.io/badge/Flask-3.x-green)
@@ -27,6 +27,8 @@ A lightweight, self-hosted web app that bundles 48 everyday utilities into a sin
 | **PDF to Images** | Export each PDF page as PNG or JPG (configurable DPI) |
 | **PDF to Text** | Extract all text content from a PDF |
 | **HTML to PDF** | Convert HTML content to a PDF document |
+| **OCR PDF** | Make scanned PDFs searchable (image + hidden text layer) or extract text — 14 languages supported |
+| **CAD to PDF/Image** | Convert DXF drawings to PDF or PNG (DWG via optional ODA File Converter) |

 ### PDF Tools
 | Tool | Description |
@@ -54,6 +56,7 @@ A lightweight, self-hosted web app that bundles 48 everyday utilities into a sin
 | **EXIF Viewer** | View or strip image metadata (EXIF data) for privacy |
 | **Favicon Generator** | Create .ico favicons from any image with multiple size options |
 | **Image to Text (OCR)** | Extract text from images using optical character recognition |
+| **Animated WebP/GIF** | Convert between animated GIF and animated WebP (preserves per-frame timing) |

 ### Text & Data (client-side, no upload needed)
 | Tool | Description |
@@ -138,7 +141,8 @@ The core app works out of the box with the main dependencies. Some features requ
 | `rembg` | Remove Background | Installs ONNX Runtime (~500 MB). The app works without it and shows a helpful message if missing. |
 | `pyzbar` | Read QR Code | Requires the [ZBar](https://github.com/NaturalHistoryMuseum/pyzbar#installation) shared library on your system. |
 | `pdf2docx` | PDF to Word | Pure Python, but conversion quality depends on PDF complexity. |
-| `pytesseract` | Image to Text (OCR) | Requires the [Tesseract](https://github.com/tesseract-ocr/tesseract) binary installed on your system. |
+| `pytesseract` | Image to Text (OCR), OCR PDF | Requires the [Tesseract](https://github.com/tesseract-ocr/tesseract) binary installed on your system. For non-English OCR, download the matching `*.traineddata` language pack into your Tesseract `tessdata` folder. |
+| `ezdxf` + `matplotlib` | CAD to PDF/Image | Renders DXF drawings. For DWG support, also install the free [ODA File Converter](https://www.opendesign.com/guestfiles/oda_file_converter) and make sure it's on your `PATH`. |

 If you only need the core tools, install the minimal set:

@@ -15,6 +15,8 @@ TOOL_CATEGORIES = [
            {"id": "pdf-to-images", "name": "PDF to Images", "desc": "Convert PDF pages to images", "icon": "bi-file-image-fill"},
            {"id": "pdf-to-text", "name": "PDF to Text", "desc": "Extract text content from PDF", "icon": "bi-file-text-fill"},
            {"id": "html-to-pdf", "name": "HTML to PDF", "desc": "Convert HTML content to PDF", "icon": "bi-filetype-html"},
+            {"id": "ocr-pdf", "name": "OCR PDF", "desc": "Make scanned PDFs searchable or extract text", "icon": "bi-file-earmark-text-fill"},
+            {"id": "cad-to-pdf", "name": "CAD to PDF/Image", "desc": "Convert DXF/DWG drawings to PDF or PNG", "icon": "bi-rulers"},
        ],
    },
    {
@@ -48,6 +50,7 @@ TOOL_CATEGORIES = [
            {"id": "exif", "name": "EXIF Viewer", "desc": "View and strip image metadata", "icon": "bi-info-circle-fill"},
            {"id": "favicon", "name": "Favicon Generator", "desc": "Create .ico favicons from images", "icon": "bi-app-indicator"},
            {"id": "ocr", "name": "Image to Text", "desc": "Extract text from images (OCR)", "icon": "bi-card-text"},
+            {"id": "animated", "name": "Animated WebP/GIF", "desc": "Convert between animated WebP and GIF", "icon": "bi-film"},
        ],
    },
    {
@@ -13,3 +13,5 @@ rembg
 pyzbar
 pdf2docx
 pytesseract
+ezdxf
+matplotlib
@@ -17,6 +17,26 @@ try:
 except ImportError:
    HAS_PDF2DOCX = False

+try:
+    import pytesseract
+    HAS_TESSERACT = True
+except ImportError:
+    HAS_TESSERACT = False
+
+try:
+    import ezdxf
+    from ezdxf.addons.drawing import RenderContext, Frontend
+    from ezdxf.addons.drawing.matplotlib import MatplotlibBackend
+    import matplotlib
+    matplotlib.use("Agg")
+    import matplotlib.pyplot as plt
+    HAS_EZDXF = True
+except ImportError:
+    HAS_EZDXF = False
+
+import shutil
+# Full path of the ODA File Converter executable if one of the two known
+# command names is found on PATH, otherwise None. DWG input is only accepted
+# when this is set.
+ODA_CONVERTER = shutil.which("ODAFileConverter") or shutil.which("oda_file_converter")
+
 bp = Blueprint("convert", __name__)


@@ -73,6 +93,68 @@ def pdf_to_text_page():
        options=[])


+# Choices for the "Language" selector on the OCR PDF form. Each "value" is the
+# code that the POST handler forwards to pytesseract as its `lang` argument;
+# "label" is the text shown to the user.
+OCR_LANGS = [
+    {"value": "eng", "label": "English"},
+    {"value": "ind", "label": "Indonesian"},
+    {"value": "fra", "label": "French"},
+    {"value": "deu", "label": "German"},
+    {"value": "spa", "label": "Spanish"},
+    {"value": "ita", "label": "Italian"},
+    {"value": "por", "label": "Portuguese"},
+    {"value": "rus", "label": "Russian"},
+    {"value": "chi_sim", "label": "Chinese (Simplified)"},
+    {"value": "chi_tra", "label": "Chinese (Traditional)"},
+    {"value": "jpn", "label": "Japanese"},
+    {"value": "kor", "label": "Korean"},
+    {"value": "ara", "label": "Arabic"},
+    {"value": "hin", "label": "Hindi"},
+]
+
+
+@bp.route("/ocr-pdf")
+def ocr_pdf_page():
+    return render_template("upload_tool.html",
+        title="OCR PDF",
+        description="Extract text from scanned PDFs or create a searchable PDF with a hidden text layer",
+        endpoint="/convert/ocr-pdf",
+        accept=".pdf",
+        multiple=False,
+        options=[
+            {"type": "select", "name": "mode", "label": "Output",
+             "choices": [
+                 {"value": "searchable", "label": "Searchable PDF (image + text layer)"},
+                 {"value": "text", "label": "Extracted text only"},
+             ]},
+            {"type": "select", "name": "lang", "label": "Language",
+             "choices": OCR_LANGS},
+            {"type": "number", "name": "dpi", "label": "OCR Resolution (DPI)",
+             "default": 200, "min": 100, "max": 400},
+        ])
+
+
+@bp.route("/cad-to-pdf")
+def cad_to_pdf_page():
+    desc = "Convert DXF (or DWG with ODA File Converter) drawings to PDF or PNG"
+    if not ODA_CONVERTER:
+        desc += " — DWG requires ODA File Converter on PATH"
+    return render_template("upload_tool.html",
+        title="CAD to PDF/Image",
+        description=desc,
+        endpoint="/convert/cad-to-pdf",
+        accept=".dxf,.dwg",
+        multiple=False,
+        options=[
+            {"type": "select", "name": "format", "label": "Output Format",
+             "choices": [
+                 {"value": "pdf", "label": "PDF"},
+                 {"value": "png", "label": "PNG"},
+             ]},
+            {"type": "number", "name": "dpi", "label": "PNG Resolution (DPI)",
+             "default": 150, "min": 72, "max": 600,
+             "depends_on": {"format": "png"}},
+        ])
+
+
@bp.route("/html-to-pdf")
 def html_to_pdf_page():
    return render_template("upload_tool.html",
@@ -357,3 +439,144 @@ def html_to_pdf():

    return send_file(output, mimetype="application/pdf",
                     as_attachment=True, download_name="converted.pdf")
+
+
+@bp.route("/ocr-pdf", methods=["POST"])
+def ocr_pdf():
+    if not HAS_TESSERACT:
+        return jsonify(error="OCR requires 'pytesseract' and the Tesseract binary. Install: pip install pytesseract, plus Tesseract from https://github.com/tesseract-ocr/tesseract"), 400
+
+    files = request.files.getlist("files")
+    if not files or not files[0].filename:
+        return jsonify(error="No file uploaded."), 400
+
+    mode = request.form.get("mode", "searchable")
+    lang = request.form.get("lang", "eng")
+    dpi = int(request.form.get("dpi", 200))
+
+    pdf_data = files[0].read()
+    src = fitz.open(stream=pdf_data, filetype="pdf")
+    zoom = dpi / 72
+
+    try:
+        if mode == "text":
+            text_parts = []
+            for i, page in enumerate(src):
+                pix = page.get_pixmap(matrix=fitz.Matrix(zoom, zoom))
+                img = Image.open(io.BytesIO(pix.tobytes("png")))
+                text = pytesseract.image_to_string(img, lang=lang)
+                text_parts.append(f"--- Page {i + 1} ---\n{text.strip()}")
+            src.close()
+            combined = "\n\n".join(text_parts).strip()
+            return jsonify(text=combined or "(No text detected)")
+
+        output = fitz.open()
+        for page in src:
+            pix = page.get_pixmap(matrix=fitz.Matrix(zoom, zoom))
+            img = Image.open(io.BytesIO(pix.tobytes("png")))
+            page_pdf_bytes = pytesseract.image_to_pdf_or_hocr(img, extension="pdf", lang=lang)
+            sub = fitz.open(stream=page_pdf_bytes, filetype="pdf")
+            output.insert_pdf(sub)
+            sub.close()
+        src.close()
+
+        buf = io.BytesIO()
+        output.save(buf)
+        output.close()
+        buf.seek(0)
+
+        name = files[0].filename.rsplit(".", 1)[0] + "_ocr.pdf"
+        return send_file(buf, mimetype="application/pdf",
+                         as_attachment=True, download_name=name)
+    except pytesseract.TesseractNotFoundError:
+        return jsonify(error="Tesseract binary not found. Install from https://github.com/tesseract-ocr/tesseract and ensure it is on PATH."), 400
+    except Exception as e:
+        msg = str(e)
+        if "language" in msg.lower() or "traineddata" in msg.lower():
+            return jsonify(error=f"Language pack '{lang}' not installed. Download its .traineddata file into your Tesseract tessdata directory."), 400
+        return jsonify(error=f"OCR failed: {msg}"), 400
+
+
+@bp.route("/cad-to-pdf", methods=["POST"])
+def cad_to_pdf():
+    if not HAS_EZDXF:
+        return jsonify(error="CAD conversion requires 'ezdxf' and 'matplotlib'. Install: pip install ezdxf matplotlib"), 400
+
+    files = request.files.getlist("files")
+    if not files or not files[0].filename:
+        return jsonify(error="No file uploaded."), 400
+
+    target = request.form.get("format", "pdf")
+    dpi = int(request.form.get("dpi", 150))
+
+    filename = files[0].filename
+    ext = filename.rsplit(".", 1)[-1].lower() if "." in filename else ""
+    file_data = files[0].read()
+
+    import tempfile, os, subprocess
+    with tempfile.TemporaryDirectory() as tmpdir:
+        if ext == "dwg":
+            if not ODA_CONVERTER:
+                return jsonify(error="DWG support requires ODA File Converter. Download it free from https://www.opendesign.com/guestfiles/oda_file_converter and ensure it is on your PATH. Or convert your DWG to DXF first."), 400
+
+            in_dir = os.path.join(tmpdir, "in")
+            out_dir = os.path.join(tmpdir, "out")
+            os.makedirs(in_dir)
+            os.makedirs(out_dir)
+            dwg_path = os.path.join(in_dir, "input.dwg")
+            with open(dwg_path, "wb") as f:
+                f.write(file_data)
+
+            try:
+                subprocess.run(
+                    [ODA_CONVERTER, in_dir, out_dir, "ACAD2018", "DXF", "0", "1", "*.DWG"],
+                    check=True, capture_output=True, timeout=60,
+                )
+            except subprocess.CalledProcessError as e:
+                return jsonify(error=f"DWG to DXF conversion failed: {e.stderr.decode(errors='replace')[:200]}"), 400
+            except subprocess.TimeoutExpired:
+                return jsonify(error="DWG conversion timed out."), 400
+
+            dxf_path = os.path.join(out_dir, "input.dxf")
+            if not os.path.exists(dxf_path):
+                return jsonify(error="DWG to DXF conversion produced no output."), 400
+            doc = ezdxf.readfile(dxf_path)
+        elif ext == "dxf":
+            dxf_path = os.path.join(tmpdir, "input.dxf")
+            with open(dxf_path, "wb") as f:
+                f.write(file_data)
+            try:
+                doc = ezdxf.readfile(dxf_path)
+            except Exception as e:
+                return jsonify(error=f"Invalid DXF file: {str(e)[:200]}"), 400
+        else:
+            return jsonify(error="Upload a .dxf or .dwg file."), 400
+
+        msp = doc.modelspace()
+        fig = plt.figure()
+        ax = fig.add_axes([0, 0, 1, 1])
+        ax.set_aspect("equal")
+        ax.set_axis_off()
+
+        try:
+            ctx = RenderContext(doc)
+            backend = MatplotlibBackend(ax)
+            Frontend(ctx, backend).draw_layout(msp, finalize=True)
+        except Exception as e:
+            plt.close(fig)
+            return jsonify(error=f"Rendering failed: {str(e)[:200]}"), 400
+
+        buf = io.BytesIO()
+        base_name = filename.rsplit(".", 1)[0]
+        if target == "pdf":
+            fig.savefig(buf, format="pdf", bbox_inches="tight", pad_inches=0.2)
+            plt.close(fig)
+            buf.seek(0)
+            return send_file(buf, mimetype="application/pdf",
+                             as_attachment=True, download_name=base_name + ".pdf")
+        else:
+            fig.savefig(buf, format="png", dpi=dpi, bbox_inches="tight", pad_inches=0.2)
+            plt.close(fig)
+            buf.seek(0)
+            return send_file(buf, mimetype="image/png",
+                             as_attachment=True, download_name=base_name + ".png")
@@ -217,6 +217,31 @@ def favicon_page():
        button_text="Generate Favicon")


+@bp.route("/animated")
+def animated_page():
+    return render_template("upload_tool.html",
+        title="Animated WebP / GIF",
+        description="Convert animated GIF to WebP, or animated WebP to GIF (preserves timing)",
+        endpoint="/image/animated",
+        accept=".gif,.webp",
+        multiple=False,
+        options=[
+            {"type": "select", "name": "target", "label": "Output Format",
+             "choices": [
+                 {"value": "webp", "label": "Animated WebP"},
+                 {"value": "gif", "label": "GIF"},
+             ]},
+            {"type": "range", "name": "quality", "label": "WebP Quality",
+             "default": 80, "min": 10, "max": 100, "step": 5, "suffix": "%",
+             "depends_on": {"target": "webp"}},
+            {"type": "number", "name": "fps", "label": "Override FPS (0 = keep original)",
+             "default": 0, "min": 0, "max": 60},
+            {"type": "checkbox", "name": "lossless", "label": "Lossless",
+             "check_label": "Lossless WebP (larger file)", "default": False,
+             "depends_on": {"target": "webp"}},
+        ])
+
+
@bp.route("/ocr")
 def ocr_page():
    return render_template("upload_tool.html",
@@ -545,6 +570,83 @@ def favicon():
                     as_attachment=True, download_name="favicon.ico")


+@bp.route("/animated", methods=["POST"])
+def animated():
+    files = request.files.getlist("files")
+    if not files or not files[0].filename:
+        return jsonify(error="No file uploaded."), 400
+
+    target = request.form.get("target", "webp").lower()
+    quality = int(request.form.get("quality", 80))
+    fps_override = int(request.form.get("fps", 0))
+    lossless = request.form.get("lossless") == "on"
+
+    try:
+        src = Image.open(io.BytesIO(files[0].read()))
+    except Exception as e:
+        return jsonify(error=f"Could not read image: {e}"), 400
+
+    frames = []
+    durations = []
+    try:
+        while True:
+            frame = src.copy()
+            if frame.mode == "P":
+                frame = frame.convert("RGBA")
+            frames.append(frame)
+            durations.append(src.info.get("duration", 100))
+            src.seek(src.tell() + 1)
+    except EOFError:
+        pass
+
+    if not frames:
+        return jsonify(error="No frames found in image."), 400
+
+    if fps_override > 0:
+        per_frame_ms = int(1000 / fps_override)
+        durations = [per_frame_ms] * len(frames)
+
+    loop = src.info.get("loop", 0)
+    buf = io.BytesIO()
+    base = files[0].filename.rsplit(".", 1)[0]
+
+    if target == "webp":
+        save_kwargs = {
+            "format": "WEBP",
+            "save_all": True,
+            "append_images": frames[1:],
+            "duration": durations,
+            "loop": loop,
+            "lossless": lossless,
+        }
+        if not lossless:
+            save_kwargs["quality"] = quality
+        frames[0].save(buf, **save_kwargs)
+        buf.seek(0)
+        return send_file(buf, mimetype="image/webp",
+                         as_attachment=True, download_name=base + ".webp")
+
+    # GIF output — GIF palette is 256 colors
+    gif_frames = [f.convert("RGBA") for f in frames]
+    disposal_frames = []
+    for f in gif_frames:
+        if f.mode == "RGBA":
+            bg = Image.new("RGBA", f.size, (255, 255, 255, 255))
+            bg.paste(f, mask=f.split()[3])
+            disposal_frames.append(bg.convert("P", palette=Image.ADAPTIVE, colors=256))
+        else:
+            disposal_frames.append(f.convert("P", palette=Image.ADAPTIVE, colors=256))
+
+    disposal_frames[0].save(
+        buf, format="GIF", save_all=True,
+        append_images=disposal_frames[1:],
+        duration=durations, loop=loop, optimize=True, disposal=2,
+    )
+    buf.seek(0)
+    return send_file(buf, mimetype="image/gif",
+                     as_attachment=True, download_name=base + ".gif")
+
+
@bp.route("/ocr", methods=["POST"])
 def ocr():
    if not HAS_TESSERACT: