import tempfile
import subprocess

def capture_screen():
    """Interactively capture a screen region into a temporary PNG file.

    Runs the ``screencapture`` command-line tool with ``-i -s`` and asks it
    to write into a freshly reserved ``screenshot_*.png`` temporary file.

    Returns:
        The path of the PNG file when the tool succeeded and wrote image
        data. The file is NOT deleted automatically; the caller owns it.
        ``None`` when the tool could not be started, exited with a non-zero
        status, or left the file empty. In those cases the temporary file
        is removed again so nothing is leaked.
    """
    import os  # local import so this block does not depend on import order

    # Only reserve a unique path here. The handle is closed before the
    # external tool writes to the file, so we never hold it open meanwhile.
    with tempfile.NamedTemporaryFile(prefix="screenshot_", suffix=".png", delete=False) as tmp:
        screenshot_file_path = tmp.name

    try:
        subprocess.run(["screencapture", "-i", "-s", screenshot_file_path], check=True)
        # The file was pre-created empty above; if it is still empty the tool
        # produced no image (presumably the selection was cancelled).
        if os.path.getsize(screenshot_file_path) > 0:
            return screenshot_file_path
        print("Error capturing screen: no image was captured")
    except (subprocess.CalledProcessError, OSError) as e:
        # OSError covers a missing/non-executable `screencapture` binary.
        print(f"Error capturing screen: {e}")

    # Failure path: best-effort removal of the placeholder file.
    try:
        os.unlink(screenshot_file_path)
    except OSError:
        pass
    return None

from PIL import Image
from pytesseract import image_to_string
import os

def recognize_text(screenshot_file_path, lang="eng"):
    """Run Tesseract OCR on a screenshot file and return the recognized text.

    The screenshot file is consumed: it is deleted once recognition has been
    attempted, whether OCR succeeded or raised.

    Args:
        screenshot_file_path: Path of the image to read. A falsy value or a
            path that is not an existing file yields ``""``.
        lang: Language code forwarded to ``image_to_string``.

    Returns:
        The recognized text with surrounding whitespace stripped, or ``""``
        when there was no file to process.

    Raises:
        Whatever ``Image.open`` or ``image_to_string`` raise; the file is
        still removed in that case.
    """
    if not screenshot_file_path or not os.path.isfile(screenshot_file_path):
        return ""

    try:
        # The context manager closes the underlying file handle as soon as
        # OCR is done instead of leaving it to garbage collection.
        with Image.open(screenshot_file_path) as screenshot:
            recognized_text = image_to_string(screenshot, lang=lang, config='--psm 6')
    finally:
        # Always discard the screenshot so a failed OCR run does not leak it.
        os.unlink(screenshot_file_path)

    return recognized_text.strip()

from IPython.display import HTML
import warnings

# Silence every warning category for the rest of the process.
warnings.simplefilter("ignore")

# Build an embedded YouTube player for the Tesseract OCR demonstration video.
# NOTE(review): as a bare expression the object is only displayed when this is
# the last statement of a notebook cell; run as a script the value is discarded.
HTML("""<iframe width="786" height="491" src="https://www.youtube.com/embed/A7vLKHKeFYQ" title="tesseract ocr demonstration" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share" allowfullscreen></iframe>""")

# Best-effort copy of a prediction to the clipboard.
# NOTE(review): neither `clipboard` nor `pred` is defined in the visible
# source, so as written this attempt fails and is ignored — confirm whether
# this fragment is still needed.
try:
    clipboard.copy(pred)
except Exception:
    # Deliberately ignored, but no longer a bare `except:` so that
    # KeyboardInterrupt and SystemExit are not swallowed as well.
    pass

from PIL import Image
from pix2tex.cli import LatexOCR
import os
import pyperclip

# Single module-level LatexOCR instance, created at import time and reused by
# every recognize_latex() call.
latex_ocr_model = LatexOCR()


def recognize_latex(screenshot_file_path):
    """Run the LaTeX OCR model on a screenshot and return the LaTeX source.

    The clipboard content present before the model call is put back after
    it, even when the model raises.
    NOTE(review): presumably the model call itself overwrites the clipboard,
    which is why it is saved and restored here — confirm.

    Args:
        screenshot_file_path: Path of the image to read. A falsy value or a
            path that is not an existing file yields ``""`` without touching
            the clipboard.

    Returns:
        The model output when it is truthy, otherwise ``""``.

    Raises:
        Whatever ``Image.open`` or the model raise; the clipboard is still
        restored in that case.
    """
    if not screenshot_file_path or not os.path.isfile(screenshot_file_path):
        return ""

    # Save the current clipboard content so it can be restored afterwards.
    original_clipboard_content = pyperclip.paste()
    try:
        # Close the image file handle deterministically once the model is done.
        with Image.open(screenshot_file_path) as screenshot:
            recognized_latex = latex_ocr_model(screenshot, resize=True)
    finally:
        # Restore the original clipboard content on success and on failure.
        pyperclip.copy(original_clipboard_content)

    return recognized_latex or ""

# Embedded YouTube player for the LaTeX OCR model demonstration video.
# The iframe title previously repeated the Tesseract demo's title.
HTML("""<iframe width="786" height="491" src="https://www.youtube.com/embed/2dQBsZzLu_k?si=pNJTGs_50YgQSwzy" title="latex ocr model demonstration" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share" allowfullscreen></iframe>""")

$$
\nabla\times\vec{\mathrm{B}}-\frac{1}{C}\frac{\delta\vec{\mathrm{E}}}{\delta t}=4\pi\rho
$$

#main_app.py

import tkinter as tk
from tkinter import ttk
import pyperclip

from ocr_engine import recognize_text
from latex_engine import recognize_latex
from capture_tools import capture_screen

class GUI:
    """Tkinter window that captures a screen region and appends OCR output to the clipboard.

    Two recognition modes are offered: plain text and LaTeX. Each successful
    recognition is appended to whatever the clipboard already holds, and a
    status line reports the outcome of the last action.
    """

    def __init__(self):
        """Create the main window, its buttons and the status line."""
        self.root = tk.Tk()
        self.root.title("Screen Capture OCR")
        self.root.geometry("450x250")

        main_frame = ttk.Frame(self.root)
        main_frame.pack(pady=10)

        ttk.Label(main_frame, text="Choose recognition mode:").grid(row=0, column=0, sticky="W", padx=(20, 0), columnspan=2)

        ttk.Button(main_frame, text="Text OCR", command=self.capture_and_copy_text).grid(row=1, column=0, padx=(20, 0), pady=5)
        ttk.Button(main_frame, text="LaTeX OCR", command=self.capture_and_copy_latex).grid(row=1, column=1, padx=(10, 0), pady=5)

        ttk.Button(main_frame, text="Clear Clipboard", command=self.reset_clipboard).grid(row=3, column=0, padx=(20, 0), pady=5, columnspan=2)

        # Backing variable of the status label; updated after every action.
        self.status_text = tk.StringVar()
        ttk.Label(main_frame, textvariable=self.status_text).grid(row=4, column=0, sticky="W", padx=(20, 0), pady=5, columnspan=2)

        # Pressing Return triggers the plain-text capture.
        self.root.bind("<Return>", lambda event: self.capture_and_copy_text())

    def copy_content(self, content, current_clipboard, is_latex=False):
        """Append ``content`` to ``current_clipboard`` and store the result in the clipboard.

        Args:
            content: Newly recognized text.
            current_clipboard: Text the clipboard held before; when truthy the
                new content is appended after a blank line.
            is_latex: When true, ``content`` is wrapped in ``$$`` delimiters.
        """
        if is_latex:
            content = f"$$\n{content}\n$$"

        if current_clipboard:
            new_clipboard = current_clipboard + "\n\n" + content
        else:
            new_clipboard = content

        pyperclip.copy(new_clipboard)

    @staticmethod
    def _discard_file(path):
        """Best-effort removal of a screenshot temp file."""
        import os  # local import: the module's own import list does not include os

        try:
            os.remove(path)
        except OSError:
            # The recognizer may already have removed the file, or it cannot
            # be removed; cleanup must never break the user-visible action.
            pass

    def _process_screenshot(self, screenshot_file_path, recognizer, is_latex, success_message):
        """Recognize one captured screenshot, append the result and report the outcome.

        Args:
            screenshot_file_path: Path returned by the capture step; falsy
                when the capture failed.
            recognizer: Callable taking the path and returning recognized text.
            is_latex: Forwarded to ``copy_content``.
            success_message: Status text shown after a successful append.

        Raises:
            Re-raises any exception from ``recognizer`` after updating the
            status line, so the failure is still reported by Tk.
        """
        if not screenshot_file_path:
            self.status_text.set("Capture cancelled or failed.")
            return

        try:
            recognized_content = recognizer(screenshot_file_path)
        except Exception as exc:
            self.status_text.set(f"Recognition failed: {exc}")
            raise
        finally:
            # The screenshot is a temp file owned by this GUI; never leave it behind.
            self._discard_file(screenshot_file_path)

        if not recognized_content:
            self.status_text.set("Nothing recognized in the captured area.")
            return

        self.copy_content(recognized_content, pyperclip.paste(), is_latex=is_latex)
        self.status_text.set(success_message)

    def capture_and_copy_text(self):
        """Capture a screen region, run text OCR and append the text to the clipboard."""
        self._process_screenshot(
            capture_screen(),
            recognize_text,
            False,
            "Text recognized and appended to clipboard!",
        )

    def capture_and_copy_latex(self):
        """Capture a screen region, run LaTeX OCR and append the formula to the clipboard."""
        self._process_screenshot(
            capture_screen(),
            recognize_latex,
            True,
            "LaTeX recognized and appended to clipboard!",
        )

    def reset_clipboard(self):
        """Replace the clipboard content with an empty string."""
        pyperclip.copy('')
        self.status_text.set("Clipboard has been reset.")

    def run(self):
        """Enter the Tk main loop; returns when the window is closed."""
        self.root.mainloop()

def main():
    """Build the GUI window and hand control to its event loop."""
    GUI().run()

if __name__ == "__main__":
    main()

# Embedded YouTube player for the main app demonstration video.
# The iframe title previously repeated the Tesseract demo's title.
HTML("""<iframe width="786" height="491" src="https://www.youtube.com/embed/1dBCizYflqw?si=Xms4aATEKkA1lVcM" title="main app demonstration" frameborder="0" allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share" allowfullscreen></iframe>""")

macOS Screenshot - OCR & LaTeX Model

Brief Overview of Features

Screenshot Capture

OCR Engine: Pytesseract

LaTeX Engine: Modified Pix2tex

Clipboard Management

User Interface

Motivation

Basic Copy-Paste Example

OCR Text Extraction Issues - Example #1

OCR Text Extraction Issues - Example #2

Capture Tools (capture_tools.py)

Dependencies and Function: capture_screen()

Tempfile Module

Subprocess Module

OCR Engine (ocr_engine.py)

Dependencies and Function: recognize_text(screenshot_file_path, lang="eng")

Tesseract OCR Demonstration

OCR Models and Challenges in Recognizing Scientific Symbols and Technical Expressions

Critical Causes of OCR Inaccuracy

LaTeX Engine (latex_engine.py)

Dependencies and Function: recognize_latex(screenshot_file_path)

LatexOCR and pix2tex

Other Dependencies and Functions

LaTeX OCR Model Demonstration

Main App (main_app.py)

Dependencies

Class: GUI

Function: main

Entry Point

Main App Demo