0% found this document useful (0 votes)

2 views · 4 pages

Image To Doc Working

This document is a Python script for a Batch Image-to-DOCX Converter using Tkinter for the GUI. It allows users to select multiple image files, enhances them, extracts text using OCR, optionally formats the text with GPT, and saves the results in DOCX format. The program checks for expiration and handles errors during the conversion process.

Uploaded by

koduwos2013

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

2 views · 4 pages

Image To Doc Working

Uploaded by

koduwos2013

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 4

import tkinter as tk

from tkinter import filedialog, messagebox

import os
import shutil
import easyocr
from docx import Document
from PIL import Image, ImageFilter
import openai
import datetime
import sys

# Set expiration date

# The program refuses to start on or after this date (local, naive clock time).
EXPIRATION_DATE = datetime.datetime(2025, 12, 31)  # YYYY, MM, DD
CURRENT_DATE = datetime.datetime.now()

# Check if the program has expired
if CURRENT_DATE >= EXPIRATION_DATE:
    # The main window has not been built yet at this point. Create an explicit,
    # hidden root so the dialog has a parent; some tkinter versions otherwise
    # pop up an empty default root window next to the message box.
    _expired_root = tk.Tk()
    _expired_root.withdraw()
    messagebox.showerror(
        "Program Expired",
        "This program has expired and is no longer operational.",
    )
    _expired_root.destroy()
    sys.exit()  # Stop execution

def enhance_image(image_path):
    """Return a sharpened RGB copy of the image stored at *image_path*.

    The file is opened with Pillow, converted to RGB and passed through
    Pillow's ``SHARPEN`` filter. The returned image is an in-memory copy; the
    source file is closed before this function returns.
    """
    # Close the source file explicitly: the caller later moves the original
    # image, which can fail on some platforms while a handle is still open.
    with Image.open(image_path) as source:
        rgb_image = source.convert("RGB")
    return rgb_image.filter(ImageFilter.SHARPEN)

# Lazily created EasyOCR reader shared by every extract_text() call.
_OCR_READER = None


def extract_text(image_path):
    """Extract text from the image at *image_path* using EasyOCR.

    Returns the recognised text fragments joined with newlines (an empty
    string when nothing is recognised).
    """
    global _OCR_READER
    # Build the reader only once: constructing it per image repeats the same
    # setup work for every file in a batch.
    if _OCR_READER is None:
        _OCR_READER = easyocr.Reader(['en'], gpu=True, recog_network='latin_g2')
    # detail=0 asks EasyOCR for plain text results only.
    text_list = _OCR_READER.readtext(image_path, detail=0)
    return "\n".join(text_list)

def format_text_with_gpt(raw_text, api_key):
    """Tidy raw OCR text with GPT via the OpenAI API, when an API key is given.

    Returns *raw_text* unchanged when no API key is supplied, when there is no
    text to format, or when the API call fails (in which case a warning dialog
    is shown). Otherwise returns the model's reply with surrounding whitespace
    stripped.
    """
    # Nothing to do without a key; and sending empty OCR output would only
    # make the model invent a reply that then ends up in the document.
    if not api_key or not raw_text or not raw_text.strip():
        return raw_text

    try:
        openai.api_key = api_key
        system_prompt = (
            "You are a helpful assistant that formats raw OCR text into a cleaner, "
            "more human-readable style. Preserve essential content, but fix spacing, "
            "punctuation, and line breaks as appropriate."
        )
        user_prompt = f"Please format the following text:\n\n{raw_text}\n\n"

        # NOTE(review): openai.ChatCompletion is the pre-1.0 interface of the
        # openai package; confirm the installed version still provides it.
        response = openai.ChatCompletion.create(
            model="gpt-3.5-turbo",
            messages=[
                {"role": "system", "content": system_prompt},
                {"role": "user", "content": user_prompt},
            ],
            temperature=0.2,
            # The reply is capped at 1000 tokens, so long pages may come back cut off.
            max_tokens=1000,
        )
        formatted_text = response["choices"][0]["message"]["content"].strip()
        return formatted_text
    except Exception as e:
        # Best effort: any failure falls back to the unformatted OCR text.
        messagebox.showwarning("GPT Formatting Warning", f"GPT formatting failed:\n{str(e)}")
        return raw_text

def save_to_docx(text, output_path):
    """Write *text* into a new DOCX file at *output_path* using python-docx."""
    document = Document()
    # The whole text is added as one paragraph.
    document.add_paragraph(text)
    document.save(output_path)

def convert_single_image(image_path, api_key=None):
    """Convert a single image file to .docx and return a status string.

    Steps, all relative to the directory that contains the image:
      1) Enhance the image and save it to "enhanced/<name>_enhanced.jpg"
      2) OCR the enhanced image
      3) Optionally format the text with GPT (only when *api_key* is given)
      4) Save the text to "converted/<name>.docx"
      5) Move the original image to "finished/"

    Never raises for conversion failures: any exception is caught and
    reported in the returned status string instead.
    """
    try:
        if not os.path.isfile(image_path):
            return f"ERROR: File not found: {image_path}"

        # Base directory of the image
        directory = os.path.dirname(image_path)

        # Create necessary folders next to the image
        enhanced_folder = os.path.join(directory, "enhanced")
        converted_folder = os.path.join(directory, "converted")
        finished_folder = os.path.join(directory, "finished")
        for folder in (enhanced_folder, converted_folder, finished_folder):
            os.makedirs(folder, exist_ok=True)

        # Extract base filename without extension
        filename = os.path.basename(image_path)
        name = os.path.splitext(filename)[0]

        # 1) Enhance the image
        enhanced = enhance_image(image_path)
        enhanced_path = os.path.join(enhanced_folder, f"{name}_enhanced.jpg")
        enhanced.save(enhanced_path)

        # 2) Extract OCR text from the enhanced image
        raw_text = extract_text(enhanced_path)

        # 3) Format text using GPT if API key is provided
        final_text = format_text_with_gpt(raw_text, api_key)

        # 4) Save the formatted text to a DOCX file in the converted folder
        output_path = os.path.join(converted_folder, f"{name}.docx")
        save_to_docx(final_text, output_path)

        # 5) Move the original image to the "finished" folder
        finished_path = os.path.join(finished_folder, filename)
        shutil.move(image_path, finished_path)

        return (
            f"✓ Success: {filename} -> Enhanced: "
            f"{os.path.basename(enhanced_path)}, DOCX: {os.path.basename(output_path)}, "
            "Moved to 'finished'."
        )
    except Exception as e:
        # Batch boundary: one bad file must not abort the remaining files.
        return f"✗ Error with {os.path.basename(image_path)}: {str(e)}"

def convert_multiple_images(file_list, api_key=None):
    """Convert each selected image in turn and show all outcomes in one dialog."""
    # One status line per file, in the order the files were given.
    statuses = [convert_single_image(path, api_key) for path in file_list]
    messagebox.showinfo("Conversion Results", "\n".join(statuses))

# --------------------- GUI ----------------------

def browse_files():
    """Let the user pick one or more image files and list them in the text box.

    The chosen paths replace the current contents of ``text_files``, one path
    per line. When the dialog returns nothing, the existing list is left
    untouched.
    """
    filepaths = filedialog.askopenfilenames(
        title="Select One or More Document Images",
        filetypes=[
            ("Image Files", "*.jpg *.jpeg *.png *.bmp *.tiff *.webp"),
            ("All Files", "*.*"),
        ],
    )
    if filepaths:
        text_files.delete("1.0", tk.END)
        for fp in filepaths:
            text_files.insert(tk.END, fp + "\n")

def convert_action():
    """Collect the listed file paths and the optional API key, then convert.

    Reads one path per non-blank line from ``text_files``. Shows an error
    dialog and returns without converting when no path is listed.
    """
    content = text_files.get("1.0", tk.END)

    # Split lines into a list of file paths, ignoring blank lines. A single
    # emptiness check on this list covers both "nothing typed" and
    # "only whitespace", so no second check is needed.
    file_list = [line.strip() for line in content.splitlines() if line.strip()]
    if not file_list:
        messagebox.showerror("Error", "No files selected.")
        return

    api_key = entry_api.get().strip()
    convert_multiple_images(file_list, api_key)

# MAIN WINDOW
# Builds the application window at module level. Widgets are packed top to
# bottom in the order they appear below, so statement order defines the layout.
root = tk.Tk()
root.title("Batch Image-to-DOCX Converter")
root.geometry("700x400")
# Fixed-size window: resizing is disabled in both directions.
root.resizable(False, False)

# Label for instructions

lbl_info = tk.Label(root, text="Select your image files (multiple):",
font=("Arial", 12))
lbl_info.pack(pady=(10, 5))

# "Browse" button: opens the file dialog via browse_files()
btn_browse = tk.Button(root, text="Browse Files", command=browse_files,
font=("Arial", 10))
btn_browse.pack()

# A text widget to display chosen file paths, inside a frame together with
# its vertical scrollbar

frame_files = tk.Frame(root)
frame_files.pack(padx=10, pady=10, fill="both", expand=True)

scroll_y = tk.Scrollbar(frame_files, orient=tk.VERTICAL)

# text_files is the module-level widget that browse_files() fills and
# convert_action() reads; wrap="none" disables line wrapping in the widget.
text_files = tk.Text(frame_files, wrap="none", height=8, width=80,
yscrollcommand=scroll_y.set)
# Wire the scrollbar and the text widget to each other.
scroll_y.config(command=text_files.yview)
scroll_y.pack(side=tk.RIGHT, fill=tk.Y)
text_files.pack(side=tk.LEFT, fill=tk.BOTH, expand=True)

# Optional OpenAI API key input
lbl_api = tk.Label(root, text="OpenAI API Key (optional):", font=("Arial", 12))

lbl_api.pack(pady=(10, 5))

# entry_api is read by convert_action(); show='*' displays asterisks instead
# of the typed characters.
entry_api = tk.Entry(root, width=60, font=("Arial", 10), show='*')

entry_api.pack()

# "Convert" button: starts the batch conversion via convert_action()
btn_convert = tk.Button(root, text="Convert All to DOCX", command=convert_action,

font=("Arial", 12), bg="navy", fg="white")
btn_convert.pack(pady=20)

# Enter the Tk event loop.
root.mainloop()

TSG - RS 40 How To Restore A Backup in RobotStudio 4.0 or QuickTeach 5.5
No ratings yet
TSG - RS 40 How To Restore A Backup in RobotStudio 4.0 or QuickTeach 5.5
8 pages
Practical No3
No ratings yet
Practical No3
8 pages
25 Awesome Python Scripts
No ratings yet
25 Awesome Python Scripts
26 pages
Flask Text-to-Image App
No ratings yet
Flask Text-to-Image App
5 pages
Department of Computer Science & Engineering ST Joseph Engineering College, Mangaluru-575028 2020-2021
No ratings yet
Department of Computer Science & Engineering ST Joseph Engineering College, Mangaluru-575028 2020-2021
11 pages
PDF Data Extraction and Summarization
No ratings yet
PDF Data Extraction and Summarization
9 pages
Findasskasjd
No ratings yet
Findasskasjd
5 pages
Custom AI Image Generator
No ratings yet
Custom AI Image Generator
10 pages
Untitled Document-4
No ratings yet
Untitled Document-4
7 pages
Create - Folder - If - Not - Exists: STR None
No ratings yet
Create - Folder - If - Not - Exists: STR None
5 pages
Democratizing AI
No ratings yet
Democratizing AI
6 pages
Python Code 3
No ratings yet
Python Code 3
17 pages
50 Python Projects Scripts
No ratings yet
50 Python Projects Scripts
65 pages
CV-Mini Project 2
No ratings yet
CV-Mini Project 2
15 pages
BBB
No ratings yet
BBB
8 pages
Math Solver
No ratings yet
Math Solver
2 pages
Notes - by Kishor
No ratings yet
Notes - by Kishor
11 pages
PH Bom-Ali
No ratings yet
PH Bom-Ali
5 pages
Lab4 Image Generation
No ratings yet
Lab4 Image Generation
4 pages
New 5
No ratings yet
New 5
1 page
Updated Code That Flags Faulty Jpgs
No ratings yet
Updated Code That Flags Faulty Jpgs
3 pages
Submission Automata Oussama
No ratings yet
Submission Automata Oussama
2 pages
Ut It Lites All 2 Continue
No ratings yet
Ut It Lites All 2 Continue
7 pages
Python Scripts for Developers
100% (2)
Python Scripts for Developers
65 pages
C) Le Script But Not Complet Partie 1
No ratings yet
C) Le Script But Not Complet Partie 1
13 pages
F) Maybe Is Full Script Complet
No ratings yet
F) Maybe Is Full Script Complet
35 pages
Finxter OpenAI Python API
No ratings yet
Finxter OpenAI Python API
1 page
Lab Manual
No ratings yet
Lab Manual
3 pages
Untitled Document
No ratings yet
Untitled Document
18 pages
D&D Second Brain Setup
No ratings yet
D&D Second Brain Setup
9 pages
How To Analyze A PDF With The Layout-Parser Package. - by Brendan Ferris - Towards Data Science
No ratings yet
How To Analyze A PDF With The Layout-Parser Package. - by Brendan Ferris - Towards Data Science
3 pages
Python Image Processing Pipeline
100% (1)
Python Image Processing Pipeline
31 pages
Open AI GPT 3
No ratings yet
Open AI GPT 3
45 pages
Deep Fake For Free - Ipynb
No ratings yet
Deep Fake For Free - Ipynb
5 pages
Quickstart Openai
No ratings yet
Quickstart Openai
8 pages
Web Scraping & Inverted Index Guide
No ratings yet
Web Scraping & Inverted Index Guide
10 pages
Build App With ChatGPT
100% (1)
Build App With ChatGPT
96 pages
Code Used 240208
No ratings yet
Code Used 240208
9 pages
OCR & Groq: Fast Data Extraction
No ratings yet
OCR & Groq: Fast Data Extraction
17 pages
DeepSeek AI Code Generator
No ratings yet
DeepSeek AI Code Generator
3 pages
45
No ratings yet
45
5 pages
PDF Word
No ratings yet
PDF Word
1 page
Document Classification With LayoutLMv3
No ratings yet
Document Classification With LayoutLMv3
25 pages
Bulk File Rename Python PBL
No ratings yet
Bulk File Rename Python PBL
15 pages
Long Docs
No ratings yet
Long Docs
8 pages
Bypass CAPTCHA with Python OCR
No ratings yet
Bypass CAPTCHA with Python OCR
3 pages
Byte Brawl
No ratings yet
Byte Brawl
11 pages
Extracting Text From Scanned PDF Using Pytesseract & Open CV
No ratings yet
Extracting Text From Scanned PDF Using Pytesseract & Open CV
9 pages
Reference API
No ratings yet
Reference API
2 pages
Python Code 12
No ratings yet
Python Code 12
13 pages
Feature Extraction
No ratings yet
Feature Extraction
9 pages
Agent 301
No ratings yet
Agent 301
5 pages
Trip Planner Example
No ratings yet
Trip Planner Example
7 pages
RAG With Reinforcement Learning
No ratings yet
RAG With Reinforcement Learning
40 pages
Math Agent
No ratings yet
Math Agent
11 pages
DeepSeek - Python Tutorial
No ratings yet
DeepSeek - Python Tutorial
8 pages
Upload
No ratings yet
Upload
6 pages
ML Report
No ratings yet
ML Report
5 pages
Bot Py
No ratings yet
Bot Py
35 pages
Utils
No ratings yet
Utils
4 pages
GeoProbe OW DataServer Guide
No ratings yet
GeoProbe OW DataServer Guide
20 pages
The Context-Switch Overhead Inflicted by Hardware Interrupts (And The Enigma of Do-Nothing Loops)
No ratings yet
The Context-Switch Overhead Inflicted by Hardware Interrupts (And The Enigma of Do-Nothing Loops)
14 pages
Adorage Protocol
No ratings yet
Adorage Protocol
138 pages
OS Unit-5 23-24
No ratings yet
OS Unit-5 23-24
78 pages
University of Mumbai MCQ QUESTION BANK (100 Questions) : Middleware Firmware Package System Software Middleware
No ratings yet
University of Mumbai MCQ QUESTION BANK (100 Questions) : Middleware Firmware Package System Software Middleware
16 pages
OS Practical File
No ratings yet
OS Practical File
47 pages
Kernel Basics for Tech Enthusiasts
100% (1)
Kernel Basics for Tech Enthusiasts
4 pages
IT Infrastructure Guide
No ratings yet
IT Infrastructure Guide
16 pages
Cat Sis
75% (4)
Cat Sis
1 page
The Map Reduce Programming
No ratings yet
The Map Reduce Programming
15 pages
Com - Magma.cheat Logcat
No ratings yet
Com - Magma.cheat Logcat
27 pages
Module 5
No ratings yet
Module 5
69 pages
1 Practical-1
No ratings yet
1 Practical-1
4 pages
Easy Quran Wa Hadees Software Notes
No ratings yet
Easy Quran Wa Hadees Software Notes
6 pages
Red Hat OpenStack-3-Deployment Guide Foreman Technical Preview-En-US
No ratings yet
Red Hat OpenStack-3-Deployment Guide Foreman Technical Preview-En-US
50 pages
USB Driver Upgrade Manual: Revision: 1.000 Date: 3 Aug, 2004
No ratings yet
USB Driver Upgrade Manual: Revision: 1.000 Date: 3 Aug, 2004
14 pages
Power Off Reset Reason Backup
No ratings yet
Power Off Reset Reason Backup
5 pages
The Definitive Guide To Windows Installer
No ratings yet
The Definitive Guide To Windows Installer
41 pages
Euro Truck Simulator 2 Crash Log
No ratings yet
Euro Truck Simulator 2 Crash Log
33 pages
OS MCQs: RAID, Middleware, Scheduling
No ratings yet
OS MCQs: RAID, Middleware, Scheduling
6 pages
Create UEFI Ubuntu USB on Windows
No ratings yet
Create UEFI Ubuntu USB on Windows
7 pages
Windows 2000 PDF
No ratings yet
Windows 2000 PDF
48 pages
Memory Allocation
No ratings yet
Memory Allocation
22 pages
Commnds JES2 MVS
No ratings yet
Commnds JES2 MVS
10 pages
Linux
100% (1)
Linux
76 pages
Object Oriented Programming - SCJ2153: Associate Prof. Dr. Norazah Yusof
No ratings yet
Object Oriented Programming - SCJ2153: Associate Prof. Dr. Norazah Yusof
15 pages
Dixit Abhishek
No ratings yet
Dixit Abhishek
54 pages
Bcom 1st Sem FIT Lab Record Single File Printing
No ratings yet
Bcom 1st Sem FIT Lab Record Single File Printing
35 pages
DRD (Dynamic Root Disk) Release Notes (Release March 2014, 766141-001a) (Edition 2, April 2015)
No ratings yet
DRD (Dynamic Root Disk) Release Notes (Release March 2014, 766141-001a) (Edition 2, April 2015)
25 pages

Image To Doc Working

Uploaded by

Image To Doc Working

Uploaded by

import tkinter as tk

from tkinter import filedialog, messagebox

# Set expiration date

# Check if the program has expired

def format_text_with_gpt(raw_text, api_key):

def save_to_docx(text, output_path):

def convert_single_image(image_path, api_key=None):

# Base directory of the image

# Create necessary folders

for folder in [enhanced_folder, converted_folder, finished_folder]:

# Extract base filename without extension

# 1) Enhance the image

# 2) Extract OCR text from the enhanced image

# 3) Format text using GPT if API key is provided

# 5) Move the original image to the "finished" folder

return f"✓ Success: {filename} -> Enhanced:

def convert_multiple_images(file_list, api_key=None):

# --------------------- GUI ----------------------

# Split lines into a list of file paths

# Label for instructions

# A text widget to display chosen file paths

scroll_y = tk.Scrollbar(frame_files, orient=tk.VERTICAL)

lbl_api = tk.Label(root, text="OpenAI API Key (optional):", font=("Arial", 12))

entry_api = tk.Entry(root, width=60, font=("Arial", 10), show='*')

btn_convert = tk.Button(root, text="Convert All to DOCX", command=convert_action,

You might also like