Spaces:

sitammeur
/

TextSnap

Running on Zero

App Files Files Community

TextSnap / src /app /task.py

sitammeur

Update src/app/task.py

53409f7 verified 4 months ago

raw

history blame

1.85 kB

	# Import necessary libraries
	import sys
	import copy
	from typing import Tuple
	from PIL import Image
	import gradio as gr
	import supervision as sv

	# Local imports
	from src.utils.processing import clean_text, draw_ocr_bboxes
	from src.app.model import run_example
	from src.logger import logging
	from src.exception import CustomExceptionHandling


	def ocr_task(image: Image.Image) -> Tuple[Image.Image, str]:
	    """
	    Perform OCR (Optical Character Recognition) on the given image.

	    Two passes are made through ``run_example``: one with the ``<OCR>``
	    prompt, whose result is cleaned with ``clean_text``, and one with the
	    ``<OCR_WITH_REGION>`` prompt, whose result is converted to detections
	    and handed to ``draw_ocr_bboxes``.

	    Args:
	        image (PIL.Image.Image): The input image to perform OCR on.

	    Returns:
	        tuple: A tuple containing the output image with OCR bounding boxes
	            drawn and the cleaned OCR text.

	    Raises:
	        CustomExceptionHandling: Wraps any exception raised while running
	            the model, cleaning the text, or drawing the boxes; the
	            original exception is chained as the cause.
	    """
	    try:
	        # Task prompts
	        ocr_prompt = "<OCR>"
	        ocr_with_region_prompt = "<OCR_WITH_REGION>"

	        # Get OCR text; the result is keyed by the prompt that produced it
	        ocr_results = run_example(ocr_prompt, image)
	        cleaned_text = clean_text(ocr_results[ocr_prompt])

	        # Log the successful extraction and cleaning of OCR text
	        logging.info("OCR text extracted and cleaned successfully.")

	        # Get OCR with region
	        ocr_with_region_results = run_example(ocr_with_region_prompt, image)
	        detections = sv.Detections.from_lmm(
	            lmm=sv.LMM.FLORENCE_2,
	            result=ocr_with_region_results,
	            resolution_wh=image.size,
	        )

	        # Draw on a deep copy rather than on `image` itself, so the caller's
	        # image stays untouched even if draw_ocr_bboxes annotates in place.
	        # NOTE(review): whether draw_ocr_bboxes mutates its argument is not
	        # visible from this file; passing the copy is safe either way.
	        image_copy = copy.deepcopy(image)
	        output_image = draw_ocr_bboxes(image_copy, detections)

	        # Log the successful drawing of OCR bounding boxes
	        logging.info("OCR bounding boxes drawn successfully.")

	        # Return the output image and cleaned OCR text
	        return output_image, cleaned_text

	    # Handle exceptions that may occur during the process
	    except Exception as e:
	        # Custom exception handling
	        raise CustomExceptionHandling(e, sys) from e