Spaces:

rmayormartins
/

ocr-img2txt

Sleeping

ocr-img2txt / app.py

Adicionando app.py2a

30adacb 6 months ago

1.06 kB

	import gradio as gr
	import pytesseract
	from PIL import Image
	import easyocr

	# Shared EasyOCR reader, built once at import time for the 'en', 'pt' and
	# 'es' language codes, with GPU use switched off (gpu=False).
	easyocr_reader = easyocr.Reader(
	    ['en', 'pt', 'es'],
	    gpu=False,
	)

	# Tesseract backend
	def tesseract_ocr(image):
	    """Return the text pytesseract extracts from ``image``.

	    Args:
	        image: The image to read; passed unchanged to
	            ``pytesseract.image_to_string``.

	    Returns:
	        Whatever ``pytesseract.image_to_string`` returns for the image.
	    """
	    extracted = pytesseract.image_to_string(image)
	    return extracted

	# EasyOCR backend
	def easyocr_ocr(image):
	    """Return the text EasyOCR finds in ``image`` as a single string.

	    Args:
	        image: The image to read; passed unchanged to the shared
	            ``easyocr_reader``.

	    Returns:
	        The items returned by ``readtext(image, detail=0)`` joined with
	        single spaces.
	    """
	    fragments = easyocr_reader.readtext(image, detail=0)
	    return ' '.join(fragments)

	# Dispatch an image to the OCR engine selected in the UI.
	def extract_text_from_image(ocr_engine, image):
	    """Run the selected OCR engine on an image and return the extracted text.

	    Args:
	        ocr_engine: Name of the engine to use, either "Tesseract" or
	            "EasyOCR". Any other value (including ``None``) is rejected.
	        image: The image to read, forwarded unchanged to the selected
	            engine's helper. ``None`` is treated as "no image supplied".

	    Returns:
	        The recognized text, "Invalid OCR selection." when the engine name
	        is not recognized, or "No image provided." when ``image`` is
	        ``None``.
	    """
	    # Validate the engine first so an unknown engine keeps producing the
	    # same message it always did, whatever the image argument is.
	    if ocr_engine not in ("Tesseract", "EasyOCR"):
	        return "Invalid OCR selection."

	    # The image may be None (e.g. the form was submitted without an
	    # upload); report that instead of letting the OCR backend raise.
	    if image is None:
	        return "No image provided."

	    if ocr_engine == "Tesseract":
	        return tesseract_ocr(image)
	    return easyocr_ocr(image)


	# Gradio UI: an OCR-engine dropdown and an image input feed
	# extract_text_from_image; the result is shown as text.
	iface = gr.Interface(
	    fn=extract_text_from_image,
	    inputs=[
	        gr.Dropdown(
	            choices=["Tesseract", "EasyOCR"],
	            label="Select the OCR Engine",
	        ),
	        "image",
	    ],
	    outputs="text",
	    title="OCR Img2txt",
	    description="This application uses Optical Character Recognition (OCR) technology to extract text from images. Choose between Tesseract OCR and EasyOCR engine to process images containing printed text, converting it into editable and searchable text.",
	)

	# Start the app with debug=True.
	iface.launch(debug=True)