toshiba_2.O / app.py
neerajkalyank's picture
Update app.py
3469319 verified
raw
history blame
573 Bytes
import tempfile
from pathlib import Path

import camelot
import gradio as gr
import pandas as pd
def extract_tables(pdf_file):
    """Extract every table from an uploaded PDF into one Excel workbook.

    All tables camelot detects across all pages are stacked vertically, in
    the order camelot returns them, and written to a single sheet without
    the DataFrame index.

    Args:
        pdf_file: The upload handed over by the ``gr.File`` input. Either an
            object exposing the file path as ``.name`` or a plain path
            string is accepted.

    Returns:
        Path (as ``str``) to the generated ``output.xlsx`` file.

    Raises:
        gr.Error: If no file was uploaded, or if camelot finds no tables in
            the PDF.
    """
    if pdf_file is None:
        # Submitting the form without a file passes None; fail with a
        # readable message instead of an AttributeError on ``.name``.
        raise gr.Error("Please upload a PDF file first.")

    # Tolerate both file-like wrappers (``.name``) and plain path strings.
    pdf_path = getattr(pdf_file, "name", pdf_file)
    tables = camelot.read_pdf(pdf_path, pages="all")

    frames = [table.df for table in tables]
    if not frames:
        # pd.concat raises "No objects to concatenate" on an empty list.
        raise gr.Error("No tables were found in the uploaded PDF.")

    df = pd.concat(frames, ignore_index=True)

    # Write into a fresh per-request directory so concurrent requests do not
    # overwrite each other's result, while keeping the "output.xlsx" name.
    output_path = Path(tempfile.mkdtemp()) / "output.xlsx"
    df.to_excel(output_path, index=False)
    return str(output_path)
# Gradio front end: a single PDF upload in, a single downloadable Excel
# file out, with extract_tables doing the conversion.
interface = gr.Interface(
    title="PDF Table Extractor",
    description="Extract tables from PDF and output as Excel file.",
    fn=extract_tables,
    inputs=gr.File(label="Upload PDF"),
    outputs=gr.File(label="Download Excel"),
)

# Launch the app only when this file is executed as a script, so importing
# the module does not start it.
if __name__ == "__main__":
    interface.launch()