Spaces:

neerajkalyank
/

toshiba_2.O

Sleeping

neerajkalyank committed on Nov 12

Commit

48f229e

•

1 Parent(s): ac741f6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,14 +1,21 @@
 import pdfplumber
 import pandas as pd
 from io import BytesIO
 import re
 import gradio as gr
 def extract_data_from_pdf(pdf_file):
     data = []
     po_number = None
-    with pdfplumber.open(pdf_file) as pdf:
         for page in pdf.pages:
             text = page.extract_text()

 import pdfplumber
 import pandas as pd
 from io import BytesIO
+import tempfile
 import re
 import gradio as gr
 def extract_data_from_pdf(pdf_file):
     data = []
     po_number = None
+    # Save the uploaded file temporarily so pdfplumber can open it
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as temp_pdf:
+        temp_pdf.write(pdf_file.read())  # Write the uploaded file content to a temporary file
+        temp_pdf_path = temp_pdf.name  # Get the file path
+    # Now open the temporary file with pdfplumber
+    with pdfplumber.open(temp_pdf_path) as pdf:
         for page in pdf.pages:
             text = page.extract_text()