File size: 623 Bytes
0be1cdb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
import pdfplumber
import pandas as pd

def parse_perfect_metaprint(pdf_path):
    """Collect the purchase-order table rows of a PDF into a DataFrame.

    Every page of the document is visited in order. For each page,
    ``page.extract_table()`` is called; a falsy result (no table) is
    skipped. The first row of each page's table is treated as a header and
    dropped, and the remaining rows are accumulated unchanged.

    Args:
        pdf_path: Location of the PDF, passed straight to
            ``pdfplumber.open``.

    Returns:
        A ``pandas.DataFrame`` whose columns are the eleven fixed
        purchase-order field names below, with one row per extracted
        table row (header rows excluded).
    """
    field_names = [
        "Purchase Order No", "Purchase Order Date", "S. No", "Material No",
        "Material Description", "Qty", "Price", "Delivery Date", "Total Value",
        "Vat%", "Amount Incl. VAT"
    ]
    line_items = []

    with pdfplumber.open(pdf_path) as document:
        for sheet in document.pages:
            extracted = sheet.extract_table()
            if not extracted:
                # Nothing tabular on this page.
                continue
            # Row 0 of each page's table is the header; keep the rest.
            line_items.extend(extracted[1:])

    return pd.DataFrame(line_items, columns=field_names)