NotebookLlamaGroq

Running

yasserrmd committed 23 days ago

Commit

65a0de7

•

1 Parent(s): cb49480

Update extract_text_from_pdf.py

Files changed (1) hide show

extract_text_from_pdf.py CHANGED Viewed

@@ -19,7 +19,7 @@ class PDFTextExtractor:
     A class to handle PDF text extraction and preprocessing for podcast preparation.
     """
     @spaces.GPU
-    def __init__(self, pdf_path, output_path, model_name="meta-llama/Llama-3.2-1B-Instruct"):
         """
         Initialize the PDFTextExtractor with paths and model details.
@@ -28,6 +28,8 @@ class PDFTextExtractor:
             output_path (str): Path to save the cleaned text file.
             model_name (str): Name of the model to use for text processing.
         """
         self.pdf_path = pdf_path
         self.output_path = output_path
         self.max_chars = 100000

     A class to handle PDF text extraction and preprocessing for podcast preparation.
     """
     @spaces.GPU
+    def __init__(self, pdf_path, output_path):
         """
         Initialize the PDFTextExtractor with paths and model details.
             output_path (str): Path to save the cleaned text file.
             model_name (str): Name of the model to use for text processing.
         """
+        model_name="meta-llama/Llama-3.2-1B-Instruct"
         self.pdf_path = pdf_path
         self.output_path = output_path
         self.max_chars = 100000