Spaces:

acecalisto3
/

CEEMEESEEK

Runtime error

acecalisto3 committed on Oct 4

Commit

b723646

•

1 Parent(s): 14db2f5

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -63,7 +63,6 @@ def monitor_urls(storage_location, urls, scrape_interval, content_type, stop_scr
     except Exception as e:
         logging.error(f"Error starting ChromeDriver: {e}")
-# Define a function to start scraping
 def start_scraping(storage_location, urls, scrape_interval, content_type, stop_scraping_flag):
     global CURRENT_TASK, HISTORY
@@ -80,7 +79,7 @@ def start_scraping(storage_location, urls, scrape_interval, content_type, stop_s
         try:
             with webdriver.Chrome(service=Service(webdriver.ChromeDriverManager().install()), options=Options()) as driver:
                 driver.get(url)
-                time.sleep(2 )  # Wait for the page to load
                 if content_type == "text":
                     initial_content = driver.page_source
                 elif content_type == "media":
@@ -94,8 +93,8 @@ def start_scraping(storage_location, urls, scrape_interval, content_type, stop_s
         except (NoSuchElementException, Exception) as e:
             HISTORY.append(f"Error accessing {url}: {e}")
-    # Start a new thread for monitoring URLs
-    threading.Thread(target=monitor_urls, args=(storage_location, urls, scrape_interval, content_type, stop_scraping_flag)).start()
     return f"Started scraping {', '.join(urls)} every {scrape_interval} minutes."

     except Exception as e:
         logging.error(f"Error starting ChromeDriver: {e}")
 def start_scraping(storage_location, urls, scrape_interval, content_type, stop_scraping_flag):
     global CURRENT_TASK, HISTORY
         try:
             with webdriver.Chrome(service=Service(webdriver.ChromeDriverManager().install()), options=Options()) as driver:
                 driver.get(url)
+                time.sleep(2)  # Wait for the page to load
                 if content_type == "text":
                     initial_content = driver.page_source
                 elif content_type == "media":
         except (NoSuchElementException, Exception) as e:
             HISTORY.append(f"Error accessing {url}: {e}")
+        # Start a new thread for monitoring URLs
+        threading.Thread(target=monitor_urls, args=(storage_location, urls, scrape_interval, content_type, stop_scraping_flag)).start()
     return f"Started scraping {', '.join(urls)} every {scrape_interval} minutes."