Spaces:

SR05
/

Delhi_Irish_visa_decisions

Running

SR05 committed 9 days ago

Commit

82e2987

•

1 Parent(s): 40b182b

Update loading_file.py (#7)

Files changed (1) hide show

loading_file.py CHANGED Viewed

@@ -3,8 +3,10 @@ from bs4 import BeautifulSoup
 from io import BytesIO
 import streamlit as st
-# URL and headers for the file source
 url = "https://www.ireland.ie/en/india/newdelhi/services/visas/processing-times-and-decisions/"
 headers = {
     "User-Agent": (
         "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
@@ -19,11 +21,14 @@ def load_data_file():
         soup = BeautifulSoup(response.content, 'html.parser')
         links = soup.find_all('a')
         file_url = None
         for link in links:
             link_text = link.get_text(strip=True)
             if "Visa decisions made from 1 January 2024 to" in link_text:
                 file_url = link.get('href')
                 break
         if file_url:
@@ -32,11 +37,9 @@ def load_data_file():
             file_response = requests.get(file_url, headers=headers)
             if file_response.status_code == 200:
-                return BytesIO(file_response.content), link_text
             else:
                 st.error(f"Failed to download the file. Status code: {file_response.status_code}")
-        else:
-            st.error("The specified link was not found.")
     else:
         st.error(f"Failed to retrieve the webpage. Status code: {response.status_code}")
     return None, None

 from io import BytesIO
 import streamlit as st
+# URL of the website to scrape
 url = "https://www.ireland.ie/en/india/newdelhi/services/visas/processing-times-and-decisions/"
+# Headers for the HTTP request
 headers = {
     "User-Agent": (
         "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
         soup = BeautifulSoup(response.content, 'html.parser')
         links = soup.find_all('a')
+        # Look for the link to the .ods file
         file_url = None
+        file_name = None
         for link in links:
             link_text = link.get_text(strip=True)
             if "Visa decisions made from 1 January 2024 to" in link_text:
                 file_url = link.get('href')
+                file_name = link_text
                 break
         if file_url:
             file_response = requests.get(file_url, headers=headers)
             if file_response.status_code == 200:
+                return BytesIO(file_response.content), file_name
             else:
                 st.error(f"Failed to download the file. Status code: {file_response.status_code}")
     else:
         st.error(f"Failed to retrieve the webpage. Status code: {response.status_code}")
     return None, None