Spaces:

GIZ
/

Development-Project-Synergy-Finder

Running on CPU Upgrade

App Files Files Community

Jan Mühlnikel committed on Mar 24

Commit

c8e0175

•

1 Parent(s): 21b6daa

added single matching result table

Browse files

Files changed (7) hide show

__pycache__/similarity_page.cpython-310.pyc +0 -0
functions/__pycache__/calc_matches.cpython-310.pyc +0 -0
functions/__pycache__/single_similar.cpython-310.pyc +0 -0
functions/single_similar.py +15 -0
modules/{result_table.py → multimatch_result_table.py} +1 -2
modules/singlematch_result_table.py +83 -0
similarity_page.py +12 -2

__pycache__/similarity_page.cpython-310.pyc CHANGED Viewed

Binary files a/__pycache__/similarity_page.cpython-310.pyc and b/__pycache__/similarity_page.cpython-310.pyc differ

functions/__pycache__/calc_matches.cpython-310.pyc CHANGED Viewed

Binary files a/functions/__pycache__/calc_matches.cpython-310.pyc and b/functions/__pycache__/calc_matches.cpython-310.pyc differ

functions/__pycache__/single_similar.cpython-310.pyc ADDED Viewed

Binary file (675 Bytes). View file

functions/single_similar.py ADDED Viewed

	@@ -0,0 +1,15 @@

+import pandas as pd
+import numpy as np
+def find_similar(p_index, similarity_matrix, projects_df, top_x):
+    """Return the ``top_x`` projects most similar to the project at ``p_index``.
+
+    Args:
+        p_index: Positional index of the selected project; selects one row
+            of ``similarity_matrix``.
+        similarity_matrix: Indexable collection of similarity rows. Positions
+            within a row are used as positional indexes into ``projects_df``.
+        projects_df: DataFrame of projects, aligned by position with the
+            entries of a similarity row.
+        top_x: Maximum number of rows to return.
+
+    Returns:
+        A copy of the selected ``projects_df`` rows, ordered by descending
+        similarity, with an added ``"similarity"`` column. The entry for
+        ``p_index`` itself is not filtered out.
+    """
+    selected_row = similarity_matrix[p_index]
+    # A scipy sparse row cannot be argsorted directly; densify it first.
+    if hasattr(selected_row, "toarray"):
+        selected_row = selected_row.toarray()
+    selected_row = np.asarray(selected_row).ravel()
+    # Clamp the count: a plain ``[-0:]`` slice would return every entry.
+    count = min(max(int(top_x), 0), selected_row.size)
+    ranked = np.argsort(selected_row)
+    top_indexes = ranked[ranked.size - count:][::-1]
+    top_values = selected_row[top_indexes]
+    # Copy before adding a column so the caller's frame is never touched and
+    # pandas does not raise SettingWithCopyWarning.
+    top_projects_df = projects_df.iloc[top_indexes].copy()
+    top_projects_df["similarity"] = top_values
+    return top_projects_df

modules/{result_table.py → multimatch_result_table.py} RENAMED Viewed

@@ -1,8 +1,7 @@
 import streamlit as st
-from st_aggrid import AgGrid, GridOptionsBuilder
 import pandas as pd
-def show_table(p1_df, p2_df):
         st.write("------------------")
         p1_df = p1_df.reset_index(drop=True)

 import streamlit as st
 import pandas as pd
+def show_multi_table(p1_df, p2_df):
         st.write("------------------")
         p1_df = p1_df.reset_index(drop=True)

modules/singlematch_result_table.py ADDED Viewed

	@@ -0,0 +1,83 @@

+import streamlit as st
+import pandas as pd
+def _split_codes(value):
+    """Split a ';'-separated code string into a list of its non-empty codes."""
+    # Missing values arrive as NaN (a float), not as a string.
+    if not isinstance(value, str):
+        return []
+    return [code for code in value.split(";") if code]
+def show_single_table(result_df):
+    """Render the single-match result table with ``st.dataframe``.
+
+    Args:
+        result_df: DataFrame with the columns ``similarity``, ``iati_id``,
+            ``title_main``, ``orga_abbreviation``, ``client``,
+            ``description_main``, ``country``, ``crs_3_code``, ``crs_5_code``
+            and ``sgd_pred_code``. The caller's frame is not modified,
+            because ``reset_index`` returns a new frame.
+    """
+    result_df = result_df.reset_index(drop=True)
+    # Transformations
+    # Empty segments (e.g. from a trailing ';') are dropped; missing values
+    # become an empty list instead of raising.
+    result_df["crs_3_code_list"] = result_df['crs_3_code'].apply(_split_codes)
+    result_df["crs_5_code_list"] = result_df['crs_5_code'].apply(_split_codes)
+    result_df["sdg_list"] = result_df['sgd_pred_code'].apply(lambda x: [x] if pd.notna(x) else [])
+    # The first two characters of ``country`` are used as the flag code;
+    # missing countries fall back to the placeholder "xx" flag.
+    result_df["flag"] = result_df['country'].apply(lambda x: f"https://flagicons.lipis.dev/flags/4x3/{x[:2].lower()}.svg" if pd.notna(x) else "https://flagicons.lipis.dev/flags/4x3/xx.svg")
+    st.dataframe(
+        result_df[["similarity", "iati_id", "title_main", "orga_abbreviation", "client", "description_main", "country", "flag", "sdg_list", "crs_3_code_list", "crs_5_code_list"]],
+        use_container_width = True,
+        # One 35px row per result plus one 35px header row.
+        height = 35 + 35 * len(result_df),
+        column_config={
+            "similarity": st.column_config.TextColumn(
+                "Similarity",
+                help="similarity to selected project",
+                disabled=True,
+                width="small"
+            ),
+            "iati_id": st.column_config.TextColumn(
+                "IATI ID",
+                help="IATI Project ID",
+                disabled=True,
+                width="small"
+            ),
+            "orga_abbreviation": st.column_config.TextColumn(
+                "Organization",
+                help="Abbreviation of the organization",
+                disabled=True,
+                width="small"
+            ),
+            "client": st.column_config.TextColumn(
+                "Client",
+                help="Client organization of customer",
+                disabled=True,
+                width="small"
+            ),
+            "title_main": st.column_config.TextColumn(
+                "Title",
+                help="If title not in English, title in other language provided",
+                disabled=True,
+                width="large"
+            ),
+            "description_main": st.column_config.TextColumn(
+                "Description",
+                help="If description not in English, description in other language provided",
+                disabled=True,
+                width="large"
+            ),
+            "country": st.column_config.TextColumn(
+                "Country",
+                help="Country of project",
+                disabled=True,
+                width="small"
+            ),
+            "flag": st.column_config.ImageColumn(
+                "Flag",
+                help="country flag",
+                width="small"
+            ),
+            "sdg_list": st.column_config.ListColumn(
+                "SDG Prediction",
+                help="Prediction of SDG's",
+                width="small"
+            ),
+            "crs_3_code_list": st.column_config.ListColumn(
+                "CRS 3",
+                help="CRS 3 code given by organization",
+                width="small"
+            ),
+            "crs_5_code_list": st.column_config.ListColumn(
+                "CRS 5",
+                help="CRS 5 code given by organization",
+                width="small"
+            ),
+        },
+        hide_index=True,
+    )

similarity_page.py CHANGED Viewed

@@ -10,10 +10,12 @@ import pandas as pd
 from scipy.sparse import load_npz
 import pickle
 from sentence_transformers import SentenceTransformer
-from modules.result_table import show_table
 from functions.filter_projects import filter_projects
 from functions.calc_matches import calc_matches
 from functions.same_country_filter import same_country_filter
 import psutil
 import os
 import gc
@@ -235,7 +237,7 @@ def show_multi_matching_page():
             p1_df, p2_df = calc_matches(filtered_df, compare_df, sim_matrix, TOP_X_PROJECTS)
         # SHOW THE RESULT
-        show_table(p1_df, p2_df)
         del p1_df, p2_df
     else:
         st.write("Select at least on CRS 3, SDG or type in a query")
@@ -265,4 +267,12 @@ def show_single_matching_page():
                 placeholder = " ",
                 options = search_list,
                 )

 from scipy.sparse import load_npz
 import pickle
 from sentence_transformers import SentenceTransformer
+from modules.multimatch_result_table import show_multi_table
+from modules.singlematch_result_table import show_single_table
 from functions.filter_projects import filter_projects
 from functions.calc_matches import calc_matches
 from functions.same_country_filter import same_country_filter
+from functions.single_similar import find_similar
 import psutil
 import os
 import gc
             p1_df, p2_df = calc_matches(filtered_df, compare_df, sim_matrix, TOP_X_PROJECTS)
         # SHOW THE RESULT
+        show_multi_table(p1_df, p2_df)
         del p1_df, p2_df
     else:
         st.write("Select at least on CRS 3, SDG or type in a query")
                 placeholder = " ",
                 options = search_list,
                 )
+    if project_option:
+        selected_index = search_list.index(project_option)
+        top_projects_df = find_similar(selected_index, sim_matrix, projects_df, 10)
+        show_single_table(top_projects_df)