Spaces:

GIZ
/

Development-Project-Synergy-Finder

Sleeping

App Files Files Community

Jan Mühlnikel committed on Apr 12, 2024

Commit

39b49f4

2 Parent(s): 1de85ab 1db84e9

Merge branch 'main' of https://huggingface.co/spaces/GIZ/eb-synergy-app

Browse files

Files changed (4) hide show

functions/filter_projects.py +49 -0
modules/navbar.py +40 -0
requirements.txt +9 -0
similarity_page.py +3 -1

functions/filter_projects.py ADDED Viewed

	@@ -0,0 +1,49 @@

+import pandas as pd
+from functions.semantic_search import search
+def contains_code(crs_codes, code_list):
+    codes = str(crs_codes).split(';')
+    return any(code in code_list for code in codes)
+def filter_projects(df, crs3_list, crs5_list, sdg_str, country_code_list, orga_code_list, query, model, embeddings, TOP_X_PROJECTS=30):
+    # Check if filters where not all should be selected are empty
+    if crs3_list != [] or crs5_list != [] or sdg_str != "" or query != "":
+        # FILTER CRS
+        if crs3_list and not crs5_list:
+            df = df[df['crs_3_code'].apply(lambda x: contains_code(x, crs3_list))]
+        elif crs3_list and crs5_list:
+            df = df[df['crs_5_code'].apply(lambda x: contains_code(x, crs5_list))]
+        elif not crs3_list and crs5_list:
+            df = df[df['crs_5_code'].apply(lambda x: contains_code(x, crs5_list))]
+        # FILTER SDG
+        if sdg_str != "":
+            df = df[df["sgd_pred_code"] == int(sdg_str)]
+        # FILTER COUNTRY
+        if country_code_list != []:
+            country_filtered_df = pd.DataFrame()
+            for c in country_code_list:
+                c_df = df[df["country"].str.contains(c, na=False)]
+                country_filtered_df = pd.concat([country_filtered_df, c_df], ignore_index=False)
+            df = country_filtered_df
+        # FILTER ORGANIZATION
+        if orga_code_list != []:
+            df = df[df['orga_abbreviation'].isin(orga_code_list)]
+        # FILTER QUERY
+        if query != "" and len(df) > 0:
+            if len(df) < TOP_X_PROJECTS:
+                TOP_X_PROJECTS = len(df)
+            df = search(query, model, embeddings, df, TOP_X_PROJECTS)
+        return df

modules/navbar.py ADDED Viewed

	@@ -0,0 +1,40 @@

+import streamlit as st
+from streamlit_option_menu import option_menu # https://github.com/victoryhb/streamlit-option-menu
+import similarity_page
+# giz-dsc colors
+# orange: #e5b50d
+# green: #48d47b
+# blue: #0da2dc
+# grey: #dadada
+# giz colors https://www.giz.de/cdc/en/html/59638.html
+# red: #c80f0f
+# grey: #6f6f6f
+# light_grey: #b2b2b2
+# light_red: #eba1a3
+def show_navbar():
+    #st.markdown("<h1 style='color: red;'>THIS APP IS WORK IN PROGRESS ...</h1>", unsafe_allow_html=True)
+    #st.title("Development Bank Synergy Mapper")
+    # enlarge tab fontsizes
+    css = '''
+    <style>
+        .stTabs [data-baseweb="tab-list"] button [data-testid="stMarkdownContainer"] p {
+        font-size:1rem;
+        }
+    </style>
+    '''
+    st.markdown(css, unsafe_allow_html=True)
+    tab1, tab2 = st.tabs([
+        "🔍 Multi-Project Matching",
+        "🎯 Single-Project Matching"
+        ])
+    with tab1:
+        similarity_page.show_multi_matching_page()
+    with tab2:
+        similarity_page.show_single_matching_page()

requirements.txt ADDED Viewed

	@@ -0,0 +1,9 @@

+numpy==1.26.4
+pandas==2.1.4
+streamlit==1.32.2
+streamlit-option-menu==0.3.12
+scipy==1.12.0
+faiss-cpu==1.8.0
+faiss-gpu==1.7.2
+sentence-transformers==2.5.1
+streamlit-aggrid==0.3.4

similarity_page.py CHANGED Viewed

@@ -17,13 +17,15 @@ from functions.filter_single import filter_single
 from functions.calc_matches import calc_matches
 from functions.same_country_filter import same_country_filter
 from functions.single_similar import find_similar
-import psutil
 import os
 import gc
 def get_process_memory():
     process = psutil.Process(os.getpid())
     return process.memory_info().rss / (1024 * 1024)
 # Catch DATA
 # Load Similarity matrix

 from functions.calc_matches import calc_matches
 from functions.same_country_filter import same_country_filter
 from functions.single_similar import find_similar
+#import psutil
 import os
 import gc
+"""
 def get_process_memory():
     process = psutil.Process(os.getpid())
     return process.memory_info().rss / (1024 * 1024)
+"""
 # Catch DATA
 # Load Similarity matrix