Spaces:
Build error
Build error
Ronio Jerico Roque
Update spinner messages to reflect file upload actions across multiple classes
c75d56b | import streamlit as st | |
| import requests | |
| from dotenv import load_dotenv | |
| import os | |
| import pandas as pd | |
| import pandas._libs.tslibs.parsing | |
| import time | |
| import chardet | |
| from helper.telemetry import collect_telemetry | |
| from helper.upload_File import uploadFile | |
| from helper.button_behaviour import hide_button | |
| from helper.initialize_analyze_session import initialize_analyze_session | |
| class Seo: | |
| def __init__(self, model_url): | |
| self.uploaded_files = [] | |
| self.file_dict = {} | |
| self.model_url = model_url | |
| #self.analyst_name = analyst_name | |
| #self.data_src = data_src | |
| #self.analyst_description = analyst_description | |
| self.initialize() | |
| self.row1() | |
| def initialize(self): | |
| # FOR ENV | |
| load_dotenv() | |
| # AGENT NAME | |
| #st.header(self.analyst_name) | |
| # EVALUATION FORM LINK | |
| '''url = os.getenv('Link') | |
| st.write('Evaluation Form: [Link](%s)' % url) | |
| # RETURN BUTTON | |
| try: | |
| if st.button("Return", type='primary'): | |
| st.switch_page("./pages/home.py") | |
| except Exception: | |
| pass''' | |
| if 'bounce_rate' not in st.session_state: | |
| st.session_state['bounce_rate'] = '' | |
| if 'page_index' not in st.session_state: | |
| st.session_state['page_index'] = '' | |
| if 'others' not in st.session_state: | |
| st.session_state['others'] = '' | |
| if 'df_traffic' not in st.session_state: | |
| st.session_state['df_traffic'] = '' | |
| if 'df_seo' not in st.session_state: | |
| st.session_state['df_seo'] = '' | |
| def detect_encoding(self, uploaded_file): | |
| result = chardet.detect(uploaded_file.read(100000)) | |
| uploaded_file.seek(0) # Reset file pointer to the beginning | |
| return result['encoding'] | |
| def keyword_ranking(self, df_seo): | |
| keyword_ranking = df_seo | |
| st.session_state['keyword_ranking'] = keyword_ranking | |
| keywords_ranking_sorted = keyword_ranking.sort_values("Position", ascending=True) | |
| keywords_ranking_top_10 = keywords_ranking_sorted[keywords_ranking_sorted["Position"] <= 10].shape[0] | |
| keywords_ranking_top_100 = keywords_ranking_sorted[keywords_ranking_sorted["Position"] <= 100].shape[0] | |
| keyword_ranking = { | |
| 'Keyword_top_10': keywords_ranking_top_10, | |
| 'Keyword_top_100': keywords_ranking_top_100 | |
| } | |
| st.session_state['keyword_ranking'] = keyword_ranking | |
| def traffic_files(self, df_traffic): | |
| traffic_channels = df_traffic | |
| try: | |
| traffic_channels.rename(columns={traffic_channels.columns[0]: 'date'}, inplace=True) | |
| traffic_channels['date'] = pd.to_datetime(traffic_channels['date'], format='mixed') | |
| except pandas._libs.tslibs.parsing.DateParseError: | |
| pass | |
| traffic_channels_sort = traffic_channels.sort_values("date", ascending=False) | |
| organic_traffic = traffic_channels_sort['Organic Search'].values[0] | |
| paid_traffic = traffic_channels_sort['Paid Search'].values[0] | |
| direct_traffic = traffic_channels_sort['Direct'].values[0] | |
| referral_traffic = traffic_channels_sort['Referral'].values[0] | |
| st.session_state['organic_traffic'] = organic_traffic | |
| st.session_state['paid_traffic'] = paid_traffic | |
| st.session_state['direct_traffic'] = direct_traffic | |
| st.session_state['referral_traffic'] = referral_traffic | |
| def ga4_traffic(self, others): | |
| st.session_state['others'] = others | |
| ga4_paid_social = others['Sessions'].values[0] | |
| ga4_organic_traffic = others['Sessions'].values[4] | |
| ga4_direct_traffic = others['Sessions'].values[2] | |
| ga4_referral_traffic = others['Sessions'].values[3] | |
| st.session_state['ga4_paid_social'] = ga4_paid_social | |
| st.session_state['ga4_organic_traffic'] = ga4_organic_traffic | |
| st.session_state['ga4_direct_traffic'] = ga4_direct_traffic | |
| st.session_state['ga4_referral_traffic'] = ga4_referral_traffic | |
| def delete_sessions(self): | |
| try: | |
| del st.session_state['df_traffic'] | |
| del st.session_state['others'] | |
| del st.session_state['df_seo'] | |
| del st.session_state['keyword_ranking'] | |
| del st.session_state['ga4_paid_social'] | |
| del st.session_state['ga4_organic_traffic'] | |
| del st.session_state['ga4_direct_traffic'] | |
| del st.session_state['ga4_referral_traffic'] | |
| del st.session_state['organic_traffic'] | |
| del st.session_state['paid_traffic'] | |
| del st.session_state['direct_traffic'] | |
| del st.session_state['referral_traffic'] | |
| except KeyError: | |
| pass | |
| def process (self): | |
| session = st.session_state.analyze | |
| if ((self.uploaded_file or self.others or self.uploaded_file_seo) or (self.page_index or self.bounce_rate)) and session == 'clicked': | |
| seo_keywords = "" | |
| traffic_channels = "" | |
| traffic_aqcuisition = "" | |
| pages_index = "" | |
| bounce_rate = "" | |
| with st.spinner('Uploading Seo Files...', show_time=True): | |
| st.write('') | |
| # INITIALIZING SESSIONS | |
| pages_index += f"Pages Indexed: {self.page_index}\n" | |
| bounce_rate += f"Bounce Rate: {self.bounce_rate}\n" | |
| ''' | |
| try: | |
| backlink_files = self.file_dict | |
| combined_text += f"Number of backlinks {backlink_files}\n\n" | |
| except KeyError: | |
| pass | |
| ''' | |
| try: | |
| df_traffic = st.session_state['df_traffic'] | |
| self.traffic_files(df_traffic) | |
| organic_traffic = st.session_state['organic_traffic'] | |
| paid_traffic = st.session_state['paid_traffic'] | |
| direct_traffic = st.session_state['direct_traffic'] | |
| referral_traffic = st.session_state['referral_traffic'] | |
| traffic_channels += f"\nOrganic Traffic: {organic_traffic}" | |
| traffic_channels += f"\nPaid Traffic: {paid_traffic}" | |
| traffic_channels += f"\nDirect Traffic: {direct_traffic}" | |
| traffic_channels += f"\nReferral Traffic: {referral_traffic}" | |
| traffic_channels += df_traffic.to_csv(index=True) | |
| except AttributeError: | |
| pass | |
| except KeyError as e: | |
| # Check if 'df_traffic' is the missing key (no file uploaded) | |
| if self.uploaded_file_seo: | |
| pass | |
| else: | |
| # This would be triggered if df_traffic exists but the other keys are missing | |
| st.info("Incorrect Traffic Channels SEMRush format. Please upload a valid SEMRush file.") | |
| try: | |
| df_seo = st.session_state['df_seo'] | |
| self.keyword_ranking(df_seo) | |
| keyword_ranking = st.session_state['keyword_ranking'] | |
| seo_keywords += f"\nKeyword Ranking Top 10: {keyword_ranking['Keyword_top_10']}" | |
| seo_keywords += f"\nKeyword Ranking Top 100: {keyword_ranking['Keyword_top_100']}\n\n" | |
| seo_keywords += df_seo.to_csv(index=True) | |
| except AttributeError: | |
| pass | |
| except KeyError: | |
| pass | |
| try: | |
| others = st.session_state['others'] | |
| self.ga4_traffic(others) | |
| ga4_paid_social = st.session_state['ga4_paid_social'] | |
| ga4_organic_traffic = st.session_state['ga4_organic_traffic'] | |
| ga4_direct_traffic = st.session_state['ga4_direct_traffic'] | |
| ga4_referral_traffic = st.session_state['ga4_referral_traffic'] | |
| traffics = ga4_direct_traffic + ga4_organic_traffic + ga4_paid_social + ga4_referral_traffic | |
| traffic_aqcuisition += f"Traffics: {traffics}" | |
| traffic_aqcuisition += f"\nPaid Traffic: {ga4_paid_social}\nOrganic Traffic: {ga4_organic_traffic}\nDirect Traffic: {ga4_direct_traffic}\nReferral Traffic: {ga4_referral_traffic}" | |
| except KeyError: | |
| if self.others: | |
| pass | |
| else: | |
| # This would be triggered if df_traffic exists but the other keys are missing | |
| #st.info("Incorrect Traffic Acquisition GA4 format. Please upload a valid GA4 file.") | |
| pass | |
| except TypeError: | |
| st.info("Incorrect Traffic Acquisition GA4 format. Please upload a valid GA4 file.") | |
| #result = self.request_model(payload_txt_seo_keywords) | |
| #end_time = time.time() | |
| #time_lapsed = end_time - start_time | |
| debug_info_seo_keywords = {'data_field' : 'SEO Keywords', 'result': seo_keywords} | |
| debug_info_traffic_channels = {'data_field' : 'Traffic Channels', 'result': traffic_channels} | |
| debug_info_traffic_aqcuisition = {'data_field' : 'Traffic Acquisition', 'result': traffic_aqcuisition} | |
| debug_info_pages_index = {'data_field' : 'Pages Indexed', 'result': pages_index} | |
| debug_info_bounce_rate = {'data_field' : 'Bounce Rate', 'result': bounce_rate} | |
| ''' | |
| debug_info = { | |
| #'analyst': self.analyst_name, | |
| 'url_uuid': self.model_url.split("-")[-1], | |
| 'time_lapsed': time_lapsed, | |
| #'backlink_files': [*st.session_state['uploaded_files']], | |
| #'seo_file': [self.uploaded_file_seo.name] if self.uploaded_file_seo else ['Not available'], | |
| 'payload': payload_txt, | |
| 'result': result, | |
| } | |
| ''' | |
| if self.bounce_rate: | |
| st.session_state['bounce_rate'] = 'uploaded' | |
| collect_telemetry(debug_info_bounce_rate) | |
| if self.page_index: | |
| st.session_state['pages_index'] = 'uploaded' | |
| collect_telemetry(debug_info_pages_index) | |
| if self.others: | |
| st.session_state['others'] = 'uploaded' | |
| collect_telemetry(debug_info_traffic_aqcuisition) | |
| if self.uploaded_file: | |
| st.session_state['df_traffic'] = 'uploaded' | |
| collect_telemetry(debug_info_traffic_channels) | |
| if self.uploaded_file_seo: | |
| st.session_state['df_seo'] = 'uploaded' | |
| collect_telemetry(debug_info_seo_keywords) | |
| #with st.expander("Debug information", icon="⚙"): | |
| # st.write(debug_info) | |
| #del st.session_state[df_traffic] | |
| #del st.session_state[df_seo] | |
| #del st.session_state[others] | |
| st.session_state['analyzing'] = False | |
| def row1(self): | |
| #st.write("") # FOR SPACINGs | |
| #st.write("") # FOR SPACINGs | |
| ''' | |
| self.uploaded_files = st.file_uploader("Backlinks (SEO)", type=['pdf', 'csv'], accept_multiple_files=True, key="seo1") | |
| if self.uploaded_files: | |
| self.delete_sessions() | |
| upload.upload_file_seo(self.uploaded_files) | |
| self.file_dict = upload.file_dict | |
| ''' | |
| #st.write("") # FOR THE HIDE BUTTON | |
| self.uploaded_file_seo = st.file_uploader("SEO Keywords - SEMRush", type='csv', key="seo2") | |
| if self.uploaded_file_seo: | |
| self.delete_sessions() | |
| try: | |
| encoding_seo = self.detect_encoding(self.uploaded_file_seo) | |
| st.session_state['df_seo'] = pd.read_csv(self.uploaded_file_seo, encoding=encoding_seo, low_memory=False) | |
| except Exception: | |
| pass | |
| self.uploaded_file = st.file_uploader("Traffic Channels - SEMRush", type='csv') | |
| if self.uploaded_file: | |
| self.delete_sessions() | |
| try: | |
| encoding = self.detect_encoding(self.uploaded_file) | |
| st.session_state['df_traffic'] = pd.read_csv(self.uploaded_file, encoding=encoding, low_memory=False) | |
| except Exception: | |
| pass | |
| st.write("") # FOR THE HIDE BUTTON | |
| self.others = st.file_uploader("Traffic Acquisition - GA4", type='csv', key="seo5") | |
| if self.others: | |
| try: | |
| st.session_state['others'] = pd.read_csv(self.others, skiprows=9) | |
| except Exception: | |
| pass | |
| self.page_index = st.text_input("Pages Indexed - Google Search Console:", placeholder='Enter Pages Indexed') | |
| self.bounce_rate = st.text_input("Bounce Rate - GA4:", placeholder='Enter Bounce Rate') | |
| followers = { | |
| 'Pages Indexed': self.page_index if self.page_index else 'N/A', | |
| 'Bounce Rate': self.bounce_rate if self.bounce_rate else 'N/A' | |
| } | |
| #st.write("") # FOR THE HIDE BUTTON | |
| #st.write("") # FOR THE HIDE BUTTON | |
| #st.write("AI Analyst Output: ") | |
| st.session_state['analyzing'] = False | |
| #st.write("") # FOR THE HIDE BUTTON | |
| #analyze_button = st.button("Analyze", disabled=initialize_analyze_session()) | |
| self.process() | |
| if __name__ == "__main__": | |
| st.set_page_config(layout="wide") | |
| upload = uploadFile() | |