Spaces:

egumasa
/

simple-text-analyzer

Building

App Files Community

egumasa committed on Jul 28, 2025

Commit

025fa56

1 Parent(s): e7279e4

tag set

Browse files

Files changed (7) hide show

test_column_matching.py → test/test_column_matching.py +0 -0
test_csv_comma_handling.py → test/test_csv_comma_handling.py +0 -0
test_plot_fix.py → test/test_plot_fix.py +0 -0
test_reference_loading_issue.py → test/test_reference_loading_issue.py +0 -0
web_app/app.py +1 -1
web_app/components/ui_components.py +7 -7
web_app/handlers/pos_handlers.py +26 -0

test_column_matching.py → test/test_column_matching.py RENAMED Viewed

File without changes

test_csv_comma_handling.py → test/test_csv_comma_handling.py RENAMED Viewed

File without changes

test_plot_fix.py → test/test_plot_fix.py RENAMED Viewed

File without changes

test_reference_loading_issue.py → test/test_reference_loading_issue.py RENAMED Viewed

File without changes

web_app/app.py CHANGED Viewed

@@ -48,7 +48,7 @@ def main():
     # Route to appropriate interface
     if tool_choice == 'Lexical Sophistication':
         render_lexical_sophistication_interface()
-    elif tool_choice == 'POS Parser':
         render_pos_parser_interface()
     elif tool_choice == 'Corpus Data Visualizer':
         render_corpus_visualization_interface()

     # Route to appropriate interface
     if tool_choice == 'Lexical Sophistication':
         render_lexical_sophistication_interface()
+    elif tool_choice == 'POS & Dependency Parser':
         render_pos_parser_interface()
     elif tool_choice == 'Corpus Data Visualizer':
         render_corpus_visualization_interface()

web_app/components/ui_components.py CHANGED Viewed

@@ -106,9 +106,9 @@ class UIComponents:
         st.subheader("SpaCy Model")
         new_model_size = st.selectbox(
             "Model Size",
-            options=['trf', 'md'],
             format_func=lambda x: 'Transformer (trf)' if x == 'trf' else 'Medium (md)',
-            index=0 if st.session_state.model_size == 'trf' else 1
         )
         # Only update if changed
@@ -122,7 +122,7 @@ class UIComponents:
         st.subheader("Analysis Tools")
         return st.radio(
             "Select Tool",
-            options=['Lexical Sophistication', 'POS Parser', 'Frequency Analysis', 'Corpus Data Visualizer'],
             key='tool_choice'
         )
@@ -195,9 +195,9 @@ class UIComponents:
         col1, col2 = st.columns(2)
         with col1:
-            token_analysis = st.checkbox("☑️ Token-based", value=True, key="token_analysis_enabled")
         with col2:
-            lemma_analysis = st.checkbox("☑️ Lemma-based", value=True, key="lemma_analysis_enabled")
         # Global Options
         st.write("### ⚙️ Global Options")
@@ -319,7 +319,7 @@ class UIComponents:
             # Group-level enable/disable checkbox
             group_key = f"group_enabled_{base_name}"
             group_enabled = st.checkbox(
-                f"☑️ **{base_name}**",
                 value=True,  # Default enabled
                 key=group_key,
                 help=f"Enable/disable all {base_name} analyses"
@@ -424,7 +424,7 @@ class UIComponents:
                 # Measure checkbox (pre-selected based on defaults)
                 measure_key = f"measure_{entry_name}_{measure}"
                 selected = st.checkbox(
-                    f"☑️ {measure.replace('_', ' ').title()}",
                     value=measure in st.session_state[f'custom_measures_{entry_name}'],
                     key=measure_key,
                     help=f"Include {measure} in analysis"

         st.subheader("SpaCy Model")
         new_model_size = st.selectbox(
             "Model Size",
+            options=['md', 'trf'],
             format_func=lambda x: 'Transformer (trf)' if x == 'trf' else 'Medium (md)',
+            index=0 if st.session_state.model_size == 'md' else 1
         )
         # Only update if changed
         st.subheader("Analysis Tools")
         return st.radio(
             "Select Tool",
+            options=['Lexical Sophistication', 'POS & Dependency Parser', 'Frequency Analysis', 'Corpus Data Visualizer'],
             key='tool_choice'
         )
         col1, col2 = st.columns(2)
         with col1:
+            token_analysis = st.checkbox("Token-based", value=True, key="token_analysis_enabled")
         with col2:
+            lemma_analysis = st.checkbox("Lemma-based", value=True, key="lemma_analysis_enabled")
         # Global Options
         st.write("### ⚙️ Global Options")
             # Group-level enable/disable checkbox
             group_key = f"group_enabled_{base_name}"
             group_enabled = st.checkbox(
+                f"**{base_name}**",
                 value=True,  # Default enabled
                 key=group_key,
                 help=f"Enable/disable all {base_name} analyses"
                 # Measure checkbox (pre-selected based on defaults)
                 measure_key = f"measure_{entry_name}_{measure}"
                 selected = st.checkbox(
+                    f"{measure.replace('_', ' ').title()}",
                     value=measure in st.session_state[f'custom_measures_{entry_name}'],
                     key=measure_key,
                     help=f"Include {measure} in analysis"

web_app/handlers/pos_handlers.py CHANGED Viewed

@@ -136,6 +136,32 @@ class POSHandlers:
             mime="text/tab-separated-values"
         )
         # Dependency visualization
         st.write("**Dependency Visualization**")
         try:

             mime="text/tab-separated-values"
         )
+        with st.expander("## **See Tagset**"):
+            # col1, col2, col3 = st.columns(3)
+            st.markdown("""
+The following table is based on [UD guideline](https://universaldependencies.org/u/dep/index.html).
+Note that spaCy English model is trained on  [ClearNLP tag set](https://github.com/clir/clearnlp-guidelines/blob/master/md/specifications/dependency_labels.md)
+#### Dependency relations
+|                           | **Nominals**        | **Clauses**        | **Modifier words** | **Function Words** |
+|---------------------------|--------------------|--------------------|--------------------|--------------------|
+| **Core arguments**        | `nsubj`, `obj`, `iobj` | `csubj`, `ccomp`, `xcomp` |                    |                    |
+| **Non-core dependents**   | `obl`, `vocative`, `expl`, `dislocated` | `advcl`            | `advmod`, `discourse` | `aux`, `cop`, `mark` |
+| **Nominal dependents**    | `nmod`, `appos`, `nummod` | `acl`              | `amod`            | `det`, `clf`, `case` |
+#### Additional Relations
+| **Coordination** | **Headless** | **Loose**      | **Special**        | **Other**        |
+|------------------|-------------|----------------|--------------------|------------------|
+| `conj`, `cc`   | `fixed`, `flat` | `list`, `parataxis` | `compound`, `orphan`, `goeswith`, `reparandum` | `punct`, `root`, `dep` |
+                    """)
         # Dependency visualization
         st.write("**Dependency Visualization**")
         try: