Harika22 committed on
Commit
1d0bfe1
·
verified ·
1 Parent(s): 0d400f0

Update pages/5_Pre-procesing_of_text.py

Browse files
Files changed (1) hide show
  1. pages/5_Pre-procesing_of_text.py +21 -7
pages/5_Pre-procesing_of_text.py CHANGED
@@ -75,12 +75,6 @@ st.markdown("✅ **Grammar Preservation** – If grammar is needed, avoid removi
75
 
76
  st.success("🚀 Well-structured and clean text significantly boosts ML model performance!")
77
 
78
- st.markdown(
79
- """
80
- <div class='caption'>Step into the world of NLP and discover the endless possibilities of language-driven innovation!</div>
81
- """,
82
- unsafe_allow_html=True,
83
- )
84
 
85
  st.markdown("<div class='section'>", unsafe_allow_html=True)
86
  st.markdown("<h2 class='title'>🔍 NLP Data Preprocessing</h2>", unsafe_allow_html=True)
@@ -91,6 +85,16 @@ st.success("📌 **Benefits of Preprocessing:**\n\n✅ Reduces dimensionality\n\
91
 
92
  st.markdown("### ✨ **Essential Preprocessing Steps:**")
93
 
 
 
 
 
 
 
 
 
 
 
94
  st.markdown("✅ **Converting Text Case** – Reduces dimensionality; case conversion depends on problem statement.")
95
  st.markdown("✅ **Removing URLs, Tags, and Mentions** – Retain only if required by the problem statement.")
96
  st.markdown("✅ **Handling Emojis** – Preserve or convert emoji data based on context.")
@@ -98,4 +102,14 @@ st.markdown("✅ **Expanding Contractions & Acronyms** – Convert abbreviations
98
  st.markdown("✅ **Stop Words Removal** – Optional, useful for text simplification.")
99
  st.markdown("✅ **Stemming & Lemmatization** – Perform only if grammar is **not** crucial for analysis.")
100
 
101
- st.markdown("</div>", unsafe_allow_html=True)
 
 
 
 
 
 
 
 
 
 
 
75
 
76
  st.success("🚀 Well-structured and clean text significantly boosts ML model performance!")
77
 
 
 
 
 
 
 
78
 
79
  st.markdown("<div class='section'>", unsafe_allow_html=True)
80
  st.markdown("<h2 class='title'>🔍 NLP Data Preprocessing</h2>", unsafe_allow_html=True)
 
85
 
86
  st.markdown("### ✨ **Essential Preprocessing Steps:**")
87
 
88
+ st.markdown(
89
+ """
90
+ <div class='image-container'>
91
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/66bde9bf3c885d04498227a0/HtdtNm-UJdfN057BeKSgV.png",width=400>
92
+ </div>
93
+ """,
94
+ unsafe_allow_html=True,
95
+ )
96
+
97
+
98
  st.markdown("✅ **Converting Text Case** – Reduces dimensionality; case conversion depends on problem statement.")
99
  st.markdown("✅ **Removing URLs, Tags, and Mentions** – Retain only if required by the problem statement.")
100
  st.markdown("✅ **Handling Emojis** – Preserve or convert emoji data based on context.")
 
102
  st.markdown("✅ **Stop Words Removal** – Optional, useful for text simplification.")
103
  st.markdown("✅ **Stemming & Lemmatization** – Perform only if grammar is **not** crucial for analysis.")
104
 
105
+ st.markdown("</div>", unsafe_allow_html=True)
106
+
107
+
108
+
109
+
110
+ st.markdown(
111
+ """
112
+ <div class='caption'>Step into the world of NLP and discover the endless possibilities of language-driven innovation!</div>
113
+ """,
114
+ unsafe_allow_html=True,
115
+ )