Update pages/Introduction.py
Browse files- pages/Introduction.py +11 -2
pages/Introduction.py
CHANGED
|
@@ -49,10 +49,10 @@ st.markdown('<p style="color:blue;"><b>f. Text Normalization</b></p>', unsafe_al
|
|
| 49 |
st.write("Converts text to a standard format (lowercasing, removing punctuation, etc.).")
|
| 50 |
|
| 51 |
|
| 52 |
-
st.markdown('<p style="color:blue;"><b>Feature Extraction Techniques</b></p>', unsafe_allow_html=True)
|
| 53 |
st.write("Text needs to be transformed into numerical representations for machine learning models.")
|
| 54 |
|
| 55 |
-
st.markdown('<p style="color:blue;"><b>Bag of Words (BoW)</b></p>', unsafe_allow_html=True)
|
| 56 |
st.write("Represents text as a vector of word frequencies or occurrences, ignoring grammar and order")
|
| 57 |
st.write("Examples:")
|
| 58 |
st.write("Text: “I love NLP” and “NLP is great”")
|
|
@@ -60,3 +60,12 @@ st.write("Vocabulary: [“I”, “love”, “NLP”, “is”, “great”]")
|
|
| 60 |
st.write("Vector for “I love NLP”: [1, 1, 1, 0, 0]")
|
| 61 |
|
| 62 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
st.write("Converts text to a standard format (lowercasing, removing punctuation, etc.).")
|
| 50 |
|
| 51 |
|
| 52 |
+
st.markdown('<p style="color:blue;"><b>2. Feature Extraction Techniques</b></p>', unsafe_allow_html=True)
|
| 53 |
st.write("Text needs to be transformed into numerical representations for machine learning models.")
|
| 54 |
|
| 55 |
+
st.markdown('<p style="color:blue;"><b>a. Bag of Words (BoW)</b></p>', unsafe_allow_html=True)
|
| 56 |
st.write("Represents text as a vector of word frequencies or occurrences, ignoring grammar and order")
|
| 57 |
st.write("Examples:")
|
| 58 |
st.write("Text: “I love NLP” and “NLP is great”")
|
|
|
|
| 60 |
st.write("Vector for “I love NLP”: [1, 1, 1, 0, 0]")
|
| 61 |
|
| 62 |
|
| 63 |
+
st.markdown('<p style="color:blue;"><b>b. Term Frequency-Inverse Document Frequency (TF-IDF)</b></p>', unsafe_allow_html=True)
|
| 64 |
+
st.write("Assigns weights to words based on their frequency in a document and their rarity across all documents.")
|
| 65 |
+
st.write("Examples:")
|
| 66 |
+
st.write("Text: “I love NLP” and “NLP is great”")
|
| 67 |
+
st.write("Vocabulary: [“I”, “love”, “NLP”, “is”, “great”]")
|
| 68 |
+
st.write("Vector for “I love NLP” (TF × IDF, with IDF = ln(N/df)): [0.69, 0.69, 0, 0, 0]")
|
| 69 |
+
|
| 70 |
+
|
| 71 |
+
|