Update pages/Introduction.py
Browse files
- pages/Introduction.py +7 -2
pages/Introduction.py
CHANGED
|
@@ -17,6 +17,11 @@ st.write("Before performing any analysis or modeling, raw text data must be clea
|
|
| 17 |
st.write("**a. Tokenization**")
|
| 18 |
st.write("Splits text into smaller units like words or sentences.")
|
| 19 |
st.write("**Types:**")
|
| 20 |
-
|
| 21 |
-
st.write("(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
|
|
|
|
| 17 |
st.write("**a. Tokenization**")
|
| 18 |
st.write("Splits text into smaller units like words or sentences.")
|
| 19 |
st.write("**Types:**")
|
| 20 |
+
|
| 21 |
+
st.write("**(i) Word Tokenization:** Breaking text into words.")
|
| 22 |
+
st.write("Example: _'I love NLP'_ → [‘I’, ‘love’, ‘NLP’]")
|
| 23 |
+
|
| 24 |
+
st.write("**(ii) Sentence Tokenization:** Breaking text into sentences.")
|
| 25 |
+
st.write("Example: _'I love NLP. It’s fascinating!'_ → [‘I love NLP.’, ‘It’s fascinating!’]")
|
| 26 |
+
|
| 27 |
|