Update pages/Introduction.py
Browse files- pages/Introduction.py +6 -0
pages/Introduction.py
CHANGED
|
@@ -13,4 +13,10 @@ st.subheader("NLP Techniques")
|
|
| 13 |
# Intro paragraph shown under the "NLP Techniques" subheader.
st.markdown("<p>NLP encompasses a wide array of techniques aimed at enabling computers to process and understand human language. These tasks can be categorized into several broad areas, each addressing different aspects of language processing. Here are some of the key NLP techniques:</p>", unsafe_allow_html=True)
|
| 14 |
|
| 15 |
st.write("**1. Text Processing and Preprocessing In NLP**")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
|
|
|
|
| 13 |
# Intro paragraph shown under the "NLP Techniques" subheader.
st.markdown("<p>NLP encompasses a wide array of techniques aimed at enabling computers to process and understand human language. These tasks can be categorized into several broad areas, each addressing different aspects of language processing. Here are some of the key NLP techniques:</p>", unsafe_allow_html=True)
|
| 14 |
|
| 15 |
st.write("**1. Text Processing and Preprocessing In NLP**")
|
| 16 |
+
st.write("Before performing any analysis or modeling, raw text data must be cleaned and prepared.")
|
| 17 |
+
st.write("**a. Tokenization**")
|
| 18 |
+
st.write("Splits text into smaller units like words or sentences.")
|
| 19 |
+
st.write("**Types:**")
|
| 20 |
+
# Single-quoted literal: the example contains straight double quotes, which
# would otherwise terminate the string early and make the file unparseable.
st.write('(i) Word Tokenization: Breaking text into words. Example: "I love NLP" → [“I”, “love”, “NLP”]')
|
| 21 |
+
# Single-quoted literal: the example contains straight double quotes, which
# would otherwise terminate the string early and make the file unparseable.
st.write('(ii) Sentence Tokenization: Breaking text into sentences. Example: "I love NLP. It’s fascinating!" → [“I love NLP.”, “It’s fascinating!”]')
|
| 22 |
|