Spaces:
Sleeping
Sleeping
Update pages/Data Collection.py
Browse files- pages/Data Collection.py +38 -12
pages/Data Collection.py
CHANGED
|
@@ -40,7 +40,7 @@ st.markdown(
|
|
| 40 |
unsafe_allow_html=True
|
| 41 |
)
|
| 42 |
|
| 43 |
-
# Ensure session state for
|
| 44 |
if "current_page" not in st.session_state:
|
| 45 |
st.session_state.current_page = "main"
|
| 46 |
|
|
@@ -134,8 +134,7 @@ if st.session_state.current_page == "main":
|
|
| 134 |
st.write("Click to explore Structured Data Formats:")
|
| 135 |
if st.button("Explore Excel"):
|
| 136 |
navigate_to("explore_excel")
|
| 137 |
-
|
| 138 |
-
navigate_to("explore_csv")
|
| 139 |
|
| 140 |
# Unstructured Data Content
|
| 141 |
elif data_type == "Unstructured Data":
|
|
@@ -156,6 +155,17 @@ if st.session_state.current_page == "main":
|
|
| 156 |
Examples include multimedia files (images, videos, audio), emails, and social media posts.
|
| 157 |
""")
|
| 158 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 159 |
st.write("Click to explore Unstructured Data Formats:")
|
| 160 |
if st.button("Explore Images"):
|
| 161 |
navigate_to("explore_images")
|
|
@@ -184,7 +194,22 @@ if st.session_state.current_page == "main":
|
|
| 184 |
This type of data is more flexible than structured data but still organized enough to allow for easier analysis than unstructured data.
|
| 185 |
""")
|
| 186 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 187 |
st.write("Click to explore Semi-Structured Data Formats:")
|
|
|
|
|
|
|
| 188 |
if st.button("Explore JSON"):
|
| 189 |
navigate_to("explore_json")
|
| 190 |
if st.button("Explore XML"):
|
|
@@ -203,15 +228,6 @@ elif st.session_state.current_page == "explore_excel":
|
|
| 203 |
if st.button("Go Back"):
|
| 204 |
navigate_to("main")
|
| 205 |
|
| 206 |
-
elif st.session_state.current_page == "explore_csv":
|
| 207 |
-
st.markdown("""
|
| 208 |
-
<h3 style="color: #e25822;">Exploring CSV</h3>
|
| 209 |
-
""", unsafe_allow_html=True)
|
| 210 |
-
st.write("""
|
| 211 |
-
CSV is a simple text-based format where data fields are separated by commas.
|
| 212 |
-
""")
|
| 213 |
-
if st.button("Go Back"):
|
| 214 |
-
navigate_to("main")
|
| 215 |
|
| 216 |
elif st.session_state.current_page == "explore_images":
|
| 217 |
st.markdown("""
|
|
@@ -253,6 +269,16 @@ elif st.session_state.current_page == "explore_text":
|
|
| 253 |
if st.button("Go Back"):
|
| 254 |
navigate_to("main")
|
| 255 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 256 |
elif st.session_state.current_page == "explore_json":
|
| 257 |
st.markdown("""
|
| 258 |
<h3 style="color: #e25822;">Exploring JSON</h3>
|
|
|
|
| 40 |
unsafe_allow_html=True
|
| 41 |
)
|
| 42 |
|
| 43 |
+
# Ensure session state for navigation
|
| 44 |
if "current_page" not in st.session_state:
|
| 45 |
st.session_state.current_page = "main"
|
| 46 |
|
|
|
|
| 134 |
st.write("Click to explore Structured Data Formats:")
|
| 135 |
if st.button("Explore Excel"):
|
| 136 |
navigate_to("explore_excel")
|
| 137 |
+
|
|
|
|
| 138 |
|
| 139 |
# Unstructured Data Content
|
| 140 |
elif data_type == "Unstructured Data":
|
|
|
|
| 155 |
Examples include multimedia files (images, videos, audio), emails, and social media posts.
|
| 156 |
""")
|
| 157 |
|
| 158 |
+
st.markdown("""
|
| 159 |
+
<div style="text-align: left; margin-top: 20px;">
|
| 160 |
+
<h4 style="color: #5b2c6f;">Characteristics:</h4>
|
| 161 |
+
</div>
|
| 162 |
+
""", unsafe_allow_html=True)
|
| 163 |
+
st.write("""
|
| 164 |
+
- Does not follow a specific schema or structure.
|
| 165 |
+
- Cannot be stored in traditional tabular formats like rows and columns.
|
| 166 |
+
- Requires advanced tools like machine learning or natural language processing (NLP) for analysis.
|
| 167 |
+
""")
|
| 168 |
+
|
| 169 |
st.write("Click to explore Unstructured Data Formats:")
|
| 170 |
if st.button("Explore Images"):
|
| 171 |
navigate_to("explore_images")
|
|
|
|
| 194 |
This type of data is more flexible than structured data but still organized enough to allow for easier analysis than unstructured data.
|
| 195 |
""")
|
| 196 |
|
| 197 |
+
st.markdown("""
|
| 198 |
+
<div style="text-align: left; margin-top: 20px;">
|
| 199 |
+
<h4 style="color: #5b2c6f;">Examples:</h4>
|
| 200 |
+
</div>
|
| 201 |
+
""", unsafe_allow_html=True)
|
| 202 |
+
st.write("""
|
| 203 |
+
Examples of semi-structured data include:
|
| 204 |
+
- **CSV**: Comma-separated values in plain-text files.
|
| 205 |
+
- **JSON**: A lightweight data-interchange format used in web applications.
|
| 206 |
+
- **XML**: Extensible Markup Language for structured document encoding.
|
| 207 |
+
- **HTML**: Markup language for web pages.
|
| 208 |
+
""")
|
| 209 |
+
|
| 210 |
st.write("Click to explore Semi-Structured Data Formats:")
|
| 211 |
+
if st.button("Explore CSV"):
|
| 212 |
+
navigate_to("explore_csv")
|
| 213 |
if st.button("Explore JSON"):
|
| 214 |
navigate_to("explore_json")
|
| 215 |
if st.button("Explore XML"):
|
|
|
|
| 228 |
if st.button("Go Back"):
|
| 229 |
navigate_to("main")
|
| 230 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 231 |
|
| 232 |
elif st.session_state.current_page == "explore_images":
|
| 233 |
st.markdown("""
|
|
|
|
| 269 |
if st.button("Go Back"):
|
| 270 |
navigate_to("main")
|
| 271 |
|
| 272 |
+
elif st.session_state.current_page == "explore_csv":
|
| 273 |
+
st.markdown("""
|
| 274 |
+
<h3 style="color: #e25822;">Exploring CSV</h3>
|
| 275 |
+
""", unsafe_allow_html=True)
|
| 276 |
+
st.write("""
|
| 277 |
+
CSV is a simple text-based format where data fields are separated by commas.
|
| 278 |
+
""")
|
| 279 |
+
if st.button("Go Back"):
|
| 280 |
+
navigate_to("main")
|
| 281 |
+
|
| 282 |
elif st.session_state.current_page == "explore_json":
|
| 283 |
st.markdown("""
|
| 284 |
<h3 style="color: #e25822;">Exploring JSON</h3>
|