Spaces:
Sleeping
Sleeping
Update pages/1_Introduction to Data_Analysis.py
Browse files
pages/1_Introduction to Data_Analysis.py
CHANGED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import streamlit as st
|
| 2 |
+
# --- Page header -----------------------------------------------------------
# Title and tagline shown at the top of the page.
st.title(":blue[Introduction to Data Analysis]")
st.caption("***From data dust to diamond insights — analysis is the alchemy***")

# --- Section: what data analysis is ----------------------------------------
st.subheader("What is Data Analysis?...", divider="green")

# NOTE(review): "meaningful sights" below is probably meant to read
# "meaningful insights" — confirm with the author before changing the
# user-facing text.
multi = '''The process of inspecting the data , cleaning the data and transforming the data into meaningful sights from extracting the data that is collected.
It is the process of systematically applying statistical, logical, and computational techniques to describe, summarize, and evaluate the data.
'''
st.markdown(multi)
|
| 9 |
+
# --- Section: overview of the three data types -----------------------------
st.subheader("Types of Data", divider="green")

multi = '''For performing the data analysis we need to know the type of data that we collected . Majorly data is divided based on the pre-defined structure.
Based on this data is classified into three types.
'''
st.markdown(multi)

# One markdown call per data type, each wrapped in the ":violet[...]" markup;
# the emitted strings are identical to the three hand-written literals.
for type_label in (
    "1.Structured data",
    "2.Unstructured data",
    "3.Semi-Structured data",
):
    st.markdown(f":violet[{type_label}]")
|
| 20 |
+
# --- Section: structured data ----------------------------------------------
st.subheader("1.Structured Data", divider="red")

multi = '''Structured data is well-formatted and organized data.
It is usually in tabular format known as RDBMS("Relational Database Management System") where the data is stored in rows and columns.
It is easy to search and typically known as quantitative data.
Examples of structured data is - Excel files(.xlsx), SQL files etc...
'''

# The illustration is rendered first, then the descriptive text below it.
st.image("https://cdn-uploads.huggingface.co/production/uploads/66bde9bf3c885d04498227a0/ewYq-ld-Fr7SCE7Th0idQ.png")
st.markdown(multi)
|
| 28 |
+
# --- Section: unstructured data --------------------------------------------
st.subheader("2.Unstructured Data", divider="red")

# NOTE(review): "pre-definely" below looks like a typo (perhaps
# "pre-defined"); left unchanged because it is user-facing text — confirm
# the intended wording.
multi = '''Unstructured data is not pre-definely formatted and organized data.
This type of data doesn't fit into rows and columns it is combination of text, images and audio etc..
It is not easy to analyse and perform the analysis typically known as qualitative data.
Examples of unstructured data is - Text, images, audios, videos etc...
'''

# The illustration is rendered first, then the descriptive text below it.
st.image("https://cdn-uploads.huggingface.co/production/uploads/66bde9bf3c885d04498227a0/o96nGe5pQ7EkbXTdjOkpW.png")
st.markdown(multi)
|
| 36 |
+
# --- Section: semi-structured data -----------------------------------------
st.subheader("3.Semistructured Data", divider="red")

multi = '''Semi structured data is a hybrid of structured and unstructured data.
As the data is combination of both it is much more difficult for analysis.
Examples of semi-structured data is - csv files, json files and xml files
'''

# The illustration is rendered first, then the descriptive text below it.
st.image("https://cdn-uploads.huggingface.co/production/uploads/66bde9bf3c885d04498227a0/Gz_AZKg8M7e9K96TsVenU.png")
# Fixed: this call was misspelled "st.marldown", which is not a Streamlit
# function and would raise AttributeError before the text was rendered.
st.markdown(multi)
|