Harika22 committed on
Commit
58faf30
·
verified ·
1 Parent(s): ac9f5ed

Update pages/5_Descriptive Statistics.py

Browse files
Files changed (1) hide show
  1. pages/5_Descriptive Statistics.py +54 -1
pages/5_Descriptive Statistics.py CHANGED
@@ -316,7 +316,9 @@ st.markdown(multi)
316
  st.latex(r'''
317
  \sigma^2 = \frac{\sum (X_i - \mu)^2}{N}''')
318
  multi = '''There are two types of variance:
 
319
  :red[population variance]
 
320
  :red[sample variance]'''
321
  st.markdown(multi)
322
 
@@ -338,4 +340,55 @@ st.latex(r'''
338
  st.subheader("Coefficient of Variation (Sample)")
339
  st.latex(r'''
340
  \text{CV} = \left( \frac{s}{\bar{X}} \right) \times 100''')
341
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
316
  st.latex(r'''
317
  \sigma^2 = \frac{\sum (X_i - \mu)^2}{N}''')
318
  multi = '''There are two types of variance:
319
+
320
  :red[population variance]
321
+
322
  :red[sample variance]'''
323
  st.markdown(multi)
324
 
 
340
  st.subheader("Coefficient of Variation (Sample)")
341
  st.latex(r'''
342
  \text{CV} = \left( \frac{s}{\bar{X}} \right) \times 100''')
343
+
344
+
345
+ st.subheader("Standard Deviation",divider="violet")
346
+ multi = '''Variance can't be easily interpreted because the deviations are squared, i.e., variance is expressed in squared units of the data; to overcome this, standard deviation (the square root of the variance) is used.
347
+
348
+ --->**The greater the spread, the larger the standard deviation**
349
+
350
+ --->**spread is directly proportional to the standard deviation**
351
+
352
+ --->to check the consistency of data, the coefficient of variation is used'''
353
+ st.markdown(multi)
354
+ st.latex(r'''
355
+ \sigma = \sqrt{\frac{\sum (X_i - \mu)^2}{N}}''')
356
+
357
+ multi = '''Outliers can be detected using the standard deviation.
358
+
359
+ If a point lies more than 3 standard deviations away from the mean, it is considered an outlier.
360
+
361
+ 3 standard deviations (3σ) is used as the threshold to check for outliers'''
362
+ st.markdown(multi)
363
+
364
+ st.subheader("Coefficient of Standard Deviation",divider="violet")
365
+ st.latex(r'''
366
+ \text{Coefficient of Standard Deviation} = \frac{\sigma}{\mu}''')
367
+
368
+ multi = '''As the sample data is a subset of the population data, there is an error known as sampling error ---> to overcome this error, degrees of freedom (n - 1) are used.
369
+
370
+ When there are outliers in the data, a robust measure of dispersion is used, known as **MAD - Median Absolute Deviation**'''
371
+ st.markdown(multi)
372
+
373
+ st.subheader("Population standard deviation")
374
+ st.latex(r'''
375
+ \sigma = \sqrt{\frac{\sum (X_i - \mu)^2}{N}}''')
376
+
377
+ st.subheader("Sample standard deviation")
378
+ st.latex(r'''
379
+ s = \sqrt{\frac{\sum (X_i - \bar{X})^2}{n - 1}}''')
380
+
381
+ multi = '''--->σ is the population standard deviation
382
+
383
+ --->s is the sample standard deviation
384
+
385
+ --->Xi represents each data point
386
+
387
+ --->μ is the population mean
388
+
389
+ --->X̄ is the sample mean
390
+
391
+ --->N is the total number of data points in the population
392
+
393
+ --->n is the number of data points in the sample.'''
394
+ st.markdown(multi)