# Sources:
#   https://www.r-bloggers.com/2019/02/descriptive-summary-statistics-with-descriptr/
#   https://descriptr.rsquaredacademy.com/index.html
# Installation (pick one). The CRAN route is left commented out; the GitHub
# route is the one that actually runs.
# Option 1 - release version from CRAN:
# install.packages("descriptr")
# Option 2 - development version from GitHub (called through devtools):
# install.packages("devtools")
# NOTE(review): this call is executed on every run of the script; as the
# message printed below shows, it skips the install when the remote SHA1 has
# not changed since the last install.
devtools::install_github("rsquaredacademy/descriptr")
Skipping install of 'descriptr' from a github remote, the SHA1 (99fc706e) has not changed since last install.
Use `force = TRUE` to force installation
# Attach descriptr so the ds_* functions used below can be called unqualified.
library(descriptr)
# Disabled call; presumably launches the package's interactive Shiny app
# (inferred from the name -- confirm).
# ds_launch_shiny_app()
# Show the structure of mtcarz, the data frame passed to every call below
# (presumably bundled with descriptr, since nothing else loads it -- confirm).
str(mtcarz)
'data.frame': 32 obs. of 11 variables:
$ mpg : num 21 21 22.8 21.4 18.7 18.1 14.3 24.4 22.8 19.2 ...
$ cyl : Factor w/ 3 levels "4","6","8": 2 2 1 2 3 2 3 1 1 2 ...
$ disp: num 160 160 108 258 360 ...
$ hp : num 110 110 93 110 175 105 245 62 95 123 ...
$ drat: num 3.9 3.9 3.85 3.08 3.15 2.76 3.21 3.69 3.92 3.92 ...
$ wt : num 2.62 2.88 2.32 3.21 3.44 ...
$ qsec: num 16.5 17 18.6 19.4 17 ...
$ vs : Factor w/ 2 levels "0","1": 1 1 2 2 1 2 1 2 2 2 ...
$ am : Factor w/ 2 levels "0","1": 2 2 2 1 1 1 1 1 1 1 ...
$ gear: Factor w/ 3 levels "3","4","5": 2 2 2 1 1 1 1 2 2 2 ...
$ carb: Factor w/ 6 levels "1","2","3","4",..: 4 4 1 1 2 1 4 2 2 4 ...
# Screen the whole data frame: prints, per column, the data type, factor
# levels and missing-value count/percentage, followed by overall
# missing-value totals.
ds_screener(mtcarz)
-----------------------------------------------------------------------
| Column Name | Data Type | Levels | Missing | Missing (%) |
-----------------------------------------------------------------------
| mpg | numeric | NA | 0 | 0 |
| cyl | factor | 4 6 8 | 0 | 0 |
| disp | numeric | NA | 0 | 0 |
| hp | numeric | NA | 0 | 0 |
| drat | numeric | NA | 0 | 0 |
| wt | numeric | NA | 0 | 0 |
| qsec | numeric | NA | 0 | 0 |
| vs | factor | 0 1 | 0 | 0 |
| am | factor | 0 1 | 0 | 0 |
| gear | factor | 3 4 5 | 0 | 0 |
| carb | factor |1 2 3 4 6 8| 0 | 0 |
-----------------------------------------------------------------------
Overall Missing Values 0
Percentage of Missing Values 0 %
Rows with Missing Values 0
Columns With Missing Values 0
# Univariate summary of one numeric column (mpg): location, spread and shape
# statistics, a quantile table, and the five lowest and five highest values
# with their observation indices (Obs).
ds_summary_stats(mtcarz, mpg)
-------------------------------- Variable: mpg --------------------------------
Univariate Analysis
N 32.00 Variance 36.32
Missing 0.00 Std Deviation 6.03
Mean 20.09 Range 23.50
Median 19.20 Interquartile Range 7.38
Mode 10.40 Uncorrected SS 14042.31
Trimmed Mean 19.95 Corrected SS 1126.05
Skewness 0.67 Coeff Variation 30.00
Kurtosis -0.02 Std Error Mean 1.07
Quantiles
Quantile Value
Max 33.90
99% 33.44
95% 31.30
90% 30.09
Q3 22.80
Median 19.20
Q1 15.43
10% 14.34
5% 12.00
1% 10.40
Min 10.40
Extreme Values
Low High
Obs Value Obs Value
15 10.4 20 33.9
16 10.4 18 32.4
24 13.3 19 30.4
7 14.3 28 30.4
17 14.7 26 27.3
# Same summary for several columns in one call: one report is printed per
# variable, in the order the columns are listed (mpg, then disp).
ds_summary_stats(mtcarz, mpg, disp)
-------------------------------- Variable: mpg --------------------------------
Univariate Analysis
N 32.00 Variance 36.32
Missing 0.00 Std Deviation 6.03
Mean 20.09 Range 23.50
Median 19.20 Interquartile Range 7.38
Mode 10.40 Uncorrected SS 14042.31
Trimmed Mean 19.95 Corrected SS 1126.05
Skewness 0.67 Coeff Variation 30.00
Kurtosis -0.02 Std Error Mean 1.07
Quantiles
Quantile Value
Max 33.90
99% 33.44
95% 31.30
90% 30.09
Q3 22.80
Median 19.20
Q1 15.43
10% 14.34
5% 12.00
1% 10.40
Min 10.40
Extreme Values
Low High
Obs Value Obs Value
15 10.4 20 33.9
16 10.4 18 32.4
24 13.3 19 30.4
7 14.3 28 30.4
17 14.7 26 27.3
------------------------------- Variable: disp -------------------------------
Univariate Analysis
N 32.00 Variance 15360.80
Missing 0.00 Std Deviation 123.94
Mean 230.72 Range 400.90
Median 196.30 Interquartile Range 205.18
Mode 275.80 Uncorrected SS 2179627.47
Trimmed Mean 228.00 Corrected SS 476184.79
Skewness 0.42 Coeff Variation 53.72
Kurtosis -1.07 Std Error Mean 21.91
Quantiles
Quantile Value
Max 472.00
99% 468.28
95% 449.00
90% 396.00
Q3 326.00
Median 196.30
Q1 120.83
10% 80.61
5% 77.35
1% 72.53
Min 71.10
Extreme Values
Low High
Obs Value Obs Value
20 71.1 15 472
19 75.7 16 460
18 78.7 17 440
26 79 25 400
28 95.1 5 360
# Frequency table for a numeric column: mpg is split into bins and each bin's
# count, cumulative count and percentages are printed. The third argument (4)
# matches the number of bins in the printed table.
ds_freq_table(mtcarz, mpg, 4)
Variable: mpg
|---------------------------------------------------------------------------|
| Bins | Frequency | Cum Frequency | Percent | Cum Percent |
|---------------------------------------------------------------------------|
| 10.4 - 16.3 | 10 | 10 | 31.25 | 31.25 |
|---------------------------------------------------------------------------|
| 16.3 - 22.1 | 13 | 23 | 40.62 | 71.88 |
|---------------------------------------------------------------------------|
| 22.1 - 28 | 5 | 28 | 15.62 | 87.5 |
|---------------------------------------------------------------------------|
| 28 - 33.9 | 4 | 32 | 12.5 | 100 |
|---------------------------------------------------------------------------|
| Total | 32 | - | 100.00 | - |
|---------------------------------------------------------------------------|
# Keep the binned frequency table as an object (assignment suppresses the
# printed table) and hand it to plot() to draw it.
# NOTE(review): the resulting chart is not captured in this transcript.
k <- ds_freq_table(mtcarz, mpg, 4)
plot(k)
# For each listed column (disp, then mpg) print the summary statistics
# followed by a frequency distribution. No bin count is passed here and the
# printed tables have 5 bins each.
ds_auto_summary_stats(mtcarz, disp, mpg)
------------------------------- Variable: disp -------------------------------
----------------------------- Summary Statistics -----------------------------
------------------------------- Variable: disp -------------------------------
Univariate Analysis
N 32.00 Variance 15360.80
Missing 0.00 Std Deviation 123.94
Mean 230.72 Range 400.90
Median 196.30 Interquartile Range 205.18
Mode 275.80 Uncorrected SS 2179627.47
Trimmed Mean 228.00 Corrected SS 476184.79
Skewness 0.42 Coeff Variation 53.72
Kurtosis -1.07 Std Error Mean 21.91
Quantiles
Quantile Value
Max 472.00
99% 468.28
95% 449.00
90% 396.00
Q3 326.00
Median 196.30
Q1 120.83
10% 80.61
5% 77.35
1% 72.53
Min 71.10
Extreme Values
Low High
Obs Value Obs Value
20 71.1 15 472
19 75.7 16 460
18 78.7 17 440
26 79 25 400
28 95.1 5 360
NULL
--------------------------- Frequency Distribution ---------------------------
Variable: disp
|---------------------------------------------------------------------------|
| Bins | Frequency | Cum Frequency | Percent | Cum Percent |
|---------------------------------------------------------------------------|
| 71.1 - 151.3 | 12 | 12 | 37.5 | 37.5 |
|---------------------------------------------------------------------------|
| 151.3 - 231.5 | 5 | 17 | 15.62 | 53.12 |
|---------------------------------------------------------------------------|
| 231.5 - 311.6 | 6 | 23 | 18.75 | 71.88 |
|---------------------------------------------------------------------------|
| 311.6 - 391.8 | 5 | 28 | 15.62 | 87.5 |
|---------------------------------------------------------------------------|
| 391.8 - 472 | 4 | 32 | 12.5 | 100 |
|---------------------------------------------------------------------------|
| Total | 32 | - | 100.00 | - |
|---------------------------------------------------------------------------|
-------------------------------- Variable: mpg --------------------------------
----------------------------- Summary Statistics -----------------------------
-------------------------------- Variable: mpg --------------------------------
Univariate Analysis
N 32.00 Variance 36.32
Missing 0.00 Std Deviation 6.03
Mean 20.09 Range 23.50
Median 19.20 Interquartile Range 7.38
Mode 10.40 Uncorrected SS 14042.31
Trimmed Mean 19.95 Corrected SS 1126.05
Skewness 0.67 Coeff Variation 30.00
Kurtosis -0.02 Std Error Mean 1.07
Quantiles
Quantile Value
Max 33.90
99% 33.44
95% 31.30
90% 30.09
Q3 22.80
Median 19.20
Q1 15.43
10% 14.34
5% 12.00
1% 10.40
Min 10.40
Extreme Values
Low High
Obs Value Obs Value
15 10.4 20 33.9
16 10.4 18 32.4
24 13.3 19 30.4
7 14.3 28 30.4
17 14.7 26 27.3
NULL
--------------------------- Frequency Distribution ---------------------------
Variable: mpg
|-----------------------------------------------------------------------|
| Bins | Frequency | Cum Frequency | Percent | Cum Percent |
|-----------------------------------------------------------------------|
| 10.4 - 15.1 | 6 | 6 | 18.75 | 18.75 |
|-----------------------------------------------------------------------|
| 15.1 - 19.8 | 12 | 18 | 37.5 | 56.25 |
|-----------------------------------------------------------------------|
| 19.8 - 24.5 | 8 | 26 | 25 | 81.25 |
|-----------------------------------------------------------------------|
| 24.5 - 29.2 | 2 | 28 | 6.25 | 87.5 |
|-----------------------------------------------------------------------|
| 29.2 - 33.9 | 4 | 32 | 12.5 | 100 |
|-----------------------------------------------------------------------|
| Total | 32 | - | 100.00 | - |
|-----------------------------------------------------------------------|
# Summarise a numeric column (mpg) within each level of a factor (cyl).
# Printing the stored result shows one column of statistics per cyl level.
k <- ds_group_summary(mtcarz, cyl, mpg)
k
by
-----------------------------------------------------------------------------------------
| Statistic/Levels| 4| 6| 8|
-----------------------------------------------------------------------------------------
| Obs| 11| 7| 14|
| Minimum| 21.4| 17.8| 10.4|
| Maximum| 33.9| 21.4| 19.2|
| Mean| 26.66| 19.74| 15.1|
| Median| 26| 19.7| 15.2|
| Mode| 22.8| 21| 10.4|
| Std. Deviation| 4.51| 1.45| 2.56|
| Variance| 20.34| 2.11| 6.55|
| Skewness| 0.35| -0.26| -0.46|
| Kurtosis| -1.43| -1.83| 0.33|
| Uncorrected SS| 8023.83| 2741.14| 3277.34|
| Corrected SS| 203.39| 12.68| 85.2|
| Coeff Variation| 16.91| 7.36| 16.95|
| Std. Error Mean| 1.36| 0.55| 0.68|
| Range| 12.5| 3.6| 8.8|
| Interquartile Range| 7.6| 2.35| 1.85|
-----------------------------------------------------------------------------------------
# Access the tidy_stats element of the grouped-summary object. Its printed
# form was not captured here (presumably a data-frame version of the table
# above -- confirm).
k$tidy_stats
# NOTE(review): k already holds this result from the identical call earlier;
# the reassignment only keeps this chunk self-contained.
k <- ds_group_summary(mtcarz, cyl, mpg)
# Draw the grouped summary (chart not captured in this transcript).
plot(k)
# Grouped summaries of mpg for each listed factor in turn: first by cyl
# (levels 4/6/8), then by gear (levels 3/4/5).
ds_auto_group_summary(mtcarz, cyl, gear, mpg)
by
-----------------------------------------------------------------------------------------
| Statistic/Levels| 4| 6| 8|
-----------------------------------------------------------------------------------------
| Obs| 11| 7| 14|
| Minimum| 21.4| 17.8| 10.4|
| Maximum| 33.9| 21.4| 19.2|
| Mean| 26.66| 19.74| 15.1|
| Median| 26| 19.7| 15.2|
| Mode| 22.8| 21| 10.4|
| Std. Deviation| 4.51| 1.45| 2.56|
| Variance| 20.34| 2.11| 6.55|
| Skewness| 0.35| -0.26| -0.46|
| Kurtosis| -1.43| -1.83| 0.33|
| Uncorrected SS| 8023.83| 2741.14| 3277.34|
| Corrected SS| 203.39| 12.68| 85.2|
| Coeff Variation| 16.91| 7.36| 16.95|
| Std. Error Mean| 1.36| 0.55| 0.68|
| Range| 12.5| 3.6| 8.8|
| Interquartile Range| 7.6| 2.35| 1.85|
-----------------------------------------------------------------------------------------
by
-----------------------------------------------------------------------------------------
| Statistic/Levels| 3| 4| 5|
-----------------------------------------------------------------------------------------
| Obs| 15| 12| 5|
| Minimum| 10.4| 17.8| 15|
| Maximum| 21.5| 33.9| 30.4|
| Mean| 16.11| 24.53| 21.38|
| Median| 15.5| 22.8| 19.7|
| Mode| 10.4| 21| 15|
| Std. Deviation| 3.37| 5.28| 6.66|
| Variance| 11.37| 27.84| 44.34|
| Skewness| -0.09| 0.7| 0.56|
| Kurtosis| -0.38| -0.77| -1.83|
| Uncorrected SS| 4050.52| 7528.9| 2462.89|
| Corrected SS| 159.15| 306.29| 177.37|
| Coeff Variation| 20.93| 21.51| 31.15|
| Std. Error Mean| 0.87| 1.52| 2.98|
| Range| 11.1| 16.1| 15.4|
| Interquartile Range| 3.9| 7.08| 10.2|
-----------------------------------------------------------------------------------------
# Tabular descriptive statistics. No output was captured for these calls, so
# the notes here are inferred from the function names and arguments -- confirm
# against the descriptr reference before relying on them.
# Explicit column selection (mpg, disp, hp):
ds_tidy_stats(mtcarz, mpg, disp, hp)
# No columns named; presumably applied to every numeric column of mtcarz.
ds_measures_location(mtcarz)
ds_measures_variation(mtcarz)
ds_measures_symmetry(mtcarz)
ds_percentiles(mtcarz)
# Two-way table of cyl (rows) by gear (columns). Each cell stacks four values
# in the order given by the "Cell Contents" legend: frequency, share of all
# observations, share of the row, share of the column.
# The "Percent"/"Row Pct"/"Col Pct" values are printed as proportions (0-1),
# not as percentages.
# NOTE(review): the column-total proportions for gear 3 and 5 print as 0.468
# and 0.155, whereas 15/32 and 5/32 round to 0.469 and 0.156; they appear to
# be sums of the already-rounded cell values.
ds_cross_table(mtcarz, cyl, gear)
Cell Contents
|---------------|
| Frequency |
| Percent |
| Row Pct |
| Col Pct |
|---------------|
Total Observations: 32
----------------------------------------------------------------------------
| | gear |
----------------------------------------------------------------------------
| cyl | 3 | 4 | 5 | Row Total |
----------------------------------------------------------------------------
| 4 | 1 | 8 | 2 | 11 |
| | 0.031 | 0.25 | 0.062 | |
| | 0.09 | 0.73 | 0.18 | 0.34 |
| | 0.07 | 0.67 | 0.4 | |
----------------------------------------------------------------------------
| 6 | 2 | 4 | 1 | 7 |
| | 0.062 | 0.125 | 0.031 | |
| | 0.29 | 0.57 | 0.14 | 0.22 |
| | 0.13 | 0.33 | 0.2 | |
----------------------------------------------------------------------------
| 8 | 12 | 0 | 2 | 14 |
| | 0.375 | 0 | 0.062 | |
| | 0.86 | 0 | 0.14 | 0.44 |
| | 0.8 | 0 | 0.4 | |
----------------------------------------------------------------------------
| Column Total | 15 | 12 | 5 | 32 |
| | 0.468 | 0.375 | 0.155 | |
----------------------------------------------------------------------------
# Two-way table for the same pair of factors. The only output captured below
# is a "Joining, by = ..." message (presumably from a join performed inside
# the function -- confirm); the table itself is not shown in this transcript.
ds_twoway_table(mtcarz, cyl, gear)
Joining, by = c("cyl", "gear", "count")
# Build the cyl x gear cross table once and reuse it for all three charts.
# plot() does not modify k, so recomputing the identical table before each
# call was redundant.
k <- ds_cross_table(mtcarz, cyl, gear)
# Default chart of the cross table.
plot(k)
# Same data drawn with stacked = TRUE.
plot(k, stacked = TRUE)
# Same data drawn with proportional = TRUE.
plot(k, proportional = TRUE)
# Frequency table for a factor column: one row per level of cyl with its
# count, cumulative count, percent and cumulative percent.
ds_freq_table(mtcarz, cyl)
Variable: cyl
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
4 11 11 34.38 34.38
-----------------------------------------------------------------------
6 7 18 21.88 56.25
-----------------------------------------------------------------------
8 14 32 43.75 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
# Keep the factor frequency table as an object (assignment suppresses the
# printed table) and hand it to plot() to draw it.
# NOTE(review): the resulting chart is not captured in this transcript.
k <- ds_freq_table(mtcarz, cyl)
plot(k)
# With no columns named, a frequency table is printed for each factor column
# of mtcarz (cyl, vs, am, gear, carb); the numeric columns are not tabulated.
ds_auto_freq_table(mtcarz)
Variable: cyl
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
4 11 11 34.38 34.38
-----------------------------------------------------------------------
6 7 18 21.88 56.25
-----------------------------------------------------------------------
8 14 32 43.75 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
Variable: vs
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
0 18 18 56.25 56.25
-----------------------------------------------------------------------
1 14 32 43.75 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
Variable: am
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
0 19 19 59.38 59.38
-----------------------------------------------------------------------
1 13 32 40.62 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
Variable: gear
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
3 15 15 46.88 46.88
-----------------------------------------------------------------------
4 12 27 37.5 84.38
-----------------------------------------------------------------------
5 5 32 15.62 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
Variable: carb
-----------------------------------------------------------------------
Levels Frequency Cum Frequency Percent Cum Percent
-----------------------------------------------------------------------
1 7 7 21.88 21.88
-----------------------------------------------------------------------
2 10 17 31.25 53.12
-----------------------------------------------------------------------
3 3 20 9.38 62.5
-----------------------------------------------------------------------
4 10 30 31.25 93.75
-----------------------------------------------------------------------
6 1 31 3.12 96.88
-----------------------------------------------------------------------
8 1 32 3.12 100
-----------------------------------------------------------------------
Total 32 - 100.00 -
-----------------------------------------------------------------------
# Cross tables for every pair of the listed factors, printed in the order
# cyl vs gear, cyl vs am, gear vs am. Cell layout follows the single
# "Cell Contents" legend printed at the top of the output.
ds_auto_cross_table(mtcarz, cyl, gear, am)
Cell Contents
|---------------|
| Frequency |
| Percent |
| Row Pct |
| Col Pct |
|---------------|
Total Observations: 32
cyl vs gear
----------------------------------------------------------------------------
| | gear |
----------------------------------------------------------------------------
| cyl | 3 | 4 | 5 | Row Total |
----------------------------------------------------------------------------
| 4 | 1 | 8 | 2 | 11 |
| | 0.031 | 0.25 | 0.062 | |
| | 0.09 | 0.73 | 0.18 | 0.34 |
| | 0.07 | 0.67 | 0.4 | |
----------------------------------------------------------------------------
| 6 | 2 | 4 | 1 | 7 |
| | 0.062 | 0.125 | 0.031 | |
| | 0.29 | 0.57 | 0.14 | 0.22 |
| | 0.13 | 0.33 | 0.2 | |
----------------------------------------------------------------------------
| 8 | 12 | 0 | 2 | 14 |
| | 0.375 | 0 | 0.062 | |
| | 0.86 | 0 | 0.14 | 0.44 |
| | 0.8 | 0 | 0.4 | |
----------------------------------------------------------------------------
| Column Total | 15 | 12 | 5 | 32 |
| | 0.468 | 0.375 | 0.155 | |
----------------------------------------------------------------------------
cyl vs am
-------------------------------------------------------------
| | am |
-------------------------------------------------------------
| cyl | 0 | 1 | Row Total |
-------------------------------------------------------------
| 4 | 3 | 8 | 11 |
| | 0.094 | 0.25 | |
| | 0.27 | 0.73 | 0.34 |
| | 0.16 | 0.62 | |
-------------------------------------------------------------
| 6 | 4 | 3 | 7 |
| | 0.125 | 0.094 | |
| | 0.57 | 0.43 | 0.22 |
| | 0.21 | 0.23 | |
-------------------------------------------------------------
| 8 | 12 | 2 | 14 |
| | 0.375 | 0.062 | |
| | 0.86 | 0.14 | 0.44 |
| | 0.63 | 0.15 | |
-------------------------------------------------------------
| Column Total | 19 | 13 | 32 |
| | 0.594 | 0.406 | |
-------------------------------------------------------------
gear vs am
-------------------------------------------------------------
| | am |
-------------------------------------------------------------
| gear | 0 | 1 | Row Total |
-------------------------------------------------------------
| 3 | 15 | 0 | 15 |
| | 0.469 | 0 | |
| | 1 | 0 | 0.47 |
| | 0.79 | 0 | |
-------------------------------------------------------------
| 4 | 4 | 8 | 12 |
| | 0.125 | 0.25 | |
| | 0.33 | 0.67 | 0.38 |
| | 0.21 | 0.62 | |
-------------------------------------------------------------
| 5 | 0 | 5 | 5 |
| | 0 | 0.156 | |
| | 0 | 1 | 0.16 |
| | 0 | 0.38 | |
-------------------------------------------------------------
| Column Total | 19 | 13 | 32 |
| | 0.594 | 0.406 | |
-------------------------------------------------------------
# Plot helpers; no charts were captured in this transcript, so the notes here
# are inferred from the function names -- confirm against the descriptr
# reference.
# Presumably scatter plots among the listed numeric columns (mpg, disp, hp).
ds_plot_scatter(mtcarz, mpg, disp, hp)
# Presumably stacked bar plots among the listed factors (cyl, gear, am).
ds_plot_bar_stacked(mtcarz, cyl, gear, am)
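# (Fourteen "NA" placeholder lines followed here in the captured output;
# presumably the positions of plot images that were not exported -- confirm.)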