Gerekli paketleri ve veri setini yükleme

library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(haven)
# Import the SPSS file and strip its variable labels in one step, then
# preview the first rows.
veri <- expss::drop_var_labs(
  read_sav("C:/Users/Salih/Desktop/spss data.sav")
)
head(veri)
## # A tibble: 6 × 7
##     Age    A1    A2    A3    A4    A5    A6
##   <dbl> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
## 1    21     5     5     5     5     5     5
## 2    18     4     3     3     4     4     5
## 3    20     4     4     4     4     4     4
## 4    20     5     2     4     5     5     5
## 5    20     3     4     5     5     3     4
## 6    26     5     4     4     5     4     5
library(DT)
# Interactive table of every column except the first one.
DT::datatable(veri[, -1])

Veri Seti ön inceleme

# Base R summary of every column in veri.
summary(veri)
##       Age              A1              A2              A3       
##  Min.   :17.00   Min.   :1.000   Min.   :1.000   Min.   :1.000  
##  1st Qu.:20.00   1st Qu.:4.000   1st Qu.:4.000   1st Qu.:3.000  
##  Median :22.00   Median :5.000   Median :5.000   Median :4.000  
##  Mean   :25.02   Mean   :4.355   Mean   :4.285   Mean   :4.065  
##  3rd Qu.:29.25   3rd Qu.:5.000   3rd Qu.:5.000   3rd Qu.:5.000  
##  Max.   :44.00   Max.   :5.000   Max.   :5.000   Max.   :5.000  
##        A4              A5             A6       
##  Min.   :2.000   Min.   :1.00   Min.   :1.000  
##  1st Qu.:4.000   1st Qu.:4.00   1st Qu.:4.000  
##  Median :5.000   Median :5.00   Median :5.000  
##  Mean   :4.555   Mean   :4.19   Mean   :4.475  
##  3rd Qu.:5.000   3rd Qu.:5.00   3rd Qu.:5.000  
##  Max.   :5.000   Max.   :5.00   Max.   :5.000

psych

library(psych)
# Descriptive statistics for every column except the first one; the psych::
# prefix pins the call to psych's describe().
psych::describe(veri[, -1])
##    vars   n mean   sd median trimmed  mad min max range  skew kurtosis   se
## A1    1 200 4.36 0.91      5    4.52 0.00   1   5     4 -1.48     1.89 0.06
## A2    2 200 4.28 0.90      5    4.43 0.00   1   5     4 -1.32     1.55 0.06
## A3    3 200 4.07 1.04      4    4.19 1.48   1   5     4 -0.99     0.54 0.07
## A4    4 200 4.56 0.71      5    4.71 0.00   2   5     3 -1.59     2.05 0.05
## A5    5 200 4.19 1.05      5    4.36 0.00   1   5     4 -1.31     1.21 0.07
## A6    6 200 4.47 0.95      5    4.69 0.00   1   5     4 -2.06     3.97 0.07

gtsummary

library(gtsummary)
# Summary table for the columns in positions 2 to 6.
# NOTE(review): positions 2:6 are A1-A5, so A6 is not summarised here, while
# the other tables in this document use veri[,-1] (A1-A6) - confirm intent.
# NOTE(review): the statistic below targets all_continuous() only; the
# rendered table reports n (%) per level, so it looks like the min/max
# template is never applied to these items - confirm.
veri %>% 
  select(2:6) %>%
  tbl_summary(
    statistic = all_continuous() ~ c("{min}, {max}"),
    # Print the "Unknown" (missing) row even when the count is 0.
    missing = "always"
  )
Characteristic N = 2001
A1
    1 3 (1.5%)
    2 6 (3.0%)
    3 23 (12%)
    4 53 (27%)
    5 115 (58%)
    Unknown 0
A2
    1 3 (1.5%)
    2 6 (3.0%)
    3 25 (13%)
    4 63 (32%)
    5 103 (52%)
    Unknown 0
A3
    1 7 (3.5%)
    2 4 (2.0%)
    3 47 (24%)
    4 53 (27%)
    5 89 (45%)
    Unknown 0
A4
    2 4 (2.0%)
    3 14 (7.0%)
    4 49 (25%)
    5 133 (67%)
    Unknown 0
A5
    1 8 (4.0%)
    2 4 (2.0%)
    3 35 (18%)
    4 48 (24%)
    5 105 (53%)
    Unknown 0
1 n (%)

vtable

library(vtable)
## Zorunlu paket yükleniyor: kableExtra
## 
## Attaching package: 'kableExtra'
## The following object is masked from 'package:dplyr':
## 
##     group_rows
library(dplyr)

# Non-missing count, minimum and maximum for every column but the first.
sumtable(
  veri[, -1],
  summ = c("notNA(x)", "min(x)", "max(x)")
)
Summary Statistics
Variable NotNA Min Max
A1 200 1 5
A2 200 1 5
A3 200 1 5
A4 200 2 5
A5 200 1 5
A6 200 1 5
# Count / minimum / maximum table with custom column headers.
st(
  veri[, -1],
  summ = c("notNA(x)", "min(x)", "max(x)"),
  summ.names = c("Frekans", "Minimum", "Maximum")
)
Summary Statistics
Variable Frekans Minimum Maximum
A1 200 1 5
A2 200 1 5
A3 200 1 5
A4 200 2 5
A5 200 1 5
A6 200 1 5
#html dosyası olduğu için buraya alamadım hocam

kable

# R Markdown'da tablo oluşturma

# Render psych's descriptive statistics as a captioned markdown table,
# rounded to two decimals.
kable(
  psych::describe(veri[, -1]),
  format = "markdown",
  caption = "Betimsel İstatistikler",
  digits = 2
)
Betimsel İstatistikler
vars n mean sd median trimmed mad min max range skew kurtosis se
A1 1 200 4.36 0.91 5 4.52 0.00 1 5 4 -1.48 1.89 0.06
A2 2 200 4.28 0.90 5 4.43 0.00 1 5 4 -1.32 1.55 0.06
A3 3 200 4.07 1.04 4 4.19 1.48 1 5 4 -0.99 0.54 0.07
A4 4 200 4.56 0.71 5 4.71 0.00 2 5 3 -1.59 2.05 0.05
A5 5 200 4.19 1.05 5 4.36 0.00 1 5 4 -1.31 1.21 0.07
A6 6 200 4.47 0.95 5 4.69 0.00 1 5 4 -2.06 3.97 0.07

DataExplorer

Otomatik rapor oluşturuyor.

library(DataExplorer)
# Build DataExplorer's automatic profiling report for veri; the log below
# shows it being written out as report.html.
create_report(veri)
## 
## 
## processing file: report.rmd
##   |                                             |                                     |   0%  |                                             |.                                    |   2%                                   |                                             |..                                   |   5% [global_options]                  |                                             |...                                  |   7%                                   |                                             |....                                 |  10% [introduce]                       |                                             |....                                 |  12%                                   |                                             |.....                                |  14% [plot_intro]
##   |                                             |......                               |  17%                                   |                                             |.......                              |  19% [data_structure]                  |                                             |........                             |  21%                                   |                                             |.........                            |  24% [missing_profile]
##   |                                             |..........                           |  26%                                   |                                             |...........                          |  29% [univariate_distribution_header]  |                                             |...........                          |  31%                                   |                                             |............                         |  33% [plot_histogram]
##   |                                             |.............                        |  36%                                   |                                             |..............                       |  38% [plot_density]                    |                                             |...............                      |  40%                                   |                                             |................                     |  43% [plot_frequency_bar]              |                                             |.................                    |  45%                                   |                                             |..................                   |  48% [plot_response_bar]               |                                             |..................                   |  50%                                   |                                             |...................                  |  52% [plot_with_bar]                   |                                             |....................                 |  55%                                   |                                             |.....................                |  57% [plot_normal_qq]
##   |                                             |......................               |  60%                                   |                                             |.......................              |  62% [plot_response_qq]                |                                             |........................             |  64%                                   |                                             |.........................            |  67% [plot_by_qq]                      |                                             |..........................           |  69%                                   |                                             |..........................           |  71% [correlation_analysis]
##   |                                             |...........................          |  74%                                   |                                             |............................         |  76% [principal_component_analysis]
##   |                                             |.............................        |  79%                                   |                                             |..............................       |  81% [bivariate_distribution_header]   |                                             |...............................      |  83%                                   |                                             |................................     |  86% [plot_response_boxplot]           |                                             |.................................    |  88%                                   |                                             |.................................    |  90% [plot_by_boxplot]                 |                                             |..................................   |  93%                                   |                                             |...................................  |  95% [plot_response_scatterplot]       |                                             |.................................... |  98%                                   |                                             |.....................................| 100% [plot_by_scatterplot]           
## output file: C:/Users/Salih/Desktop/report.knit.md
## "C:/Program Files/RStudio/resources/app/bin/quarto/bin/tools/pandoc" +RTS -K512m -RTS "C:\Users\Salih\Desktop\report.knit.md" --to html4 --from markdown+autolink_bare_uris+tex_math_single_backslash --output pandoc7ac43102c22.html --lua-filter "C:\Users\Salih\AppData\Local\R\win-library\4.4\rmarkdown\rmarkdown\lua\pagebreak.lua" --lua-filter "C:\Users\Salih\AppData\Local\R\win-library\4.4\rmarkdown\rmarkdown\lua\latex-div.lua" --embed-resources --standalone --variable bs3=TRUE --section-divs --table-of-contents --toc-depth 6 --template "C:\Users\Salih\AppData\Local\R\win-library\4.4\rmarkdown\rmd\h\default.html" --no-highlight --variable highlightjs=1 --variable theme=yeti --mathjax --variable "mathjax-url=https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML" --include-in-header "C:\Users\Salih\AppData\Local\Temp\RtmpINOj0i\rmarkdown-str7ac21272e34.html"
## 
## Output created: report.html

file:///C:/Users/Salih/Desktop/report.html

funModeling

# veri setindeki eşsiz ve eksik verileri görmeyi sağlar

library(funModeling)
## Zorunlu paket yükleniyor: Hmisc
## Registered S3 methods overwritten by 'Hmisc':
##   method                 from 
##   [.labelled             expss
##   print.labelled         expss
##   as.data.frame.labelled expss
## 
## Attaching package: 'Hmisc'
## The following object is masked from 'package:psych':
## 
##     describe
## The following objects are masked from 'package:dplyr':
## 
##     src, summarize
## The following objects are masked from 'package:base':
## 
##     format.pval, units
## funModeling v.1.9.5 :)
## Examples and tutorials at livebook.datascienceheroes.com
##  / Now in Spanish: librovivodecienciadedatos.ai
# Per-variable counts and shares of zeros, NAs and infinite values, plus the
# column type and number of unique values.
df_status(veri)
##   variable q_zeros p_zeros q_na p_na q_inf p_inf    type unique
## 1      Age       0       0    0    0     0     0 numeric     28
## 2       A1       0       0    0    0     0     0 numeric      5
## 3       A2       0       0    0    0     0     0 numeric      5
## 4       A3       0       0    0    0     0     0 numeric      5
## 5       A4       0       0    0    0     0     0 numeric      4
## 6       A5       0       0    0    0     0     0 numeric      5
## 7       A6       0       0    0    0     0     0 numeric      5

Age değişkeninde 28 tane benzersiz değer var. Veri setinde eksik veri yok.