本文档使用 R Markdown 技术,利用 RStudio 的 Notebook 编写。

knitr::opts_chunk$set(echo=FALSE)

对数据的简单掌握

方法1:使用base包中的基本函数

##   X X1.1 X1.2 X1.3 X1.4 X1.5 X1.6 X1.7 X1.8 X2.1 X2.2 X2.3 X2.4 X2.5 X2.6
## 1 2    1 2004    2    1    2    1    2    1    3    6    4    4    4    6
## 2 3    1 2004   NA    1    2    1    2    2    4    5    6    6    7    5
## 3 4    1 2004    2    2    2    1    2    2    5    7    7    7    7    7
## 4 5    1 2003    1    2    2    1    3    2    4    5    5    5    5    5
## 5 6    2 2004    2    1    2    1    2    1    4    1    7    7    7    7
## 6 7    2 2004    2    1    2    1    2    2    5    5    7    7    7    6
##   X2.7 X2.8 X2.9 X2.10 X2.11 X2.12 X3.1 X3.2 X3.3 X3.4 X3.5 X3.6 X3.7 X3.8
## 1    5    3    7     4     3     5    2    2    3    3    2    2    1    1
## 2    5    7    7     7     7     7    1    1    4    1    3    1    2    2
## 3    5    7    7     7     4     4    3    3    3    3    3    2    2    4
## 4    4    4    5     5     5     5    2    2    4    2    3    1    2    2
## 5    1    2    7     1     4     3    4    3    2    1    1    4    4    3
## 6    7    5    7     7     6     5    2    3    4    2    2    2    3    1
##   X3.9 X3.10 X4.1.1 X4.1.2 X4.1.3 X4.1.4 X4.1.5 X4.1.6 X4.1.7 X4.1.8
## 1    2     3      1      0      0      0      1      1      1      1
## 2    4     4      1      0      0      0      0      0      1      1
## 3    1     2      1      1      1      1      0      0      0      1
## 4    4     4      1      0      0      0      0      0      0      0
## 5    2     1      1      0      1      0      0      0      0      0
## 6    3     3      0      0      1     NA     NA     NA     NA      1
##   X4.1.9 X4.1.10 X4.1.11 X4.1.12 X4.1.13 X4.1.14 X4.1.15 X4.1.16 X4.1.17
## 1      1       1       1       0       0       0       1       1       0
## 2      1       1       0       0       0       0       0       0       0
## 3      1       0       0       1       0       0       1       1       1
## 4      0       0       0       0       0       0       0       0       0
## 5      0       0       1       0       0       0       0       1       0
## 6      1       1       0       0       0       0       0       1       0
##   X4.1.18 X4.1.19 X4.1.20 X4.1.21 X4.1.22 X4.1.23 X4.1.24 X4.1.25 X4.1.26
## 1       0       0       0       0       0       0       0       0       1
## 2       0       0       0       0       0       0       0       0       0
## 3       0       0       1       0       0       0       0       0       1
## 4       0       0       0       1       0       0       0       0       0
## 5       0       0       1       0       0       0       0       1       1
## 6       0       0       0       0       0       0       0       1       0
##   X4.1.27 X4.1.28 X4.1.29 X4.2.1 X4.2.2 X4.2.3 X4.2.4 X4.2.5 X4.2.6 X4.2.7
## 1       0       0       0      2     NA     NA      2      2      3      2
## 2       0       0       0      2      1      1      1      1      1      3
## 3       0       0       0      3      2      1      4     NA     NA     NA
## 4       0       0       0      2     NA     NA     NA     NA     NA     NA
## 5       0       0       0      3     NA      3     NA     NA     NA     NA
## 6       1       0       0      1      1      2      1      1      1      1
##   X4.2.8 X4.2.9 X4.2.10 X4.2.11 X4.2.12 X4.2.13 X4.2.14 X4.2.15 X4.2.16
## 1      3      2       3       3      NA      NA      NA       2       2
## 2      3      3       3       1       1       1       1       1       1
## 3      4      4      NA      NA       2      NA      NA       3       3
## 4     NA     NA      NA      NA      NA      NA      NA      NA      NA
## 5     NA     NA      NA       3      NA      NA      NA      NA       2
## 6      2      2       3       1       1       1       1       1       2
##   X4.2.17 X4.2.18 X4.2.19 X4.2.20 X4.2.21 X4.2.22 X4.2.23 X4.2.24 X4.2.25
## 1      NA      NA      NA      NA      NA      NA      NA      NA      NA
## 2       1       1       1       1       1       1       1       1       1
## 3       4      NA      NA       2      NA      NA      NA      NA      NA
## 4      NA      NA      NA      NA       1      NA      NA      NA      NA
## 5      NA      NA      NA       3      NA      NA      NA      NA       4
## 6       1       1       1       1       1       1       1       1       2
##   X4.2.26 X4.2.27 X4.2.28 X4.2.29 X5.1 X5.2 X5.3 X5.4 X5.5 X5.6 X5.7 X5.8
## 1      NA      NA      NA      NA    5    6    5    4    6    1    1    4
## 2       1       1       1       1    7    2    7    7    1    7    1    7
## 3       4      NA      NA      NA    3    3    6    7    1    5    1    5
## 4      NA      NA      NA      NA    6    2    7    7    1    7    1    7
## 5       4      NA      NA      NA    1    5    7    4    7    3    1    3
## 6       1       2       1       1    3    4    4    5    5    5    2    5
##   X5.9 X5.1.1 X5.11 X5.12 X5.13 X5.14 X5.15 X5.16 X5.17 X5.18 X5.19 X5.20
## 1    6      6     1     1     3     5     7     7     4     7     3     6
## 2    7      7     1     7     7     1     7     7     1     1     1     7
## 3    1      4     5     5     1     3     7     1     3     3     4     3
## 4    6      6     6     6     6     3     6     7     1     1     3     7
## 5    1      3     7     1     3     7     7     1     5     1     4     4
## 6    6      6     1     6     3     2     6     2     3     5     3     5
##       X X1.1 X1.2 X1.3 X1.4 X1.5 X1.6 X1.7 X1.8 X2.1 X2.2 X2.3 X2.4 X2.5
## 452 453    1 2004    1    2    2    1    3    3    6    6    7    7    7
## 453 454    2 2004    1    2    2    1    5    5    4    6    6    6    6
## 454 455    1 2003    1    2    2    1    5    6    6    3    7    7    3
## 455 456    2 2004    1    2    2    1    6    5    7    7    7    7    7
## 456 457    1 2004    1    2    2    1    3    5    5    4    6    5    3
## 457 458    1 2004    1    2    2    1    5    5    3    2    7    7    3
##     X2.6 X2.7 X2.8 X2.9 X2.10 X2.11 X2.12 X3.1 X3.2 X3.3 X3.4 X3.5 X3.6
## 452   NA   NA   NA   NA    NA    NA    NA    1    1  1,3    2    2    2
## 453    6    6    6    5     5     5     7    2    2    3    2    2    3
## 454    6    6    6    6     6     6     6    1    1    3    1    3    1
## 455    7    7    7    7     7     7     7    2    2    3   NA    2    2
## 456    3    4    5    5     2     3     4    1    2    4    1    2    1
## 457    7    2    3    1     1     7    NA    1    2    1    3    4    3
##     X3.7 X3.8 X3.9 X3.10 X4.1.1 X4.1.2 X4.1.3 X4.1.4 X4.1.5 X4.1.6 X4.1.7
## 452    2    1    4     4      0      1      0     NA      0     NA      0
## 453    2    1    3     3      1      2      0      1      1      2      1
## 454    1    1    4     4      1      1      0      1      1      1      0
## 455    2    2    3     3      1      2      0      2      1      2      1
## 456    1    1    3     4      1      3      0      1      1      3      1
## 457    2    1    4     4      1      1      0      1      1      2      0
##     X4.1.8 X4.1.9 X4.1.10 X4.1.11 X4.1.12 X4.1.13 X4.1.14 X4.1.15 X4.1.16
## 452     NA      0      NA       0      NA       0      NA       0      NA
## 453      2      0       1       1       2       1       2       1       3
## 454      1      0       1       0       1       0       1       1       3
## 455      1      0       1       1       1       0       1      NA       2
## 456      2      0       1       0       1       0       1       1       3
## 457      1      0       1       1       4       1       4       1       4
##     X4.1.17 X4.1.18 X4.1.19 X4.1.20 X4.1.21 X4.1.22 X4.1.23 X4.1.24
## 452       0      NA       0      NA       0      NA       0      NA
## 453       1       2       1       2       1       2       0       1
## 454       0      NA       0      NA       0      NA       0      NA
## 455       1       2       0       2       1       1       0       1
## 456       1       2       0       1       1       2       1       2
## 457       1       4       1       4       0       1       0       1
##     X4.1.25 X4.1.26 X4.1.27 X4.1.28 X4.1.29 X4.2.1 X4.2.2 X4.2.3 X4.2.4
## 452       0       1       2       1       3      0      0     NA      0
## 453       0       1       0       1       0      1      1      2      0
## 454       0      NA       0      NA       0     NA      0     NA      0
## 455       0       2       1       2       1      3      1      1      0
## 456       1       2       1       2       0      1      1      2      0
## 457       0       1       0       1       0      1      1      1      0
##     X4.2.5 X4.2.6 X4.2.7 X4.2.8 X4.2.9 X4.2.10 X4.2.11 X4.2.12 X4.2.13
## 452     NA      0     NA      0     NA       0      NA       0      NA
## 453      1      0      1      0      1       0       1       0       1
## 454     NA      0     NA      0     NA       0      NA       0      NA
## 455      1      0      1      1      1       1       1       1       1
## 456      1      0      1      0      1       1       3       0       1
## 457      4      0      1      1      1       0       1       1       1
##     X4.2.14 X4.2.15 X4.2.16 X4.2.17 X4.2.18 X4.2.19 X4.2.20 X4.2.21
## 452       0      NA       0      NA       0      NA       0      NA
## 453       0       1       0       1       0       1       0       1
## 454       0      NA      NA      NA      NA      NA       0      NA
## 455       0       1       0       1       0       1       0       1
## 456       0       1       0       1       0       1       0       1
## 457       0       1       1       1       0       1       0       1
##     X4.2.22 X4.2.23 X4.2.24 X4.2.25 X4.2.26 X4.2.27 X4.2.28 X4.2.29 X5.1
## 452       0      NA       0      NA       0      NA       1       2    6
## 453       1       2       0       1       0       1       0       1    5
## 454       0      NA       0      NA       0      NA       0      NA    7
## 455       1       1       0       1       0       1       0       1    2
## 456       0       1       0       1       0       1       0       1    5
## 457       0       1       0       1       1       4       1       4    7
##     X5.2 X5.3 X5.4 X5.5 X5.6 X5.7 X5.8 X5.9 X5.1.1 X5.11 X5.12 X5.13 X5.14
## 452    4    7    7    1    7    1    5    4      7     1     7     7     2
## 453    3    5   NA   NA   NA   NA   NA   NA     NA    NA    NA     6     2
## 454    4    7    7    5    1    7    7    7      7     1     7     7     1
## 455    5    4    4    4    1    1    5    6      1     3     1     2     6
## 456    5    6    5    5    3    1    5    7      5     4     4     5     5
## 457    1    7    7    1    7    1    1    1      1     7     7     7     7
##     X5.15 X5.16 X5.17 X5.18 X5.19 X5.20
## 452     7     7     2     1     3     6
## 453     6     6     1     1     2     7
## 454     7     7     4     1     1     7
## 455     7     7     3     3     5     4
## 456     2     6     3     5     5     4
## 457     7     7     1     7     1     7

方法2:使用dplyr包

## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
## Observations: 457
## Variables: 109
## $ X       <int> 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17...
## $ X1.1    <int> 1, 1, 1, 1, 2, 2, 2, 2, 1, 1, 1, 2, 1, 2, 2, 1, 1, NA,...
## $ X1.2    <int> 2004, 2004, 2004, 2003, 2004, 2004, 2004, 2004, 2004, ...
## $ X1.3    <int> 2, NA, 2, 1, 2, 2, 2, 1, 2, 1, 2, 2, 2, 2, 2, 1, 2, 2,...
## $ X1.4    <int> 1, 1, 2, 2, 1, 1, 1, 2, 1, 1, 1, 1, 2, 2, 1, 1, 1, 2, ...
## $ X1.5    <int> 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, ...
## $ X1.6    <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, ...
## $ X1.7    <int> 2, 2, 2, 3, 2, 2, 1, 3, 2, 3, 2, 2, 2, 3, 2, 2, 2, 1, ...
## $ X1.8    <int> 1, 2, 2, 2, 1, 2, 1, 3, 2, 3, 1, 2, 2, 2, 2, 1, 1, 2, ...
## $ X2.1    <int> 3, 4, 5, 4, 4, 5, 6, 7, 4, 7, 4, 7, 6, 4, 5, 4, 3, 4, ...
## $ X2.2    <int> 6, 5, 7, 5, 1, 5, 5, 7, 3, 7, 6, 6, 6, 4, 5, 4, 3, 4, ...
## $ X2.3    <int> 4, 6, 7, 5, 7, 7, 4, 7, 4, 7, 6, 7, 7, 4, 5, 4, 7, 5, ...
## $ X2.4    <int> 4, 6, 7, 5, 7, 7, 6, 7, 4, 7, 5, 7, 7, 5, 5, 5, 7, 4, ...
## $ X2.5    <int> 4, 7, 7, 5, 7, 7, 6, 7, 4, 7, 6, 7, 6, 5, 5, 7, 6, 3, ...
## $ X2.6    <int> 6, 5, 7, 5, 7, 6, 7, 5, 4, 7, 5, 6, 5, 5, 5, 7, 7, 4, ...
## $ X2.7    <int> 5, 5, 5, 4, 1, 7, 6, 7, 4, 7, 5, 6, 6, 4, 6, 4, 5, 4, ...
## $ X2.8    <int> 3, 7, 7, 4, 2, 5, 6, 7, 1, 7, 5, 7, 6, 5, 5, 7, 7, 3, ...
## $ X2.9    <int> 7, 7, 7, 5, 7, 7, 6, 7, 1, 7, 6, 6, 6, 4, 6, 7, 7, 4, ...
## $ X2.10   <int> 4, 7, 7, 5, 1, 7, 7, 7, 4, 7, 6, 7, 6, 5, 5, 4, 4, 3, ...
## $ X2.11   <int> 3, 7, 4, 5, 4, 6, 7, 7, 6, 7, 5, 7, 7, 5, 4, 7, 7, 6, ...
## $ X2.12   <int> 5, 7, 4, 5, 3, 5, 7, 7, 1, 7, 6, 5, 6, 6, 6, 4, 6, 4, ...
## $ X3.1    <int> 2, 1, 3, 2, 4, 2, 1, 2, 2, 2, 2, 1, 2, 2, 2, 2, 2, 2, ...
## $ X3.2    <int> 2, 1, 3, 2, 3, 3, 1, 2, 2, 2, 2, 1, 2, 1, 2, 1, 2, 3, ...
## $ X3.3    <fctr> 3, 4, 3, 4, 2, 4, 4, 4, 3, 4, 3, 3, 4, 4, 3, 1, 3, 3,...
## $ X3.4    <int> 3, 1, 3, 2, 1, 2, 1, 1, 2, 2, 2, 1, 1, 1, 2, 2, 2, 2, ...
## $ X3.5    <int> 2, 3, 3, 3, 1, 2, 4, 3, 2, 2, 2, 1, 2, 3, 2, 3, 2, 3, ...
## $ X3.6    <int> 2, 1, 2, 1, 4, 2, 1, 2, 2, 1, 2, 1, 1, 2, 2, 1, 2, 3, ...
## $ X3.7    <int> 1, 2, 2, 2, 4, 3, 1, 1, 2, 1, 3, 1, 1, 1, 2, 4, 2, 2, ...
## $ X3.8    <int> 1, 2, 4, 2, 3, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 3, 3, ...
## $ X3.9    <int> 2, 4, 1, 4, 2, 3, 4, 1, 3, 4, 3, 1, 4, 4, 3, 2, 4, 3, ...
## $ X3.10   <int> 3, 4, 2, 4, 1, 3, 4, 4, 3, 4, 3, 4, 4, 4, 3, 3, 3, 3, ...
## $ X4.1.1  <int> 1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 1, ...
## $ X4.1.2  <int> 0, 0, 1, 0, 0, 0, 0, 0, NA, 0, 0, NA, 3, NA, 2, 3, 1, ...
## $ X4.1.3  <int> 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, ...
## $ X4.1.4  <int> 0, 0, 1, 0, 0, NA, 0, 0, 0, 0, NA, NA, NA, NA, NA, NA,...
## $ X4.1.5  <int> 1, 0, 0, 0, 0, NA, 0, 0, 0, 0, NA, 0, 1, 0, 0, 0, 0, 0...
## $ X4.1.6  <int> 1, 0, 0, 0, 0, NA, 1, 0, 1, 0, NA, NA, 1, NA, 1, NA, N...
## $ X4.1.7  <int> 1, 1, 0, 0, 0, NA, 1, 0, 1, 0, NA, 0, 0, 0, 0, 0, 0, 0...
## $ X4.1.8  <int> 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, NA, NA, NA, 1, NA, NA...
## $ X4.1.9  <int> 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, ...
## $ X4.1.10 <int> 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, NA, NA, NA, 1, NA, NA...
## $ X4.1.11 <int> 1, 0, 0, 0, 1, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 1, 1, 0, ...
## $ X4.1.12 <int> 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, NA, NA, NA, 1, 4, 1, ...
## $ X4.1.13 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, NA,...
## $ X4.1.14 <int> 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, NA, NA, 1, 1, 4, NA, ...
## $ X4.1.15 <int> 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, ...
## $ X4.1.16 <int> 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, NA, 2, 1, 1, 4, 4, NA...
## $ X4.1.17 <int> 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, ...
## $ X4.1.18 <int> 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, NA, 3, NA, 1, NA, NA,...
## $ X4.1.19 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, ...
## $ X4.1.20 <int> 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, NA, 2, 1, 1, NA, 1, N...
## $ X4.1.21 <int> 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, ...
## $ X4.1.22 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, NA, NA, NA, 2, NA, 1,...
## $ X4.1.23 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...
## $ X4.1.24 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, NA, NA, NA, 1, NA, NA...
## $ X4.1.25 <int> 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, ...
## $ X4.1.26 <int> 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, NA, NA, NA, 1, 1, 3, ...
## $ X4.1.27 <int> 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, ...
## $ X4.1.28 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, NA, 2, NA, 1, 4, NA, ...
## $ X4.1.29 <int> 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, ...
## $ X4.2.1  <int> 2, 2, 3, 2, 3, 1, 2, NA, 2, NA, 2, NA, 2, NA, 2, 4, 2,...
## $ X4.2.2  <int> NA, 1, 2, NA, NA, 1, NA, NA, NA, NA, NA, 0, 1, 0, 1, 0...
## $ X4.2.3  <int> NA, 1, 1, NA, 3, 2, 3, NA, 2, 4, 2, NA, 2, NA, 2, NA, ...
## $ X4.2.4  <int> 2, 1, 4, NA, NA, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, 1,...
## $ X4.2.5  <int> 2, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, 1...
## $ X4.2.6  <int> 3, 1, NA, NA, NA, 1, 4, NA, 2, NA, NA, 0, 0, 0, 0, 1, ...
## $ X4.2.7  <int> 2, 3, NA, NA, NA, 1, 4, NA, 2, NA, NA, NA, NA, NA, 1, ...
## $ X4.2.8  <int> 3, 3, 4, NA, NA, 2, 4, 4, 2, 3, 3, 0, 0, 0, 0, 0, 0, 0...
## $ X4.2.9  <int> 2, 3, 4, NA, NA, 2, 3, 2, 2, NA, 3, NA, NA, NA, 1, NA,...
## $ X4.2.10 <int> 3, 3, NA, NA, NA, 3, 4, NA, NA, NA, 3, 0, 0, 0, 0, 1, ...
## $ X4.2.11 <int> 3, 1, NA, NA, 3, 1, 3, NA, 1, 3, 3, NA, NA, NA, 1, 4, ...
## $ X4.2.12 <int> NA, 1, 2, NA, NA, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, 0...
## $ X4.2.13 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, ...
## $ X4.2.14 <int> NA, 1, NA, NA, NA, 1, NA, 2, 1, NA, NA, 0, 0, 0, 0, 0,...
## $ X4.2.15 <int> 2, 1, 3, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, 1,...
## $ X4.2.16 <int> 2, 1, 3, NA, 2, 2, 2, 4, 1, 4, 3, 0, 0, 0, 0, 0, 0, 0,...
## $ X4.2.17 <int> NA, 1, 4, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, 1...
## $ X4.2.18 <int> NA, 1, NA, NA, NA, 1, NA, NA, 1, NA, NA, 0, 0, 0, 0, 0...
## $ X4.2.19 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, 3, 3, NA, NA, NA, 1,...
## $ X4.2.20 <int> NA, 1, 2, NA, 3, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, 0,...
## $ X4.2.21 <int> NA, 1, NA, 1, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, 1...
## $ X4.2.22 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, ...
## $ X4.2.23 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, ...
## $ X4.2.24 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, 0, 0, 0, 1, ...
## $ X4.2.25 <int> NA, 1, NA, NA, 4, 2, NA, 2, NA, NA, 2, NA, NA, NA, 2, ...
## $ X4.2.26 <int> NA, 1, 4, NA, 4, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, 0,...
## $ X4.2.27 <int> NA, 1, NA, NA, NA, 2, NA, 4, 1, NA, 3, NA, NA, NA, 1, ...
## $ X4.2.28 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, 0, 0, 0, 0, ...
## $ X4.2.29 <int> NA, 1, NA, NA, NA, 1, NA, NA, NA, NA, NA, NA, NA, NA, ...
## $ X5.1    <int> 5, 7, 3, 6, 1, 3, 6, 6, 7, 6, 5, 7, 6, 6, 5, 5, 4, 4, ...
## $ X5.2    <int> 6, 2, 3, 2, 5, 4, 1, 1, 2, 1, 3, 1, 1, 3, 5, 3, 1, 5, ...
## $ X5.3    <int> 5, 7, 6, 7, 7, 4, 6, 7, 5, 6, 4, 7, 7, 5, 3, 6, 7, 4, ...
## $ X5.4    <int> 4, 7, 7, 7, 4, 5, 7, 7, 6, 7, 6, 7, 7, 5, 5, 7, 7, 4, ...
## $ X5.5    <int> 6, 1, 1, 1, 7, 5, 2, 2, 4, 1, 4, 1, 1, 3, 5, 3, 1, 5, ...
## $ X5.6    <int> 1, 7, 5, 7, 3, 5, 7, 6, 7, 7, 7, 1, 7, 5, 3, 7, 7, 4, ...
## $ X5.7    <int> 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 2, 1, 1, 2, 1, 1, 3, 3, ...
## $ X5.8    <int> 4, 7, 5, 7, 3, 5, 6, 7, 5, 7, 6, 7, 6, 6, 4, 6, 6, 4, ...
## $ X5.9    <int> 6, 7, 1, 6, 1, 6, 6, 6, 6, 7, 6, 7, 5, 5, 5, 5, 6, 4, ...
## $ X5.1.1  <int> 6, 7, 4, 6, 3, 6, 7, 6, 7, 7, 6, 7, 6, 4, 4, 7, 3, 4, ...
## $ X5.11   <int> 1, 1, 5, 6, 7, 1, 1, 3, 1, 1, 2, 7, 2, 5, 6, 4, 1, 5, ...
## $ X5.12   <int> 1, 7, 5, 6, 1, 6, 7, 6, 7, 6, 6, 7, 6, 3, 3, 6, 6, 4, ...
## $ X5.13   <int> 3, 7, 1, 6, 3, 3, 7, 7, 6, 6, 5, 7, 7, 5, 7, 6, 5, 4, ...
## $ X5.14   <int> 5, 1, 3, 3, 7, 2, 4, 1, 2, 1, 6, 1, 1, 3, 1, 7, 4, 3, ...
## $ X5.15   <int> 7, 7, 7, 6, 7, 6, 7, 7, 6, 7, 7, 7, 7, 6, 6, 7, 6, 1, ...
## $ X5.16   <int> 7, 7, 1, 7, 1, 2, 7, 1, 7, 7, 3, 7, 7, 3, 3, 5, 7, 7, ...
## $ X5.17   <int> 4, 1, 3, 1, 5, 3, 1, 1, 2, 2, 2, 1, 1, 3, 3, 2, 3, 4, ...
## $ X5.18   <int> 7, 1, 3, 1, 1, 5, 1, 1, 2, 1, 2, 1, 1, 2, 4, 1, 7, 2, ...
## $ X5.19   <int> 3, 1, 4, 3, 4, 3, 1, 2, 1, 2, 4, 1, 2, 3, 5, 3, 1, 3, ...
## $ X5.20   <int> 6, 7, 3, 7, 4, 5, 7, 5, 6, 7, 6, 7, 6, 5, 4, 4, 5, 5, ...

描述统计

##        X            X1.1            X1.2           X1.3       
##  Min.   :  2   Min.   :1.000   Min.   :2000   Min.   : 1.000  
##  1st Qu.:116   1st Qu.:1.000   1st Qu.:2003   1st Qu.: 1.000  
##  Median :230   Median :1.000   Median :2003   Median : 1.000  
##  Mean   :230   Mean   :1.492   Mean   :2003   Mean   : 1.491  
##  3rd Qu.:344   3rd Qu.:2.000   3rd Qu.:2004   3rd Qu.: 2.000  
##  Max.   :458   Max.   :2.000   Max.   :2013   Max.   :11.000  
##                NA's   :16      NA's   :13     NA's   :19      
##       X1.4      
##  Min.   :1.000  
##  1st Qu.:1.000  
##  Median :2.000  
##  Mean   :1.644  
##  3rd Qu.:2.000  
##  Max.   :2.000  
##  NA's   :16
##      vars   n    mean     sd median trimmed    mad  min  max range  skew
## X       1 457  230.00 132.07    230  230.00 169.02    2  458   456  0.00
## X1.1    2 441    1.49   0.50      1    1.49   0.00    1    2     1  0.03
## X1.2    3 444 2003.20   1.02   2003 2003.22   1.48 2000 2013    13  3.12
## X1.3    4 438    1.49   0.68      1    1.46   0.00    1   11    10  6.36
## X1.4    5 441    1.64   0.48      2    1.68   0.00    1    2     1 -0.60
##      kurtosis   se
## X       -1.21 6.18
## X1.1    -2.00 0.02
## X1.2    29.32 0.05
## X1.3    86.90 0.03
## X1.4    -1.64 0.02

简单可视化

## 
## Attaching package: 'ggplot2'
## The following objects are masked from 'package:psych':
## 
##     %+%, alpha
## `stat_bin()` using `bins = 30`. Pick better value with `binwidth`.
## Warning: Removed 17 rows containing non-finite values (stat_bin).

## `stat_bin()` using `bins = 30`. Pick better value with `binwidth`.
## Warning: Removed 17 rows containing non-finite values (stat_bin).

## Warning: Removed 17 rows containing non-finite values (stat_count).

## Warning: Removed 17 rows containing non-finite values (stat_count).

文件操作

使用dplyr包中的五个函数:select, filter, mutate, summarize, group_by。管道操作符 %>%:可以将上一个运算得到的结果直接传递给下一个函数的第一个参数。

##   X1.1
## 1    1
## 2    1
## 3    1
## 4    1
## 5    2
## 6    2
##   X1.1 X1.2 X1.3 X1.4 X1.5 X1.6 X1.7 X1.8
## 1    1 2004    2    1    2    1    2    1
## 2    1 2004   NA    1    2    1    2    2
## 3    1 2004    2    2    2    1    2    2
## 4    1 2003    1    2    2    1    3    2
## 5    2 2004    2    1    2    1    2    1
## 6    2 2004    2    1    2    1    2    2
##   X1.1 X2.1 X3.1 X4.1.1 X4.2.1 X5.1 X5.1.1
## 1    1    3    2      1      2    5      6
## 2    1    4    1      1      2    7      7
## 3    1    5    3      1      3    3      4
## 4    1    4    2      1      2    6      6
## 5    2    4    4      1      3    1      3
## 6    2    5    2      0      1    3      6
##   X4.1.1 X4.1.2 X4.1.3 X4.1.4 X4.1.5 X4.1.6 X4.1.7 X4.1.8 X4.1.9 X4.1.10
## 1      1      0      0      0      1      1      1      1      1       1
## 2      1      0      0      0      0      0      1      1      1       1
## 3      1      1      1      1      0      0      0      1      1       0
## 4      1      0      0      0      0      0      0      0      0       0
## 5      1      0      1      0      0      0      0      0      0       0
## 6      0      0      1     NA     NA     NA     NA      1      1       1
##   X4.1.11 X4.1.12 X4.1.13 X4.1.14 X4.1.15 X4.1.16 X4.1.17 X4.1.18 X4.1.19
## 1       1       0       0       0       1       1       0       0       0
## 2       0       0       0       0       0       0       0       0       0
## 3       0       1       0       0       1       1       1       0       0
## 4       0       0       0       0       0       0       0       0       0
## 5       1       0       0       0       0       1       0       0       0
## 6       0       0       0       0       0       1       0       0       0
##   X4.1.20 X4.1.21 X4.1.22 X4.1.23 X4.1.24 X4.1.25 X4.1.26 X4.1.27 X4.1.28
## 1       0       0       0       0       0       0       1       0       0
## 2       0       0       0       0       0       0       0       0       0
## 3       1       0       0       0       0       0       1       0       0
## 4       0       1       0       0       0       0       0       0       0
## 5       1       0       0       0       0       1       1       0       0
## 6       0       0       0       0       0       1       0       1       0
##   X4.1.29 X5.1.1
## 1       0      6
## 2       0      7
## 3       0      4
## 4       0      6
## 5       0      3
## 6       0      6
##    X X1.1 X1.2 X1.3 X1.4 X1.5 X1.6 X1.7 X1.8 X2.1 X2.2 X2.3 X2.4 X2.5 X2.6
## 1  6    2 2004    2    1    2    1    2    1    4    1    7    7    7    7
## 2  7    2 2004    2    1    2    1    2    2    5    5    7    7    7    6
## 3  8    2 2004    2    1    2    1    1    1    6    5    4    6    6    7
## 4  9    2 2004    1    2    2    1    3    3    7    7    7    7    7    5
## 5 13    2 2003    2    1    2    2    2    2    7    6    7    7    7    6
## 6 15    2 2002    2    2    2    2    3    2    4    4    4    5    5    5
##   X2.7 X2.8 X2.9 X2.10 X2.11 X2.12 X3.1 X3.2 X3.3 X3.4 X3.5 X3.6 X3.7 X3.8
## 1    1    2    7     1     4     3    4    3    2    1    1    4    4    3
## 2    7    5    7     7     6     5    2    3    4    2    2    2    3    1
## 3    6    6    6     7     7     7    1    1    4    1    4    1    1    1
## 4    7    7    7     7     7     7    2    2    4    1    3    2    1    1
## 5    6    7    6     7     7     5    1    1    3    1    1    1    1    1
## 6    4    5    4     5     5     6    2    1    4    1    3    2    1    1
##   X3.9 X3.10 X4.1.1 X4.1.2 X4.1.3 X4.1.4 X4.1.5 X4.1.6 X4.1.7 X4.1.8
## 1    2     1      1      0      1      0      0      0      0      0
## 2    3     3      0      0      1     NA     NA     NA     NA      1
## 3    4     4      1      0      1      0      0      1      1      1
## 4    1     4      0      0      0      0      0      0      0      1
## 5    1     4      0     NA      0     NA      0     NA      0     NA
## 6    4     4      0     NA      0     NA      0     NA      0     NA
##   X4.1.9 X4.1.10 X4.1.11 X4.1.12 X4.1.13 X4.1.14 X4.1.15 X4.1.16 X4.1.17
## 1      0       0       1       0       0       0       0       1       0
## 2      1       1       0       0       0       0       0       1       0
## 3      1       1       1       0       0       0       0       1       0
## 4      1       0       0       0       0       1       0       1       0
## 5      0      NA       0      NA       0      NA       0      NA       0
## 6      0      NA       0      NA       1       1       1       1       0
##   X4.1.18 X4.1.19 X4.1.20 X4.1.21 X4.1.22 X4.1.23 X4.1.24 X4.1.25 X4.1.26
## 1       0       0       1       0       0       0       0       1       1
## 2       0       0       0       0       0       0       0       1       0
## 3       0       0       0       0       0       0       0       0       0
## 4       0       0       0       0       0       0       0       1       0
## 5      NA       0      NA       0      NA       0      NA       0      NA
## 6      NA       1       1       0      NA       0      NA       0      NA
##   X4.1.27 X4.1.28 X4.1.29 X4.2.1 X4.2.2 X4.2.3 X4.2.4 X4.2.5 X4.2.6 X4.2.7
## 1       0       0       0      3     NA      3     NA     NA     NA     NA
## 2       1       0       0      1      1      2      1      1      1      1
## 3       0       0       0      2     NA      3     NA     NA      4      4
## 4       1       0       0     NA     NA     NA     NA     NA     NA     NA
## 5       0      NA       0     NA      0     NA      0     NA      0     NA
## 6       0      NA       0     NA      0     NA      0     NA      0     NA
##   X4.2.8 X4.2.9 X4.2.10 X4.2.11 X4.2.12 X4.2.13 X4.2.14 X4.2.15 X4.2.16
## 1     NA     NA      NA       3      NA      NA      NA      NA       2
## 2      2      2       3       1       1       1       1       1       2
## 3      4      3       4       3      NA      NA      NA      NA       2
## 4      4      2      NA      NA      NA      NA       2      NA       4
## 5      0     NA       0      NA       0      NA       0      NA       0
## 6      0     NA       0      NA       0      NA       0      NA       0
##   X4.2.17 X4.2.18 X4.2.19 X4.2.20 X4.2.21 X4.2.22 X4.2.23 X4.2.24 X4.2.25
## 1      NA      NA      NA       3      NA      NA      NA      NA       4
## 2       1       1       1       1       1       1       1       1       2
## 3      NA      NA      NA      NA      NA      NA      NA      NA      NA
## 4      NA      NA      NA      NA      NA      NA      NA      NA       2
## 5      NA       0      NA       0      NA       0      NA       0      NA
## 6      NA       0      NA       0      NA       0      NA       0      NA
##   X4.2.26 X4.2.27 X4.2.28 X4.2.29 X5.1 X5.2 X5.3 X5.4 X5.5 X5.6 X5.7 X5.8
## 1       4      NA      NA      NA    1    5    7    4    7    3    1    3
## 2       1       2       1       1    3    4    4    5    5    5    2    5
## 3      NA      NA      NA      NA    6    1    6    7    2    7    1    6
## 4      NA       4      NA      NA    6    1    7    7    2    6    1    7
## 5       0      NA       0      NA    7    1    7    7    1    1    1    7
## 6       0      NA       0      NA    6    3    5    5    3    5    2    6
##   X5.9 X5.1.1 X5.11 X5.12 X5.13 X5.14 X5.15 X5.16 X5.17 X5.18 X5.19 X5.20
## 1    1      3     7     1     3     7     7     1     5     1     4     4
## 2    6      6     1     6     3     2     6     2     3     5     3     5
## 3    6      7     1     7     7     4     7     7     1     1     1     7
## 4    6      6     3     6     7     1     7     1     1     1     2     5
## 5    7      7     7     7     7     1     7     7     1     1     1     7
## 6    5      4     5     3     5     3     6     3     3     2     3     5
##   X X1.1 X1.2 X1.3 X1.4 X1.5 X1.6 X1.7 X1.8 X2.1 X2.2 X2.3 X2.4 X2.5 X2.6
## 1 2    1 2004    2    1    2    1    2    1    3    6    4    4    4    6
## 2 3    1 2004   NA    1    2    1    2    2    4    5    6    6    7    5
## 3 4    1 2004    2    2    2    1    2    2    5    7    7    7    7    7
## 4 5    1 2003    1    2    2    1    3    2    4    5    5    5    5    5
## 5 6    2 2004    2    1    2    1    2    1    4    1    7    7    7    7
## 6 7    2 2004    2    1    2    1    2    2    5    5    7    7    7    6
##   X2.7 X2.8 X2.9 X2.10 X2.11 X2.12 X3.1 X3.2 X3.3 X3.4 X3.5 X3.6 X3.7 X3.8
## 1    5    3    7     4     3     5    2    2    3    3    2    2    1    1
## 2    5    7    7     7     7     7    1    1    4    1    3    1    2    2
## 3    5    7    7     7     4     4    3    3    3    3    3    2    2    4
## 4    4    4    5     5     5     5    2    2    4    2    3    1    2    2
## 5    1    2    7     1     4     3    4    3    2    1    1    4    4    3
## 6    7    5    7     7     6     5    2    3    4    2    2    2    3    1
##   X3.9 X3.10 X4.1.1 X4.1.2 X4.1.3 X4.1.4 X4.1.5 X4.1.6 X4.1.7 X4.1.8
## 1    2     3      1      0      0      0      1      1      1      1
## 2    4     4      1      0      0      0      0      0      1      1
## 3    1     2      1      1      1      1      0      0      0      1
## 4    4     4      1      0      0      0      0      0      0      0
## 5    2     1      1      0      1      0      0      0      0      0
## 6    3     3      0      0      1     NA     NA     NA     NA      1
##   X4.1.9 X4.1.10 X4.1.11 X4.1.12 X4.1.13 X4.1.14 X4.1.15 X4.1.16 X4.1.17
## 1      1       1       1       0       0       0       1       1       0
## 2      1       1       0       0       0       0       0       0       0
## 3      1       0       0       1       0       0       1       1       1
## 4      0       0       0       0       0       0       0       0       0
## 5      0       0       1       0       0       0       0       1       0
## 6      1       1       0       0       0       0       0       1       0
##   X4.1.18 X4.1.19 X4.1.20 X4.1.21 X4.1.22 X4.1.23 X4.1.24 X4.1.25 X4.1.26
## 1       0       0       0       0       0       0       0       0       1
## 2       0       0       0       0       0       0       0       0       0
## 3       0       0       1       0       0       0       0       0       1
## 4       0       0       0       1       0       0       0       0       0
## 5       0       0       1       0       0       0       0       1       1
## 6       0       0       0       0       0       0       0       1       0
##   X4.1.27 X4.1.28 X4.1.29 X4.2.1 X4.2.2 X4.2.3 X4.2.4 X4.2.5 X4.2.6 X4.2.7
## 1       0       0       0      2     NA     NA      2      2      3      2
## 2       0       0       0      2      1      1      1      1      1      3
## 3       0       0       0      3      2      1      4     NA     NA     NA
## 4       0       0       0      2     NA     NA     NA     NA     NA     NA
## 5       0       0       0      3     NA      3     NA     NA     NA     NA
## 6       1       0       0      1      1      2      1      1      1      1
##   X4.2.8 X4.2.9 X4.2.10 X4.2.11 X4.2.12 X4.2.13 X4.2.14 X4.2.15 X4.2.16
## 1      3      2       3       3      NA      NA      NA       2       2
## 2      3      3       3       1       1       1       1       1       1
## 3      4      4      NA      NA       2      NA      NA       3       3
## 4     NA     NA      NA      NA      NA      NA      NA      NA      NA
## 5     NA     NA      NA       3      NA      NA      NA      NA       2
## 6      2      2       3       1       1       1       1       1       2
##   X4.2.17 X4.2.18 X4.2.19 X4.2.20 X4.2.21 X4.2.22 X4.2.23 X4.2.24 X4.2.25
## 1      NA      NA      NA      NA      NA      NA      NA      NA      NA
## 2       1       1       1       1       1       1       1       1       1
## 3       4      NA      NA       2      NA      NA      NA      NA      NA
## 4      NA      NA      NA      NA       1      NA      NA      NA      NA
## 5      NA      NA      NA       3      NA      NA      NA      NA       4
## 6       1       1       1       1       1       1       1       1       2
##   X4.2.26 X4.2.27 X4.2.28 X4.2.29 X5.1 X5.2 X5.3 X5.4 X5.5 X5.6 X5.7 X5.8
## 1      NA      NA      NA      NA    5    6    5    4    6    1    1    4
## 2       1       1       1       1    7    2    7    7    1    7    1    7
## 3       4      NA      NA      NA    3    3    6    7    1    5    1    5
## 4      NA      NA      NA      NA    6    2    7    7    1    7    1    7
## 5       4      NA      NA      NA    1    5    7    4    7    3    1    3
## 6       1       2       1       1    3    4    4    5    5    5    2    5
##   X5.9 X5.1.1 X5.11 X5.12 X5.13 X5.14 X5.15 X5.16 X5.17 X5.18 X5.19 X5.20
## 1    6      6     1     1     3     5     7     7     4     7     3     6
## 2    7      7     1     7     7     1     7     7     1     1     1     7
## 3    1      4     5     5     1     3     7     1     3     3     4     3
## 4    6      6     6     6     6     3     6     7     1     1     3     7
## 5    1      3     7     1     3     7     7     1     5     1     4     4
## 6    6      6     1     6     3     2     6     2     3     5     3     5
##   X1.9
## 1    3
## 2   NA
## 3    3
## 4    2
## 5    4
## 6    4
## # A tibble: 3 × 3
##    X1.1     mean   sum
##   <int>    <dbl> <int>
## 1     1 5.608108  1134
## 2     2 5.246512  1111
## 3    NA 5.500000    NA

假设检验

t检验

## 
##  Welch Two Sample t-test
## 
## data:  t1$X5.20 and t2$X5.20
## t = 1.0771, df = 272.38, p-value = 0.2824
## alternative hypothesis: true difference in means is not equal to 0
## 95 percent confidence interval:
##  -0.2993101  1.0225030
## sample estimates:
## mean of x mean of y 
##  5.608108  5.246512
## 
##  Paired t-test
## 
## data:  t1$X5.20 and t1$X5.18
## t = 7.9961, df = 221, p-value = 7.123e-14
## alternative hypothesis: true difference in means is not equal to 0
## 95 percent confidence interval:
##  2.230060 3.688859
## sample estimates:
## mean of the differences 
##                2.959459

方差分析

##              Df Sum Sq Mean Sq F value Pr(>F)  
## X1.1          1   13.4  13.423   3.837 0.0508 .
## X1.3          1    5.0   5.004   1.431 0.2323  
## X1.1:X1.3     1    0.4   0.372   0.106 0.7445  
## Residuals   429 1500.7   3.498                 
## ---
## Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
## 24 observations deleted due to missingness
## % latex table generated in R 3.3.2 by xtable 1.8-2 package
## % Fri Dec 16 18:17:44 2016
## \begin{table}[ht]
## \centering
## \begin{tabular}{lrrrrr}
##   \hline
##  & Df & Sum Sq & Mean Sq & F value & Pr($>$F) \\ 
##   \hline
## X1.1 & 1 & 13.42 & 13.42 & 3.84 & 0.0508 \\ 
##   X1.3 & 1 & 5.00 & 5.00 & 1.43 & 0.2323 \\ 
##   X1.1:X1.3 & 1 & 0.37 & 0.37 & 0.11 & 0.7445 \\ 
##   Residuals & 429 & 1500.72 & 3.50 &  &  \\ 
##    \hline
## \end{tabular}
## \end{table}

卡方检验

##    
##      1  2  3  4  5  6  7
##   1 19 13 25 30 40 36 60
##   2 23 11 23 43 54 30 33
## 
##  Pearson's Chi-squared test
## 
## data:  table(totalTable$X1.1, totalTable$X5.1)
## X-squared = 13.336, df = 6, p-value = 0.038