This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.

Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Ctrl+Shift+Enter.

plot(cars)

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Ctrl+Alt+I.

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Ctrl+Shift+K to preview the HTML file).

Chapter 1 to 3: You can do arithmetic and use # for comments

2*2
[1] 4
2+2
[1] 4
x <-c(1:10)
x
 [1]  1  2  3  4  5  6  7  8  9 10
# doing complicated math examples 
10^2+3*60/8-3
[1] 119.5
5^3*(6-2)/(61-3+4)
[1] 8.064516
2^(2+1)-4+64^((-2)^(2.25-1/4))
[1] 16777220
# Logarithms 
log(x=243,base=3)
[1] 5
# Exponentials
exp(x=3)
[1] 20.08554
log(x=20.08554)
[1] 3

Lesson 2: Assigning objects and Vectors

# you can use either <- or = sign
x <-3
y =3
x+y
[1] 6
myvec <- c(1,2,1,42)
myvec
[1]  1  2  1 42
# Then create a second vector
myvec2 <- c(2,3,4,5)
myvec2
[1] 2 3 4 5
# now create a third vector by appending both myvec and myvec2 together
myvec3 <-c(myvec,myvec2)
myvec3
[1]  1  2  1 42  2  3  4  5
# creating sequences with the : colon 
3:27
 [1]  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
foo <- 5.3
bar <-foo:(-47+1.5)
bar
 [1]   5.3   4.3   3.3   2.3   1.3   0.3  -0.7  -1.7  -2.7  -3.7  -4.7  -5.7  -6.7  -7.7  -8.7  -9.7 -10.7 -11.7
[19] -12.7 -13.7 -14.7 -15.7 -16.7 -17.7 -18.7 -19.7 -20.7 -21.7 -22.7 -23.7 -24.7 -25.7 -26.7 -27.7 -28.7 -29.7
[37] -30.7 -31.7 -32.7 -33.7 -34.7 -35.7 -36.7 -37.7 -38.7 -39.7 -40.7 -41.7 -42.7 -43.7 -44.7
# we can also use the seq command which provides more options
seq(from=3, to=27, by=4)
[1]  3  7 11 15 19 23 27
# instead of by you can also use length.out
seq(from=3, to=27, length.out = 40)
 [1]  3.000000  3.615385  4.230769  4.846154  5.461538  6.076923  6.692308  7.307692  7.923077  8.538462  9.153846
[12]  9.769231 10.384615 11.000000 11.615385 12.230769 12.846154 13.461538 14.076923 14.692308 15.307692 15.923077
[23] 16.538462 17.153846 17.769231 18.384615 19.000000 19.615385 20.230769 20.846154 21.461538 22.076923 22.692308
[34] 23.307692 23.923077 24.538462 25.153846 25.769231 26.384615 27.000000
# Repetition with rep command
rep(x=1,times=4)
[1] 1 1 1 1
rep(x=c(3,62,8.3), times=3)
[1]  3.0 62.0  8.3  3.0 62.0  8.3  3.0 62.0  8.3
rep(x=c(3,62,8.3), each=2)
[1]  3.0  3.0 62.0 62.0  8.3  8.3
rep(x=c(3,62,8.3),times=3, each=2)
 [1]  3.0  3.0 62.0 62.0  8.3  8.3  3.0  3.0 62.0 62.0  8.3  8.3  3.0  3.0 62.0 62.0  8.3  8.3
# sort function
sort(x=c(2.5,-1,-10, 3.44),decreasing = FALSE)
[1] -10.00  -1.00   2.50   3.44
sort(x=c(2.5,-1,-10, 3.44),decreasing = TRUE)
[1]   3.44   2.50  -1.00 -10.00
# finding the length of a vector with length()
length(x=c(2.5,-1,-10, 3.44))
[1] 4
length(x=5:13)
[1] 9
# Subsetting or how to address specific elements of an array
myvec3
[1]  1  2  1 42  2  3  4  5
length(myvec3)
[1] 8
myvec3[4]
[1] 42
myvec3[5]
[1] 2
myvec3[4]+myvec3[5]
[1] 44
# Vector-Oriented behavior
foo <-5.5:0.5
foo
[1] 5.5 4.5 3.5 2.5 1.5 0.5
foo-c(2,4,6,8,10,12)
[1]   3.5   0.5  -2.5  -5.5  -8.5 -11.5
# why vectors? Because operations are applied to every element at once, e.g. adding 3 to each element
qux <-3
foo+qux
[1] 8.5 7.5 6.5 5.5 4.5 3.5
sum(foo)
[1] 18
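# Vector-oriented behavior also applies when operating on several selected elements:
# the shorter vector c(-99,99) is recycled across the four selected elements (no assignment happens here)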
foo
[1] 5.5 4.5 3.5 2.5 1.5 0.5
foo[c(1,3,5,6)]-c(-99,99)
[1] 104.5 -95.5 100.5 -98.5
# from vectors to Matrix (2D) to Arrays (xD)
# use matrix command to create matrix
A <-matrix(data=c(1,2,3,4),nrow=2, ncol = 2)
A
     [,1] [,2]
[1,]    1    3
[2,]    2    4
# you can fill a matrix by row or by column using byrow = TRUE or byrow = FALSE
A <- matrix(data = c(1,2,3,4,5,6),nrow = 2, ncol = 3,byrow = FALSE)
A
     [,1] [,2] [,3]
[1,]    1    3    5
[2,]    2    4    6
B <- matrix(data = c(1,2,3,4,5,6),nrow = 2, ncol = 3,byrow = TRUE)
B
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
# you can also use rbind and cbind to create a matrix
# rbind creates by row
# cbind creates by column
A <-rbind(1:3,4:6)
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
B <-cbind(1:3,4:6)
B
     [,1] [,2]
[1,]    1    4
[2,]    2    5
[3,]    3    6
# then get its dimensions using the dim command
dim(A)
[1] 2 3
dim(B)
[1] 3 2
# you can also refer to each subelement by the [] notation
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
nrow(A)
[1] 2
ncol(A)
[1] 3
dim(A)[2]
[1] 3
# subsetting of a matrix using []
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
A[1,2]
[1] 2
# to extract an entire column
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
A[,2]
[1] 2 5
# to extract an entire row
A[1,]
[1] 1 2 3
# you can also extract multiple rows or columns
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
A[1:2,]
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
A[,1:2]
     [,1] [,2]
[1,]    1    2
[2,]    4    5
# you can omit rows and columns in matrix by using the negative sign
A
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
A[,-2]
     [,1] [,2]
[1,]    1    3
[2,]    4    6

To overwrite particular elements, or entire rows or columns, you identify the elements to be replaced and then assign the new values, as you did with vectors.

The new elements can be a single value, a vector of the same length, or a vector whose length evenly divides the number of elements to be replaced.

# copy matrix A to B
B <- A
B
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    4    5    6
# overwrite the 2nd row of B with the sequence 1,2,3
B[2,]<-1:3
B
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    1    2    3
# overwrite the 2nd-column element of every row except the 2nd with 900 (B has only two rows, so only row 1 changes)
B
     [,1] [,2] [,3]
[1,]    1    2    3
[2,]    1    2    3
B[-2,2]<-900
B
     [,1] [,2] [,3]
[1,]    1  900    3
[2,]    1    2    3

Matrix Operations and Algebra

# Matrix Transpose
A<-rbind(c(2,5,2),c(6,1,4))
A
     [,1] [,2] [,3]
[1,]    2    5    2
[2,]    6    1    4
t(A)
     [,1] [,2]
[1,]    2    6
[2,]    5    1
[3,]    2    4

Identity Matrix is a square matrix mxm with ones on the diagonal and zeros elsewhere. A quick way to generate an identity matrix is with the use of the diag() command

A <- diag(x=3)
A
     [,1] [,2] [,3]
[1,]    1    0    0
[2,]    0    1    0
[3,]    0    0    1

Scalar Multiplication of a Matrix: multiplying any matrix A by a scalar value (a) results in a matrix in which every individual element is multiplied by (a).

A <-rbind(c(2,5,2),c(6,1,4))
A
     [,1] [,2] [,3]
[1,]    2    5    2
[2,]    6    1    4
a<-2
a*A
     [,1] [,2] [,3]
[1,]    4   10    4
[2,]   12    2    8

Matrix Addition and Subtraction: addition and subtraction of any two matrices of the SAME size are also performed in an element-wise fashion.

A <-rbind(c(2,5,2),c(6,1,4))
A
     [,1] [,2] [,3]
[1,]    2    5    2
[2,]    6    1    4
B <- rbind(c(-2,3,6),c(8.1,8.2,-9.8))
B
     [,1] [,2] [,3]
[1,] -2.0  3.0  6.0
[2,]  8.1  8.2 -9.8
A-B
     [,1] [,2] [,3]
[1,]  4.0  2.0 -4.0
[2,] -2.1 -7.2 13.8

Matrix Multiplication: in order to multiply two matrices of sizes (m x n) and (p x q), n must be equal to p; the result is an (m x q) matrix.

A <-rbind(c(2,5,2),c(6,1,4))
dim(A)
[1] 2 3
B <-cbind(c(3,-1,1),c(-3,1,5))
dim(B)
[1] 3 2
A
     [,1] [,2] [,3]
[1,]    2    5    2
[2,]    6    1    4
B
     [,1] [,2]
[1,]    3   -3
[2,]   -1    1
[3,]    1    5
A %*% B
     [,1] [,2]
[1,]    3    9
[2,]   21    3

Matrix multiplication is non-commutative. Reversing the order will give different results:

B %*% A
     [,1] [,2] [,3]
[1,]  -12   12   -6
[2,]    4   -4    2
[3,]   32   10   22

Chapter 4: Non-Numeric Values. Logical values are TRUE (1) or FALSE (0). Because they are treated as 1 and 0 in arithmetic, logical values can be added and subtracted:

TRUE+TRUE
[1] 2
FALSE-TRUE
[1] -1

Relational operators: ==, !=, >, <, >=, <=. Logical operators for combining multiple comparisons: &, |, !

Concatenating and printing strings with the cat() function

qux <-c("awesome","R","is")
length(x=qux)
[1] 3
qux
[1] "awesome" "R"       "is"     
cat(qux[2],qux[3],"totally",qux[1],"!")
R is totally awesome !

Extracting a substring with the substr() function

foo <-"This is a character string!"
substr(x=foo,start=21, stop=27)
[1] "string!"

Factors are R’s way of representing data points that fit in only one of a finite number of distinct categories (for example, nominal values such as sex = male or female).

sex.char <-c("Male","Female","Male","Female")
sex.char
[1] "Male"   "Female" "Male"   "Female"
sex.char.fac<-factor(x=sex.char)
sex.char.fac
[1] Male   Female Male   Female
Levels: Female Male
