svm

We will use the linear svm classifier to predict the suv buyer dataset using 1. linear kernel, 2. gussian kernel, 3. polynomial kernel, 4. sigmoid kernel

We will use Social Network dataset #### Importing the dataset

dataset = read.csv('Social_Network_Ads.csv')
dataset = dataset[3:5]

Encoding the target feature as factor

dataset$Purchased = factor(dataset$Purchased, levels = c(0, 1))

Splitting the dataset into the Training set and Test set

install.packages(‘caTools’)

library(caTools)

## Warning: package 'caTools' was built under R version 3.4.2

set.seed(123)
split = sample.split(dataset$Purchased, SplitRatio = 0.75)
training_set = subset(dataset, split == TRUE)
test_set = subset(dataset, split == FALSE)
library(e1071)

## Warning: package 'e1071' was built under R version 3.4.2

Feature Scaling

training_set[-3] = scale(training_set[-3])
test_set[-3] = scale(test_set[-3])

Fitting classifier to the Training set

Create your classifier here

classifier=svm(formula= Purchased ~., data=training_set, 
               type="C-classification", kernel="linear" )
y_pred = predict(classifier,newdata=test_set[-3])

Making the Confusion Matrix

cm = table(test_set[, 3], y_pred)

1. Visualising the Training set results with linear kernel

library(ElemStatLearn)

## Warning: package 'ElemStatLearn' was built under R version 3.4.2

set = training_set
X1 = seq(min(set[, 1]) - 1, max(set[, 1]) + 1, by = 0.01)
X2 = seq(min(set[, 2]) - 1, max(set[, 2]) + 1, by = 0.01)
grid_set = expand.grid(X1, X2)
colnames(grid_set) = c('Age', 'EstimatedSalary')
y_grid = predict(classifier,newdata=grid_set)
plot(set[, -3],
     main = 'SVM (Training set)',
     xlab = 'Age', ylab = 'Estimated Salary',
     xlim = range(X1), ylim = range(X2))
contour(X1, X2, matrix(as.numeric(y_grid), length(X1), length(X2)), add = TRUE)
points(grid_set, pch = '.', col = ifelse(y_grid == 1, 'springgreen3', 'tomato'))
points(set, pch = 21, bg = ifelse(set[, 3] == 1, 'green4', 'red3'))

2. Visiulising the training set with gussian kernel

classifier1=svm(formula= Purchased ~., data=training_set, 
               type="C-classification", kernel="radial" )
y_pred1 = predict(classifier1,newdata=test_set[-3])

Making the Confusion Matrix

cm = table(test_set[, 3], y_pred1)

library(ElemStatLearn)
set = training_set
X1 = seq(min(set[, 1]) - 1, max(set[, 1]) + 1, by = 0.01)
X2 = seq(min(set[, 2]) - 1, max(set[, 2]) + 1, by = 0.01)
grid_set = expand.grid(X1, X2)
colnames(grid_set) = c('Age', 'EstimatedSalary')
y_grid = predict(classifier1,newdata=grid_set)
plot(set[, -3],
     main = 'SVM (Training set)',
     xlab = 'Age', ylab = 'Estimated Salary',
     xlim = range(X1), ylim = range(X2))
contour(X1, X2, matrix(as.numeric(y_grid), length(X1), length(X2)), add = TRUE)
points(grid_set, pch = '.', col = ifelse(y_grid == 1, 'springgreen3', 'tomato'))
points(set, pch = 21, bg = ifelse(set[, 3] == 1, 'green3', 'red2'))

####3. Visiulising the training set with polynomial kernel

classifier2=svm(formula= Purchased ~., data=training_set, 
               type="C-classification", kernel="poly" )
y_pred2 = predict(classifier2,newdata=test_set[-3])

Making the Confusion Matrix

cm = table(test_set[, 3], y_pred2)

set = training_set
X1 = seq(min(set[, 1]) - 1, max(set[, 1]) + 1, by = 0.01)
X2 = seq(min(set[, 2]) - 1, max(set[, 2]) + 1, by = 0.01)
grid_set = expand.grid(X1, X2)
colnames(grid_set) = c('Age', 'EstimatedSalary')
y_grid = predict(classifier2,newdata=grid_set)
plot(set[, -3],
     main = 'SVM (Training set)',
     xlab = 'Age', ylab = 'Estimated Salary',
     xlim = range(X1), ylim = range(X2))
contour(X1, X2, matrix(as.numeric(y_grid), length(X1), length(X2)), add = TRUE)
points(grid_set, pch = '.', col = ifelse(y_grid == 1, 'springgreen3', 'tomato'))
points(set, pch = 21, bg = ifelse(set[, 3] == 1, 'green3', 'red2'))

4. Visiulising the training set with sigmoid kernel

classifier3=svm(formula= Purchased ~., data=training_set, 
               type="C-classification", kernel="sigmoid" )
y_pred3 = predict(classifier3,newdata=test_set[-3])

Making the Confusion Matrix

cm = table(test_set[, 3], y_pred3)

set = training_set
X1 = seq(min(set[, 1]) - 1, max(set[, 1]) + 1, by = 0.01)
X2 = seq(min(set[, 2]) - 1, max(set[, 2]) + 1, by = 0.01)
grid_set = expand.grid(X1, X2)
colnames(grid_set) = c('Age', 'EstimatedSalary')
y_grid = predict(classifier3,newdata=grid_set)
plot(set[, -3],
     main = 'SVM (Training set)',
     xlab = 'Age', ylab = 'Estimated Salary',
     xlim = range(X1), ylim = range(X2))
contour(X1, X2, matrix(as.numeric(y_grid), length(X1), length(X2)), add = TRUE)
points(grid_set, pch = '.', col = ifelse(y_grid == 1, 'springgreen3', 'tomato'))
points(set, pch = 21, bg = ifelse(set[, 3] == 1, 'green3', 'red2'))

Visualising the Test set results with linear kernel

set = test_set
X1 = seq(min(set[, 1]) - 1, max(set[, 1]) + 1, by = 0.01)
X2 = seq(min(set[, 2]) - 1, max(set[, 2]) + 1, by = 0.01)
grid_set = expand.grid(X1, X2)
colnames(grid_set) = c('Age', 'EstimatedSalary')
y_grid = predict(classifier,newdata=grid_set)
plot(set[, -3],
     main = 'SVM (Test set)',
     xlab = 'Age', ylab = 'Estimated Salary',
     xlim = range(X1), ylim = range(X2))
contour(X1, X2, matrix(as.numeric(y_grid), length(X1), length(X2)), add = TRUE)
points(grid_set, pch = '.', col = ifelse(y_grid == 1, 'springgreen3', 'tomato'))
points(set, pch = 21, bg = ifelse(set[, 3] == 1, 'green4', 'red3'))

svm

fangya tan

November 21, 2017

Encoding the target feature as factor

Splitting the dataset into the Training set and Test set

install.packages(‘caTools’)

Feature Scaling

Fitting classifier to the Training set

Create your classifier here

Making the Confusion Matrix

1. Visualising the Training set results with linear kernel

2. Visiulising the training set with gussian kernel

Making the Confusion Matrix

Making the Confusion Matrix

4. Visiulising the training set with sigmoid kernel

Making the Confusion Matrix

Visualising the Test set results with linear kernel