# GET DATA FROM MUSHROOMS DATA SOURCE
# Load the UCI Mushroom data set (agaricus-lepiota.data) and label its columns.
#
# The raw file has no header row, so header = FALSE is required: with the
# read.csv() default (header = TRUE) the first record is consumed as column
# names and silently dropped from the data.
# NOTE: output captured in this document before this fix omits that first
# record and shows a duplicated column name; re-run to refresh it.
Mushrooms_link <- read.csv(
  url("https://archive.ics.uci.edu/ml/machine-learning-databases/mushroom/agaricus-lepiota.data"),
  header = FALSE
)
Mushrooms_data <- as.data.frame(Mushrooms_link)

# One name per column, in file order. The 16th column is the stalk colour
# *below* the ring (it was previously a duplicate of the 15th column's name).
names(Mushrooms_data) <- c(
  "EDIBILITY", "CAP_SHAPE", "CAP_SURFACE", "CAP_COLOR", "BRUISES", "ODOR",
  "GILL_ATTACHMENT", "GILL_SPACING", "GILL_SIZE", "GILL_COLOR",
  "STALK_SHAPE", "STALK_ROOT",
  "STALK_SURFACE_ABOVE_RING", "STALK_SURFACE_BELOW_RING",
  "STALK_COLOR_ABOVE_RING", "STALK_COLOR_BELOW_RING",
  "VEIL_TYPE", "VEIL_COLOR", "RING_NUMBER", "RING_TYPE",
  "SPORE_PRINT_COLOR", "POPULATION", "HABITAT"
)

# Preview the first rows.
head(Mushrooms_data)
## EDIBILITY CAP_SHAPE CAP_SURFACE CAP_COLOR BRUISES ODOR GILL_ATTACHMENT
## 1 e x s y t a f
## 2 e b s w t l f
## 3 p x y w t p f
## 4 e x s g f n f
## 5 e x y y t a f
## 6 e b s w t a f
## GILL_SPACING GILL_SIZE GILL_COLOR STALK_SHAPE STALK_ROOT
## 1 c b k e c
## 2 c b n e c
## 3 c n n e e
## 4 w b k t e
## 5 c b n e c
## 6 c b g e c
## STALK_SURFACE_ABOVE_RING STALK_SURFACE_BELOW_RING STALK_COLOR_ABOVE_RING
## 1 s s w
## 2 s s w
## 3 s s w
## 4 s s w
## 5 s s w
## 6 s s w
## STALK_COLOR_ABOVE_RING VEIL_TYPE VEIL_COLOR RING_NUMBER RING_TYPE
## 1 w p w o p
## 2 w p w o p
## 3 w p w o p
## 4 w p w o e
## 5 w p w o p
## 6 w p w o p
## SPORE_PRINT_COLOR POPULATION HABITAT
## 1 n n g
## 2 n n m
## 3 k s u
## 4 n a g
## 5 k n g
## 6 k n m
# SUBSET
# Keep only the first six attributes (EDIBILITY through ODOR), naming each
# column explicitly rather than relying on a positional range.
final_data_Column <- subset(
  Mushrooms_data,
  select = c(EDIBILITY, CAP_SHAPE, CAP_SURFACE, CAP_COLOR, BRUISES, ODOR)
)

# Preview the reduced data frame.
head(final_data_Column)
## EDIBILITY CAP_SHAPE CAP_SURFACE CAP_COLOR BRUISES ODOR
## 1 e x s y t a
## 2 e b s w t l
## 3 p x y w t p
## 4 e x s g f n
## 5 e x y y t a
## 6 e b s w t a
# REPLACE THE ABBREVIATIONS USED IN THE DATA
# EDIBILITY
# Spell out the edibility code: "p" becomes "POISONOUS", every other value
# becomes "EDIBLE".
is_poisonous <- final_data_Column$EDIBILITY == "p"
final_data_Column$EDIBILITY <- ifelse(is_poisonous, "POISONOUS", "EDIBLE")
# CAP SHAPE
# Replace the one-letter cap-shape codes with readable labels.
# Names are the raw codes, values are the labels written back to the column.
cap_shape_labels <- c(
  b = "BELL",
  c = "CONICAL",
  x = "CONVEX",
  f = "FLAT",
  k = "KNOBBED",
  s = "SUNKEN"
)

# Register the labels as additional levels first so they can be assigned.
levels(final_data_Column$CAP_SHAPE) <- c(
  levels(final_data_Column$CAP_SHAPE),
  unname(cap_shape_labels)
)

# Overwrite each code with its label, one code at a time.
for (code in names(cap_shape_labels)) {
  hits <- final_data_Column$CAP_SHAPE == code
  final_data_Column$CAP_SHAPE[hits] <- cap_shape_labels[[code]]
}
# CAP SURFACE
# Replace the one-letter cap-surface codes with readable labels.
# Names are the raw codes, values are the labels written back to the column.
cap_surface_labels <- c(
  f = "FIBROUS",
  g = "GROOVES",
  y = "SCALY",
  s = "SMOOTH"
)

# Register the labels as additional levels first so they can be assigned.
levels(final_data_Column$CAP_SURFACE) <- c(
  levels(final_data_Column$CAP_SURFACE),
  unname(cap_surface_labels)
)

# Overwrite each code with its label, one code at a time.
for (code in names(cap_surface_labels)) {
  hits <- final_data_Column$CAP_SURFACE == code
  final_data_Column$CAP_SURFACE[hits] <- cap_surface_labels[[code]]
}
# CAP COLOR
# Replace the one-letter cap-colour codes with readable labels.
# Names are the raw codes, values are the labels written back to the column.
cap_color_labels <- c(
  n = "BROWN",
  b = "BUFF",
  c = "CINNAMON",
  g = "GRAY",
  r = "GREEN",
  p = "PINK",
  u = "PURPLE",
  e = "RED",
  w = "WHITE",
  y = "YELLOW"
)

# Register the labels as additional levels first so they can be assigned.
levels(final_data_Column$CAP_COLOR) <- c(
  levels(final_data_Column$CAP_COLOR),
  unname(cap_color_labels)
)

# Overwrite each code with its label, one code at a time.
for (code in names(cap_color_labels)) {
  hits <- final_data_Column$CAP_COLOR == code
  final_data_Column$CAP_COLOR[hits] <- cap_color_labels[[code]]
}
# BRUISES
# Spell out the bruising flag: "t" becomes "BRUISES", every other value
# becomes "NO".
has_bruises <- final_data_Column$BRUISES == "t"
final_data_Column$BRUISES <- ifelse(has_bruises, "BRUISES", "NO")
# ODOR
# Replace the one-letter odor codes with readable labels.
# Names are the raw codes, values are the labels written back to the column.
# "f" = "FOUL" was previously registered as a level but never assigned, which
# left every foul-smelling record with the raw code "f".
odor_labels <- c(
  a = "ALMOND",
  l = "ANISE",
  c = "CREOSOTE",
  y = "FISHY",
  f = "FOUL",
  m = "MUSTY",
  n = "NONE",
  p = "PUNGENT",
  s = "SPICY"
)

# Register the labels as additional levels first so they can be assigned.
levels(final_data_Column$ODOR) <- c(
  levels(final_data_Column$ODOR),
  unname(odor_labels)
)

# Overwrite each code with its label, one code at a time.
for (code in names(odor_labels)) {
  hits <- final_data_Column$ODOR == code
  final_data_Column$ODOR[hits] <- odor_labels[[code]]
}
# FINAL RESULT
# Show the first six rows of the recoded data frame.
head(final_data_Column, n = 6L)
## EDIBILITY CAP_SHAPE CAP_SURFACE CAP_COLOR BRUISES ODOR
## 1 EDIBLE CONVEX SMOOTH YELLOW BRUISES ALMOND
## 2 EDIBLE BELL SMOOTH WHITE BRUISES ANISE
## 3 POISONOUS CONVEX SCALY WHITE BRUISES PUNGENT
## 4 EDIBLE CONVEX SMOOTH GRAY NO NONE
## 5 EDIBLE CONVEX SCALY YELLOW BRUISES ALMOND
## 6 EDIBLE BELL SMOOTH WHITE BRUISES ALMOND