library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(ggplot2)
Loading Data into R
# Read the two input tables from CSV files (paths are relative to the
# current working directory): "MasterData.csv" -> MasterDF, "Data.csv" -> DataN.
MasterDF <- read.csv(file = "MasterData.csv")
DataN <- read.csv(file = "Data.csv")
Renaming column names
# Overwrite the headers read from the CSV files with a fixed set of column
# names. Names are assigned by position, so each vector must list the
# columns in the same order as they appear in the corresponding table.
colnames(MasterDF) <- c(
  "District", "Mandal", "Village", "UDISE", "School_Name",
  "Address", "Area", "School_Category", "School_Management", "Enrolment"
)
colnames(DataN) <- c("District", "Mandal", "UDISE", "School_Name", "Enrolment")
Previewing the data
# Show the first six rows of MasterDF.
head(MasterDF, n = 6L)
## District Mandal Village UDISE
## 1 SRIKAKULAM VEERAGHATTAM KADAKELLA 28110100101
## 2 SRIKAKULAM VEERAGHATTAM KAMBARA 28110100201
## 3 SRIKAKULAM VEERAGHATTAM KAMBARA 28110100203
## 4 SRIKAKULAM VEERAGHATTAM KAMBARA 28110100204
## 5 SRIKAKULAM VEERAGHATTAM DASUMANTHA PURAM 28110100301
## 6 SRIKAKULAM VEERAGHATTAM NARSIPURAM 28110100401
## School_Name
## 1 MPPS KADAKELLA
## 2 CBMAPS KAMBARA
## 3 MPUPS KAMBARA
## 4 ZPHS KAMBARA VALASA
## 5 MPUPS DASUMANTHAPURAM
## 6 MPPS NARSIPURAM
## Address
## 1 KADAKELLA-KADAKELLA (VILL)-KADAKELLA(VILL)-VEERAAGHATTAM(MANDAL)
## 2 KAMBARA-KAMBARA (VILL)-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 3 KAMBARA-KAMBARA (VILL)-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 4 KAMBARA VALASA-NADUKURU-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 5 DASUMANTHA PURAM-DASUMANTHA PURAM (VILL)-DASUMANTHA PURAM(VILL)-VEERAAGHATTAM(MANDAL)
## 6 NARSIPURAM-NARSIPURAM (VILL)-NARSIPURAM(VILL)-VEERAAGHATTAM(MANDAL)
## Area School_Category School_Management Enrolment
## 1 RURAL 1-Primary 33-MPP_ZPP SCHOOLS 54
## 2 RURAL 1-Primary 35-Pvt.Aided 18
## 3 RURAL 2-Primary with Upper Primary 33-MPP_ZPP SCHOOLS 80
## 4 RURAL 7-Upper Pr. and Secondary 33-MPP_ZPP SCHOOLS 146
## 5 RURAL 2-Primary with Upper Primary 33-MPP_ZPP SCHOOLS 108
## 6 RURAL 1-Primary 33-MPP_ZPP SCHOOLS 68
# Remove DataN's own Enrolment column (the later join on UDISE brings
# Enrolment back in from MasterDF), then show the first six remaining rows.
DataN[["Enrolment"]] <- NULL
head(DataN, n = 6L)
## District Mandal UDISE School_Name
## 1 Krishna Chandarlapadu 28160501304 ZPHS Thotaravulapadu
## 2 Guntur Amthurhaluru 28174900107 SKV HIGH SCHOOL KUCHIPUDI
## 3 Guntur Amthurhaluru 28132102101 MPPS GOVADA
## 4 Guntur Amthurhaluru 28174900102 MPPS NTR ROAD
## 5 Guntur Ponnur 28174801906 ZPHS NANDURU
## 6 East Godavari Kothapeta 28144600204 ZPHS VADAPALEM
Creating a new data frame from MasterDF with the columns “UDISE”, “School_Category” and “Enrolment”
# Keep only the join key (UDISE) plus the two columns to be copied across,
# then show the first six rows of the reduced table.
DfNew <- MasterDF[c("UDISE", "School_Category", "Enrolment")]
head(DfNew, n = 6L)
## UDISE School_Category Enrolment
## 1 28110100101 1-Primary 54
## 2 28110100201 1-Primary 18
## 3 28110100203 2-Primary with Upper Primary 80
## 4 28110100204 7-Upper Pr. and Secondary 146
## 5 28110100301 2-Primary with Upper Primary 108
## 6 28110100401 1-Primary 68
# Left join: every row of DataN is kept and gains School_Category and
# Enrolment from the DfNew row with the same UDISE value.
DataN <- DataN %>%
  left_join(DfNew, by = "UDISE")
head(DataN, n = 6L)
## District Mandal UDISE School_Name
## 1 Krishna Chandarlapadu 28160501304 ZPHS Thotaravulapadu
## 2 Guntur Amthurhaluru 28174900107 SKV HIGH SCHOOL KUCHIPUDI
## 3 Guntur Amthurhaluru 28132102101 MPPS GOVADA
## 4 Guntur Amthurhaluru 28174900102 MPPS NTR ROAD
## 5 Guntur Ponnur 28174801906 ZPHS NANDURU
## 6 East Godavari Kothapeta 28144600204 ZPHS VADAPALEM
## School_Category Enrolment
## 1 7-Upper Pr. and Secondary 157
## 2 7-Upper Pr. and Secondary 241
## 3 1-Primary 111
## 4 1-Primary 97
## 5 7-Upper Pr. and Secondary 239
## 6 7-Upper Pr. and Secondary 488
Saving Data Frame to CSV
# Write the merged table to "DataN.csv" in the working directory.
# row.names = FALSE keeps R's automatic row numbers out of the file; with
# the default (TRUE) the CSV gains an extra unnamed first column that shows
# up as a spurious "X" column when the file is read back with read.csv().
write.csv(DataN, file = "DataN.csv", row.names = FALSE)