library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(ggplot2)

Loading Data into R

# Read both input tables from the current working directory.
# MasterDF is the master table; DataN is the table that later receives
# extra columns looked up from it.
MasterDF <- read.csv(file = "MasterData.csv")
DataN <- read.csv(file = "Data.csv")

Renaming the columns

# Replace the column names of both tables with a consistent set.
# The names are assigned by position, so first check that each table has
# exactly as many columns as there are names: with too few names the
# remaining columns would silently be named NA, and with too many the
# assignment fails with a less helpful error.
master_cols <- c(
  "District", "Mandal", "Village", "UDISE", "School_Name", "Address",
  "Area", "School_Category", "School_Management", "Enrolment"
)
data_cols <- c("District", "Mandal", "UDISE", "School_Name", "Enrolment")

stopifnot(
  ncol(MasterDF) == length(master_cols),
  ncol(DataN) == length(data_cols)
)

names(MasterDF) <- master_cols
names(DataN) <- data_cols

Inspecting the data

# Preview the first six rows of the master table.
head(MasterDF, n = 6L)
##     District       Mandal          Village       UDISE
## 1 SRIKAKULAM VEERAGHATTAM        KADAKELLA 28110100101
## 2 SRIKAKULAM VEERAGHATTAM          KAMBARA 28110100201
## 3 SRIKAKULAM VEERAGHATTAM          KAMBARA 28110100203
## 4 SRIKAKULAM VEERAGHATTAM          KAMBARA 28110100204
## 5 SRIKAKULAM VEERAGHATTAM DASUMANTHA PURAM 28110100301
## 6 SRIKAKULAM VEERAGHATTAM       NARSIPURAM 28110100401
##             School_Name
## 1        MPPS KADAKELLA
## 2        CBMAPS KAMBARA
## 3         MPUPS KAMBARA
## 4   ZPHS KAMBARA VALASA
## 5 MPUPS DASUMANTHAPURAM
## 6       MPPS NARSIPURAM
##                                                                                 Address
## 1                      KADAKELLA-KADAKELLA (VILL)-KADAKELLA(VILL)-VEERAAGHATTAM(MANDAL)
## 2                            KAMBARA-KAMBARA (VILL)-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 3                            KAMBARA-KAMBARA (VILL)-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 4                           KAMBARA VALASA-NADUKURU-KAMBARA(VILL)-VEERAAGHATTAM(MANDAL)
## 5 DASUMANTHA PURAM-DASUMANTHA PURAM (VILL)-DASUMANTHA PURAM(VILL)-VEERAAGHATTAM(MANDAL)
## 6                   NARSIPURAM-NARSIPURAM (VILL)-NARSIPURAM(VILL)-VEERAAGHATTAM(MANDAL)
##    Area              School_Category  School_Management Enrolment
## 1 RURAL                    1-Primary 33-MPP_ZPP SCHOOLS        54
## 2 RURAL                    1-Primary       35-Pvt.Aided        18
## 3 RURAL 2-Primary with Upper Primary 33-MPP_ZPP SCHOOLS        80
## 4 RURAL    7-Upper Pr. and Secondary 33-MPP_ZPP SCHOOLS       146
## 5 RURAL 2-Primary with Upper Primary 33-MPP_ZPP SCHOOLS       108
## 6 RURAL                    1-Primary 33-MPP_ZPP SCHOOLS        68
# Remove DataN's own Enrolment column; an Enrolment column is brought in
# from MasterDF by the join further down.
DataN[["Enrolment"]] <- NULL

# Preview the first six rows of what is left.
head(DataN, n = 6L)
##        District        Mandal       UDISE               School_Name
## 1       Krishna Chandarlapadu 28160501304      ZPHS Thotaravulapadu
## 2        Guntur  Amthurhaluru 28174900107 SKV HIGH SCHOOL KUCHIPUDI
## 3        Guntur  Amthurhaluru 28132102101               MPPS GOVADA
## 4        Guntur  Amthurhaluru 28174900102             MPPS NTR ROAD
## 5        Guntur        Ponnur 28174801906              ZPHS NANDURU
## 6 East Godavari     Kothapeta 28144600204            ZPHS VADAPALEM

Creating a new data frame from MasterDF with the columns “UDISE”, “School_Category” and “Enrolment”, then joining it to DataN by “UDISE”

# Build the lookup table: the join key (UDISE) plus the two columns to be
# attached to DataN.
DfNew <- MasterDF[c("UDISE", "School_Category", "Enrolment")]

# Preview the first six rows of the lookup table.
head(DfNew, n = 6L)
##         UDISE              School_Category Enrolment
## 1 28110100101                    1-Primary        54
## 2 28110100201                    1-Primary        18
## 3 28110100203 2-Primary with Upper Primary        80
## 4 28110100204    7-Upper Pr. and Secondary       146
## 5 28110100301 2-Primary with Upper Primary       108
## 6 28110100401                    1-Primary        68
# Attach School_Category and Enrolment to DataN by matching on UDISE.
# A left join keeps every row of DataN; rows with no match in DfNew get NA
# in the added columns.
# NOTE(review): assumes UDISE is unique in DfNew -- duplicate keys would
# multiply the matching DataN rows. Confirm against the master data.
DataN <- DataN %>%
  left_join(DfNew, by = "UDISE")

# Preview the first six rows of the joined table.
head(DataN, n = 6L)
##        District        Mandal       UDISE               School_Name
## 1       Krishna Chandarlapadu 28160501304      ZPHS Thotaravulapadu
## 2        Guntur  Amthurhaluru 28174900107 SKV HIGH SCHOOL KUCHIPUDI
## 3        Guntur  Amthurhaluru 28132102101               MPPS GOVADA
## 4        Guntur  Amthurhaluru 28174900102             MPPS NTR ROAD
## 5        Guntur        Ponnur 28174801906              ZPHS NANDURU
## 6 East Godavari     Kothapeta 28144600204            ZPHS VADAPALEM
##             School_Category Enrolment
## 1 7-Upper Pr. and Secondary       157
## 2 7-Upper Pr. and Secondary       241
## 3                 1-Primary       111
## 4                 1-Primary        97
## 5 7-Upper Pr. and Secondary       239
## 6 7-Upper Pr. and Secondary       488

Saving the data frame to CSV

# Write the enriched table to DataN.csv in the working directory.
# row.names = FALSE stops write.csv from adding the automatic row numbers
# as an unnamed first column, which would otherwise come back as a
# spurious "X" column when the file is read again.
write.csv(DataN, file = "DataN.csv", row.names = FALSE)