Dataset: Loksabha 2019 Candidates General Information. (https://www.kaggle.com/datasets/themlphdstudent/lok-sabha-election-candidate-list-2004-to-2019)
# Importing required libraries
library(tidyverse)
## ── Attaching core tidyverse packages ──────────────────────── tidyverse 2.0.0 ──
## ✔ dplyr 1.1.2 ✔ readr 2.1.4
## ✔ forcats 1.0.0 ✔ stringr 1.5.0
## ✔ ggplot2 3.4.3 ✔ tibble 3.2.1
## ✔ lubridate 1.9.2 ✔ tidyr 1.3.0
## ✔ purrr 1.0.2
## ── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag() masks stats::lag()
## ℹ Use the conflicted package (<http://conflicted.r-lib.org/>) to force all conflicts to become errors
library(ggrepel)
# Read the Lok Sabha 2019 candidate table from a local CSV export.
# NOTE(review): the path is absolute and machine-specific, so the script only
# runs where this exact file exists -- confirm before sharing.
data <- read.csv(
  file = 'C:\\Users\\bhush\\Downloads\\Coursework\\I 590 INTRO TO R\\datasets\\data_final\\LokSabha2019_xl.csv'
)
# Sum the Winner column within each party, rank the parties from most to
# fewest winners, and show the first seven rows of the ranking.
df1 <- summarise(group_by(data, Party), total_winners = sum(Winner))
sort_df1 <- arrange(df1, desc(total_winners))
head(sort_df1, n = 7)
## # A tibble: 7 × 2
## Party total_winners
## <chr> <int>
## 1 BJP 184
## 2 INC 22
## 3 AITC 13
## 4 DMK 13
## 5 YSRCP 12
## 6 BJD 11
## 7 SHS 7
# Bar chart of the seven parties with the most winning candidates.
# head() replaces sort_df1[c(1:7), ] so a ranking with fewer than seven rows
# is never indexed past its end.
plt1 <- head(sort_df1, n = 7)
# Party is a character column, so ggplot would lay the bars out alphabetically
# and discard the ranking; reorder() keeps them in descending order of
# total_winners.
ggplot(data = plt1) +
  geom_col(
    mapping = aes(x = reorder(Party, -total_winners), y = total_winners)
  ) +
  theme_classic() +
  labs(title = "Winning Candidates", x = "Parties", y = "Count")
# Sum the Winner column within each education level and print the table.
# Despite its name, noOfCandidates holds the per-group sum of Winner, not the
# number of candidate rows.
df2 <- summarise(group_by(data, Education), noOfCandidates = sum(Winner))
print(df2)
## # A tibble: 12 × 2
## Education noOfCandidates
## <chr> <int>
## 1 10th Pass 21
## 2 12th Pass 34
## 3 5th Pass 3
## 4 8th Pass 6
## 5 Doctorate 13
## 6 Graduate 72
## 7 Graduate Professional 68
## 8 Illiterate 1
## 9 Literate 1
## 10 Not Given 0
## 11 Others 11
## 12 Post Graduate 75
# Rank education levels by their winner totals and chart the top seven.
sort_df2 <- df2 |>
  arrange(desc(noOfCandidates))
# head() replaces sort_df2[c(1:7), ] so a ranking with fewer than seven rows
# is never indexed past its end.
plt2 <- head(sort_df2, n = 7)
# Education is a character column, so ggplot would lay the bars out
# alphabetically; reorder() keeps them in descending order of noOfCandidates.
ggplot(data = plt2) +
  geom_col(
    mapping = aes(x = reorder(Education, -noOfCandidates), y = noOfCandidates)
  ) +
  theme_classic() +
  labs(
    title = "Winning Candidates - Education Lvl",
    x = "Education",
    y = "Count"
  )
# Keep the rows whose Constituency contains "Delhi" (case-insensitive match)
# and print the resulting subset; original row names are retained.
df3 <- data[grepl("Delhi", data[["Constituency"]], ignore.case = TRUE), ]
print(df3)
## Candidate Party
## 4350 Gautam Gambhir BJP
## 4351 Ajay Chaudhary Aapki Apni Party (Peoples)
## 4352 Amanullah Ahmed Bhartiya Insan Party
## 4353 Anupam Tripathi Bhartiya Kisan Party
## 4354 Arvinder Singh Lovely INC
## 4355 Ashok Surana IND
## 4356 Atishi AAP
## 4357 D. Durga Prasad Challengers Party
## 4358 Deepti Nadella Pyramid Party of India
## 4359 Hafiz Burhanuddin The National Road Map Party of India
## 4360 Harbalwinder Singh IND
## 4361 Hitesh Kumar Jai Prakash Janata Dal
## 4362 Krishan Singh Chauhan Peoples Party of India (Democratic)
## 4363 Manjeet Singh Rashtra Nirman Party
## 4364 Manju Chhibber RPI(A)
## 4365 Manoj Kumar Gupta IND
## 4366 Mohan Lal Sharma Satya Bahumat Party
## 4367 Mukesh Jadly Uttarakhand Pragatisheel Party
## 4368 Neeru Mongia PRISM Party
## 4369 Rahimuddin Shah IND
## 4370 Raj Kumar Dhingiya IND
## 4371 Ravi Kumar IND
## 4372 Sanjay Kumar BSP
## 4373 Satish Kumar Prajapati Mazdoor Kirayedar Vikas Party
## 4374 Shiv Kumar IND
## 4375 Surender Gupta National Apni Party
## 4376 Meenakashi Lekhi BJP
## 4377 Aashish S Saxena IND
## 4378 Ajay Kumar Lal IND
## 4379 Ajay Makan INC
## 4380 Brijesh Goyal AAP
## 4381 Dilip Singh Kothari IND
## 4382 Harkrishan Das Nijhawan IND
## 4383 Jitendra Raut Akhil Bharatiya Manavata Paksha
## 4384 K Sreekrishna Jammu & Kashmir National Panthers Party
## 4385 Kripashankar C Pandey IND
## 4386 Lal Ji Akhand Rashtrawadi Party
## 4387 Naveen Kumar Rashtriya Samrasta Party
## 4388 Nilanjan Banerjee Bharat Lok Sewak Party
## 4389 Priyanka Bharihoke IND
## 4390 Raj Karan Corruption Abolition Party
## 4391 Raj Shekhar Gunti PRISM Party
## 4392 Rajesh Satiya Sanatan Sanskriti Raksha Dal
## 4393 Ramesh IND
## 4394 Ravinder Paul Sehgal Pyramid Party of India
## 4395 Sree Nivasan Ramamoorthy IND
## 4396 Sunil Aapki Apni Party (Peoples)
## 4397 Sunil Kumar Peoples Party of India (Democratic)
## 4398 Suresh Kumar IND
## 4399 Swadesh Kumar Ohr Atulya Bharat Party
## 4400 Umesh Chandra Gaur RPI(A)
## 4401 Upendra Anjaan Aadmi Party
## 4402 Virendra Singh Bharat Rashtriya Rashtrawadi Party
## 4403 Manoj Tiwari BJP
## 4404 Abhinav Kumar Sanyukt Vikas Party
## 4405 Ajay Bhai Right to Recall Party
## 4406 Amit Kumar Sharma Sanjhi Virasat Party
## 4407 Amrender Kumar IND
## 4408 Anil Kumar Yadav IND
## 4409 Anuruddh Kumar Dube Bharat Lok Sewak Party
## 4410 D Durga Prasad Challengers Party
## 4411 Dan Bahadur Yadav Bhartiya Janta Dal (Integrated)
## 4412 Dilip Pandey AAP
## 4413 J. K. Jain Jai Prakash Janata Dal
## 4414 Mahender Paswan Mazdoor Kirayedar Vikas Party
## 4415 Mahfooj Khan IND
## 4416 Manager Chaurasiya SUCI(C)
## 4417 Md Akram IND
## 4418 Mohd Hasan RPI(A)
## 4419 Mohd Irfan Bharat Prabhat Party
## 4420 Mukesh Aapki Apni Party (Peoples)
## 4421 Pradesh Kumar Sarvodaya Prabhat Party
## 4422 Rajveer Singh BSP
## 4423 S N Singh IND
## 4424 Sheila Dikshit INC
## 4425 Sunil Vishvakarma Ambedkar National Congress
## 4426 Yogesh Swamy IND
## 4427 Hans Raj Hans BJP
## 4428 Aditi IND
## 4429 Charan Singh "Babrik" IND
## 4430 Gaurav Bhatia Mazdoor Kirayedar Vikas Party
## 4431 Gugan Singh AAP
## 4432 Ishwar Mansukh Ishu Satya Bahumat Party
## 4433 Madan Lal Balmiki Rashtriya Samrasta Party
## 4434 Naveen IND
## 4435 Rajesh Lilothia INC
## 4436 Ram Kumar Bhartiya Pragatisheel Congress
## 4437 Suresh Kumar Socialist Janata Party
## 4438 Ramesh Bidhuri BJP
## 4439 Aditya Kumar Naveen Hum Bhartiya Party
## 4440 Birju Nayak IND
## 4441 Dalbir Singh Malik Voters Party International
## 4442 Deepak Kumar Aapki Apni Party (Peoples)
## 4443 Desh Kumar Akhil Bharatiya Jan Sangh
## 4444 Dilip Kumar Sanatan Sanskriti Raksha Dal
## 4445 Dr. Mahender Singh Churiyana Peoples Party of India (Democratic)
## 4446 Dr. Suman Yadav Jai Maha Bharath Party
## 4447 Harsh Nath Verma IND
## 4448 Jitendra PRISM Party
## 4449 K Roshan Kumar Pyramid Party of India
## 4450 Mathews Bhartiya Insan Party
## 4451 Mohan Kumar Gupta Mazdoor Kirayedar Vikas Party
## 4452 Naise Khan IND
## 4453 Navanit National Youth Party
## 4454 Raghav Chadha AAP
## 4455 Rajendra Prasad Gupta Parivartan Samaj Party
## 4456 Ram Khelawan Proutist Bloc, India
## 4457 Roshan Kumar Choudhary IND
## 4458 Sandeep Rashtriya Jan Adhikar Party
## 4459 Siddhant Gautam BSP
## 4460 Sobran Singh Chauhan Rashtriya Rashtrawadi Party
## 4461 Sumedha Bodh Jan Samman party
## 4462 Sunil Kumar IND
## 4463 Vijender INC
## 4464 Parvesh Sahib Singh BJP
## 4465 Baidyanath Sah Proutist Bloc, India
## 4466 Balbir Singh Jakhar AAP
## 4467 Balbir Singh S/O Dayaram Chaudhary IND
## 4468 Daya Nand Vats RPI(A)
## 4469 Dharambir Singh Rashtriya Janshakti Party (Secular)
## 4470 Harsh Vardhan Shukla IND
## 4471 Iqbal Singh (Sonu) IND
## 4472 Janak Raj Rana Akhand Rashtrawadi Party
## 4473 Kulwinder Singh Mehta Pyramid Party of India
## 4474 M. Mishra IND
## 4475 Mahabal Mishra INC
## 4476 Manmohan Singh Rashtra Nirman Party
## 4477 Navin Chandra Das IND
## 4478 Poonam Peoples Party of India (Democratic)
## 4479 Pravesh Sharma IND
## 4480 Probir Dutta Satya Bahumat Party
## 4481 Rajiv Kumar IND
## 4482 Ramesh Chand Verma IND
## 4483 Shashijeet National Youth Party
## 4484 Shish Pal Singh PRISM Party
## 4485 Sita Saran Sen BSP
## 4486 Vikash Kumar Mohal Aapki Apni Party (Peoples)
## Criminal.Cases Education Age Total.Assets Constituency
## 4350 1 12th Pass 37 1471587789 East Delhi
## 4351 0 12th Pass 42 559000 East Delhi
## 4352 0 10th Pass 34 7944500 East Delhi
## 4353 0 Graduate Professional 38 3071500 East Delhi
## 4354 0 Graduate 50 50452066 East Delhi
## 4355 0 Graduate 44 112354277 East Delhi
## 4356 1 Post Graduate 37 12012824 East Delhi
## 4357 0 Graduate Professional 53 47138000 East Delhi
## 4358 0 Post Graduate 38 9062141 East Delhi
## 4359 0 Post Graduate 57 6645000 East Delhi
## 4360 0 Post Graduate 38 143303628 East Delhi
## 4361 0 Post Graduate 38 53725000 East Delhi
## 4362 0 Doctorate 56 26415314 East Delhi
## 4363 0 Graduate Professional 31 6240443 East Delhi
## 4364 0 Graduate 64 31868000 East Delhi
## 4365 0 Post Graduate 42 35324 East Delhi
## 4366 0 Post Graduate 72 20428012 East Delhi
## 4367 0 Post Graduate 48 12504856 East Delhi
## 4368 0 Graduate Professional 40 21370288 East Delhi
## 4369 0 10th Pass 39 938785 East Delhi
## 4370 0 Post Graduate 40 708293 East Delhi
## 4371 0 Graduate 53 39705621 East Delhi
## 4372 0 12th Pass 48 4693400 East Delhi
## 4373 0 8th Pass 48 4114657 East Delhi
## 4374 0 5th Pass 45 1198000 East Delhi
## 4375 0 5th Pass 43 590000 East Delhi
## 4376 0 Graduate Professional 51 361441689 New Delhi
## 4377 0 Post Graduate 39 2680000 New Delhi
## 4378 0 Post Graduate 60 46731242 New Delhi
## 4379 0 Post Graduate 55 245732926 New Delhi
## 4380 0 Graduate 43 9594156 New Delhi
## 4381 0 Post Graduate 59 5852977 New Delhi
## 4382 1 12th Pass 56 36167926 New Delhi
## 4383 1 Graduate 40 649510 New Delhi
## 4384 0 Post Graduate 49 59282 New Delhi
## 4385 0 12th Pass 61 69416833 New Delhi
## 4386 1 Graduate 49 6494000 New Delhi
## 4387 0 Graduate Professional 44 7606632 New Delhi
## 4388 0 12th Pass 41 60000 New Delhi
## 4389 0 Post Graduate 33 3832340 New Delhi
## 4390 0 10th Pass 61 20105350 New Delhi
## 4391 0 Graduate 44 492771 New Delhi
## 4392 0 Post Graduate 36 62108 New Delhi
## 4393 1 Graduate Professional 58 44836000 New Delhi
## 4394 0 Post Graduate 70 45725073 New Delhi
## 4395 0 Graduate Professional 57 9996766 New Delhi
## 4396 0 8th Pass 36 2509219 New Delhi
## 4397 0 Post Graduate 47 11664371 New Delhi
## 4398 0 Graduate 41 1376000 New Delhi
## 4399 0 Graduate 77 33423025 New Delhi
## 4400 0 Doctorate 51 3901922 New Delhi
## 4401 0 Graduate Professional 31 1024406 New Delhi
## 4402 0 Graduate Professional 57 3406386 New Delhi
## 4403 3 Post Graduate 48 242817031 North East Delhi
## 4404 0 Graduate 32 1167520 North East Delhi
## 4405 0 10th Pass 35 14088213 North East Delhi
## 4406 0 Graduate 43 2386000 North East Delhi
## 4407 0 10th Pass 30 2590450 North East Delhi
## 4408 0 Graduate 27 222218 North East Delhi
## 4409 1 10th Pass 39 13345000 North East Delhi
## 4410 0 Graduate Professional 53 47138000 North East Delhi
## 4411 0 Graduate Professional 43 4305100 North East Delhi
## 4412 1 Post Graduate 38 5433393 North East Delhi
## 4413 0 Graduate Professional 61 12182945 North East Delhi
## 4414 0 8th Pass 41 1857000 North East Delhi
## 4415 0 8th Pass 42 259000 North East Delhi
## 4416 0 12th Pass 51 903000 North East Delhi
## 4417 0 Graduate Professional 34 330057 North East Delhi
## 4418 0 12th Pass 44 372000 North East Delhi
## 4419 0 Graduate Professional 41 12463190 North East Delhi
## 4420 1 10th Pass 53 17285880 North East Delhi
## 4421 0 Graduate Professional 35 1102410 North East Delhi
## 4422 0 12th Pass 43 92354028 North East Delhi
## 4423 1 Doctorate 72 28183644 North East Delhi
## 4424 0 Post Graduate 81 49285773 North East Delhi
## 4425 0 10th Pass 47 4502000 North East Delhi
## 4426 0 Graduate 36 32514 North East Delhi
## 4427 0 10th Pass 57 130937732 North West Delhi
## 4428 1 Graduate 25 18505 North West Delhi
## 4429 0 8th Pass 50 205330 North West Delhi
## 4430 0 8th Pass 31 283000 North West Delhi
## 4431 0 8th Pass 70 12853787 North West Delhi
## 4432 1 8th Pass 34 125718 North West Delhi
## 4433 1 10th Pass 66 2637085 North West Delhi
## 4434 0 12th Pass 33 4375000 North West Delhi
## 4435 0 Post Graduate 53 44456251 North West Delhi
## 4436 0 Graduate 62 28000 North West Delhi
## 4437 0 Graduate Professional 65 25320000 North West Delhi
## 4438 2 Graduate Professional 57 180052708 South Delhi
## 4439 0 12th Pass 34 2044023 South Delhi
## 4440 0 Graduate 44 4589741 South Delhi
## 4441 0 12th Pass 56 69949801 South Delhi
## 4442 0 8th Pass 41 6254000 South Delhi
## 4443 0 Graduate 56 611000 South Delhi
## 4444 0 Graduate 44 4856379 South Delhi
## 4445 0 Post Graduate 61 32015000 South Delhi
## 4446 0 Doctorate 42 24054066 South Delhi
## 4447 0 8th Pass 61 50000 South Delhi
## 4448 0 Graduate Professional 40 4392289 South Delhi
## 4449 0 Others 53 3217000 South Delhi
## 4450 0 Graduate 63 592000 South Delhi
## 4451 0 Graduate 31 1948254 South Delhi
## 4452 0 5th Pass 60 260500 South Delhi
## 4453 2 Post Graduate 40 94043 South Delhi
## 4454 0 Graduate Professional 30 1647954 South Delhi
## 4455 0 Post Graduate 49 278181 South Delhi
## 4456 0 10th Pass 50 2602100 South Delhi
## 4457 0 12th Pass 45 29000 South Delhi
## 4458 0 8th Pass 36 1206152 South Delhi
## 4459 0 Post Graduate 52 7797516 South Delhi
## 4460 0 Graduate 63 5643963 South Delhi
## 4461 0 Post Graduate 35 1378221 South Delhi
## 4462 0 10th Pass 39 2031247 South Delhi
## 4463 0 Graduate 33 121525000 South Delhi
## 4464 0 Post Graduate 41 155195014 West Delhi
## 4465 0 Graduate Professional 53 5240190 West Delhi
## 4466 0 Graduate Professional 47 32894288 West Delhi
## 4467 0 Graduate 56 2629592 West Delhi
## 4468 0 Post Graduate 62 10570909 West Delhi
## 4469 0 10th Pass 57 499904 West Delhi
## 4470 0 Graduate Professional 26 508722 West Delhi
## 4471 1 8th Pass 45 10436974 West Delhi
## 4472 0 Graduate Professional 57 41572000 West Delhi
## 4473 0 12th Pass 54 1762088 West Delhi
## 4474 0 Graduate Professional 41 6425058 West Delhi
## 4475 3 12th Pass 65 450721618 West Delhi
## 4476 0 Post Graduate 58 35166395 West Delhi
## 4477 0 Graduate 69 8044000 West Delhi
## 4478 0 Graduate 48 4189796 West Delhi
## 4479 0 Post Graduate 36 5421404 West Delhi
## 4480 0 Post Graduate 44 6093819 West Delhi
## 4481 0 Graduate Professional 51 140037 West Delhi
## 4482 0 5th Pass 58 9684561 West Delhi
## 4483 0 12th Pass 44 1173350 West Delhi
## 4484 0 5th Pass 64 2362891 West Delhi
## 4485 0 10th Pass 40 15707415 West Delhi
## 4486 0 12th Pass 25 108973 West Delhi
## Liabilities Winner Gender
## 4350 342035860 0 M
## 4351 180000 0 M
## 4352 0 0 M
## 4353 700000 0 M
## 4354 0 0 M
## 4355 2250000 0 M
## 4356 0 0 M
## 4357 0 0 M
## 4358 0 0 F
## 4359 0 0 M
## 4360 0 0 M
## 4361 3000000 0 M
## 4362 750832 0 M
## 4363 230501 0 M
## 4364 0 0 F
## 4365 0 0 M
## 4366 0 0 M
## 4367 950000 0 M
## 4368 1980000 0 F
## 4369 0 0 M
## 4370 0 0 M
## 4371 334500 0 M
## 4372 845000 0 M
## 4373 0 0 M
## 4374 0 0 M
## 4375 0 0 M
## 4376 7938378 1 F
## 4377 242000 0 M
## 4378 4301374 0 M
## 4379 0 0 M
## 4380 3285554 0 M
## 4381 0 0 M
## 4382 575000 0 M
## 4383 14406 0 M
## 4384 0 0 M
## 4385 3570000 0 M
## 4386 170000 0 M
## 4387 86034 0 M
## 4388 0 0 M
## 4389 0 0 F
## 4390 100000 0 M
## 4391 2601000 0 M
## 4392 43326 0 M
## 4393 65000 0 M
## 4394 73782 0 M
## 4395 0 0 M
## 4396 1810000 0 M
## 4397 1761306 0 M
## 4398 0 0 M
## 4399 476000 0 M
## 4400 0 0 M
## 4401 0 0 M
## 4402 1500000 0 M
## 4403 13618755 0 M
## 4404 0 0 M
## 4405 8750871 0 M
## 4406 0 0 M
## 4407 250000 0 M
## 4408 0 0 M
## 4409 1820843 0 M
## 4410 0 0 M
## 4411 0 0 M
## 4412 0 0 M
## 4413 0 0 M
## 4414 0 0 M
## 4415 100000 0 M
## 4416 0 0 M
## 4417 0 0 M
## 4418 0 0 M
## 4419 0 0 M
## 4420 600000 0 M
## 4421 201238 0 M
## 4422 40746162 0 M
## 4423 0 0 M
## 4424 0 0 F
## 4425 682000 0 M
## 4426 0 0 M
## 4427 47897494 1 M
## 4428 0 0 M
## 4429 0 0 M
## 4430 0 0 M
## 4431 0 0 M
## 4432 20000 0 M
## 4433 0 0 M
## 4434 0 0 M
## 4435 79000 0 M
## 4436 0 0 M
## 4437 0 0 M
## 4438 2038454 0 M
## 4439 0 0 M
## 4440 130000 0 M
## 4441 5181183 0 M
## 4442 0 0 M
## 4443 0 0 M
## 4444 586000 0 M
## 4445 1150000 0 M
## 4446 1600000 0 F
## 4447 0 0 M
## 4448 0 0 M
## 4449 0 0 M
## 4450 0 0 M
## 4451 0 0 M
## 4452 0 0 M
## 4453 1150000 0 M
## 4454 0 0 M
## 4455 0 0 M
## 4456 108000 0 M
## 4457 0 0 M
## 4458 0 0 M
## 4459 900000 0 M
## 4460 0 0 M
## 4461 0 0 F
## 4462 0 0 M
## 4463 31967000 0 M
## 4464 40097329 1 M
## 4465 211300 0 M
## 4466 4161197 0 M
## 4467 0 0 M
## 4468 0 0 M
## 4469 0 0 M
## 4470 0 0 M
## 4471 0 0 M
## 4472 700000 0 M
## 4473 0 0 M
## 4474 0 0 M
## 4475 2814393 0 M
## 4476 12015 0 M
## 4477 1280000 0 M
## 4478 1271875 0 F
## 4479 926560 0 M
## 4480 0 0 M
## 4481 0 0 M
## 4482 0 0 M
## 4483 0 0 M
## 4484 0 0 M
## 4485 400000 0 M
## 4486 25000 0 M
# Mean of the Total.Assets column over the rows of df3.
df3_mean <- mean(df3[["Total.Assets"]])
print(df3_mean)
## [1] 37408946
# Scatter plot of Total.Assets by constituency for the rows of df3, with
# winners highlighted and labelled by candidate name.
# The flag column is given an explicit name: an unnamed `Winner == 1` inside
# mutate() creates a column literally called "Winner == 1" that nothing uses.
winD <- mutate(df3, is_winner = Winner == 1)
df3 |>
  ggplot(mapping = aes(x = Constituency, y = Total.Assets)) +
  # Non-winners are drawn first so the green winner points sit on top and
  # cannot be hidden by overlapping blue points.
  geom_point(data = filter(winD, !is_winner), color = "blue") +
  geom_point(data = filter(winD, is_winner), color = "green") +
  geom_text_repel(
    data = filter(winD, is_winner),
    mapping = aes(label = Candidate)
  ) +
  theme_classic()
# Total assets per party among the rows of df3, ranked from largest to
# smallest, with the top seven charted.
# as.numeric() makes the sum run in double precision: if Total.Assets was read
# as an integer column, a group total above .Machine$integer.max would
# overflow to NA.
df4 <- df3 |>
  group_by(Party) |>
  summarise(total_assets_ = sum(as.numeric(Total.Assets)))
sort_df4 <- df4 |>
  arrange(desc(total_assets_))
# head() replaces sort_df4[c(1:7), ] so a ranking with fewer than seven rows
# is never indexed past its end.
plt4 <- head(sort_df4, n = 7)
# Party is a character column, so ggplot would lay the bars out alphabetically;
# reorder() keeps them in descending order of total_assets_.
ggplot(data = plt4) +
  geom_col(
    mapping = aes(x = reorder(Party, -total_assets_), y = total_assets_)
  ) +
  theme_classic() +
  # vjust = 0.5 centres each rotated label on its tick mark.
  theme(axis.text.x = element_text(angle = 90, hjust = 1, vjust = 0.5)) +
  labs(title = "Parties and their Assets", x = "Party", y = "Amounts")
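The joined table built below has three columns:
1. Party
2. Total winners in that party
3. Total assets of that party (summed over its Delhi candidates)
We choose a row of this table at random and ask for the probability that the party in that row has total assets greater than 300000 INR.
We estimate this probability by simulation: the random draw is repeated 1000 times in a for loop, and the estimate is the fraction of draws that satisfy the condition.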
# Left-join the per-party winner counts with the per-party asset totals.
# all.x = TRUE keeps every party from sort_df1; parties with no row in
# sort_df4 get NA in total_assets_.
l_join <- merge(x = sort_df1, y = sort_df4, by = "Party", all.x = TRUE)

# Monte Carlo estimate: draw one row at random per iteration and count how
# often that party's total assets exceed 300000.
iterations <- 1000
condition_counter <- 0
for (i in seq_len(iterations)) {
  random_row <- l_join[sample(nrow(l_join), 1), ]
  # A plain `if` replaces ifelse(), which is meant for vectors and was being
  # used only for the side effect of its branches. isTRUE() makes the NA case
  # explicit: a party with missing assets does not count towards the total,
  # which matches what the ifelse() version did implicitly.
  if (isTRUE(random_row$total_assets_ > 300000)) {
    condition_counter <- condition_counter + 1
  }
}
estimated_probability <- condition_counter / iterations
cat("Estimated probability of the following example is:", estimated_probability)
## Estimated probability of the following example is: 0.077