cat(“# Section 1: Data Loading and Exploration”)

library(rmarkdown)

level = c(1,2,3,4,5) title = c(‘Dataset Exploration’, ‘Plotting and Visualization’, ‘Model Creation’,‘PCA’,‘Conclusion’ )

for(i in 1:length(level)){ cat(“##”, rep(‘#’, level[i]), title[i],‘’) }


data_frame=read.csv('job.csv')
tail(data_frame)
NA

Dataset Summary

Rows: 215
Columns: 8
$ sl_no           <int> 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14~
$ gender          <chr> "M", "M", "M", "M", "M", "M", "F", "M", "M", ~
$ ssc.grade       <dbl> 67.00, 79.33, 65.00, 56.00, 85.80, 55.00, 46.~
$ hsc.grade       <dbl> 91.00, 78.33, 68.00, 52.00, 73.60, 49.80, 49.~
$ Subject         <chr> "Commerce", "Science", "Arts", "Science", "Co~
$ bachelor.grade  <dbl> 58.00, 77.48, 64.00, 52.00, 73.30, 67.25, 79.~
$ work.experience <chr> "No", "Yes", "No", "No", "No", "Yes", "No", "~
$ status          <chr> "Placed", "Placed", "Placed", "Not Placed", "~

library(plotly)
library(ggplot2)
gg_box_plot=ggplot(data_frame,aes(y=hsc.grade,x=status))+
geom_boxplot(fill=c('red','green'),alpha=0.5)
gg_box_plot

ggplotly(gg_box_plot)
LS0tDQp0aXRsZTogIlByb2plY3QgUGFydCAtIDIiDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQpjYXQoIiMgU2VjdGlvbiAxOiBEYXRhIExvYWRpbmcgYW5kIEV4cGxvcmF0aW9uXG5cbiIpDQoNCg0KbGlicmFyeShybWFya2Rvd24pDQoNCmxldmVsID0gYygxLDIsMyw0LDUpDQp0aXRsZSA9IGMoJ0RhdGFzZXQgRXhwbG9yYXRpb24nLCAnUGxvdHRpbmcgYW5kIFZpc3VhbGl6YXRpb24nLCAnTW9kZWwgQ3JlYXRpb24nLCdQQ0EnLCdDb25jbHVzaW9uJyApDQoNCg0KZm9yKGkgaW4gMTpsZW5ndGgobGV2ZWwpKXsNCmNhdCgiIyMiLCByZXAoJyMnLCBsZXZlbFtpXSksIHRpdGxlW2ldLCdcbicpDQp9DQoNCmBgYHtyfQ0KDQpkYXRhX2ZyYW1lPXJlYWQuY3N2KCdqb2IuY3N2JykNCnRhaWwoZGF0YV9mcmFtZSkNCg0KYGBgDQojIERhdGFzZXQgU3VtbWFyeQ0KDQpgYGB7ciBlY2hvPUZBTFNFfQ0KbGlicmFyeShkcGx5cikNCmdsaW1wc2UoZGF0YV9mcmFtZSkNCmBgYA0KDQpgYGB7cn0NCg0KbGlicmFyeShwbG90bHkpDQpsaWJyYXJ5KGdncGxvdDIpDQpnZ19ib3hfcGxvdD1nZ3Bsb3QoZGF0YV9mcmFtZSxhZXMoeT1oc2MuZ3JhZGUseD1zdGF0dXMpKSsNCmdlb21fYm94cGxvdChmaWxsPWMoJ3JlZCcsJ2dyZWVuJyksYWxwaGE9MC41KQ0KZ2dfYm94X3Bsb3QNCmdncGxvdGx5KGdnX2JveF9wbG90KQ0KYGBgDQoNCg0KDQo=