Initial Setup

#including libs
library(dplyr)
library(ggplot2)

# Import the raw occupation data (path is relative to the working directory).
occupation <- read.csv("occupation_data.csv")

# Keep only the rows that have no missing (NA) value in any column.
occupation_complete <- occupation[complete.cases(occupation), ]

# `cleandata` is the same NA-free data under a second name. It is kept as an
# alias so code referring to either name keeps working, while the
# complete-case filter is computed only once.
cleandata <- occupation_complete

# Restrict the cleaned data to rows in the "OFFICE" occupation category.
just_office <- cleandata %>% filter(occupation_category == "OFFICE")

Printout of Number of Categories


# Count the rows belonging to each occupation category and print the result.
table(occupation_complete[["occupation_category"]])

           AGRICULTURAL                    ARTS                BUSINESS           COMPUTATIONAL 
                      1                       3                      12                       7 
               CULINARY               EDUCATION             ENGINEERING          GROUNDSKEEPING 
                      7                       4                       2                       3 
HEALTHCARE PROFESSIONAL      HEALTHCARE SUPPORT                   LEGAL              MANAGEMENT 
                      7                       1                       1                      16 
                 OFFICE              PRODUCTION      PROTECTIVE SERVICE                   SALES 
                     17                      11                       3                      11 
                SCIENCE                 SERVICE          SOCIAL SERVICE          TRANSPORTATION 
                      3                       3                       3                       4 
# The frequency table shows how many rows fall into each occupation category.
LS0tCnRpdGxlOiAiT2NjdXBhdGlvbmFsIERhdGEgR3JhcGhzIgpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sKZWRpdG9yX29wdGlvbnM6IAogIG1hcmtkb3duOiAKICAgIHdyYXA6IDcyCi0tLQoKCiMjIEluaXRpYWwgU2V0dXAKYGBge3J9CiNpbmNsdWRpbmcgbGlicwpsaWJyYXJ5KGRwbHlyKQpsaWJyYXJ5KGdncGxvdDIpCgojaW1wb3J0aW5nIGRhdGEKb2NjdXBhdGlvbiA8LSByZWFkLmNzdigib2NjdXBhdGlvbl9kYXRhLmNzdiIpCgoKb2NjdXBhdGlvbl9jb21wbGV0ZSA8LSBvY2N1cGF0aW9uW2NvbXBsZXRlLmNhc2VzKG9jY3VwYXRpb24pLF0KI3JlbW92aW5nIGFsbCBudWxsIHZhbHVlcwpjbGVhbmRhdGEgPC0gb2NjdXBhdGlvbltjb21wbGV0ZS5jYXNlcyhvY2N1cGF0aW9uKSxdCgojZmlsdGVyIGRhdGEgZm9yIG9mZmljZSB3b3JrZXJzIG9ubHkKanVzdF9vZmZpY2UgPC0gY2xlYW5kYXRhICU+JSBmaWx0ZXIob2NjdXBhdGlvbl9jYXRlZ29yeSA9PSAiT0ZGSUNFIikKCgpgYGAKCgojIyBQcmludG91dCBvZiBOdW1iZXIgb2YgQ2F0ZWdvcmllcwpgYGB7cn0KCiNwcmludCBjb3VudCBvZiBvY2NfY2F0ZWdvcnkKdGFibGUob2NjdXBhdGlvbl9jb21wbGV0ZSRvY2N1cGF0aW9uX2NhdGVnb3J5KQojdXNpbmcgYSBmcmVxdWVuY3kgdGFibGUgdG8gYXNzZXNzIHRoZSBudW1iZXIgb2YgY2F0ZWdvcmllcyAKYGBgCgoKCiMjIFByaW50IEdyYXBoIE4xCnRoaXMgZ3JhcGggc2hvd3MgdGhlIGRpc3RyaWJ1dGlvbiBvZiBlYXJuaW5ncyBmb3IgZWFjaCBjYXRlZ29yeQpgYGB7cn0KaGlzdChvY2N1cGF0aW9uX2NvbXBsZXRlJEFsbF93ZWVrbHksIGJyZWFrcyA9IDQwLCBjb2wgPSAibGlnaHRwaW5rIiwgbWFpbiA9ICJEaXN0cmlidXRpb24gb2YgRWFybmluZ3MgLSBBbGwgQ2F0ZWdvcmllcyIsCiAgICAgeGxhYiA9ICJXZWVrbHkgRWFybmluZ3MiLCB5bGFiID0gIkZyZXF1ZW5jeSIpCmBgYAoKCiMgUHJpbnQgSGlzdG9ncmFtCmBgYHtyfQojSElTVE9HUkFNLS12aXN1YWxpemVzIHRoZSBkaXN0cmlidXRpb24gb2YgZWFybmluZ3Mgd2l0aGluIHRoZSBjYXRlZ29yeSBmb3IgYm90aCBnZW5kZXJzCgptYW5hZ2VtZW50IDwtIG9jY3VwYXRpb25fY29tcGxldGUgJT4lIGZpbHRlcihvY2N1cGF0aW9uX2NhdGVnb3J5ICVpbiUgKCJNQU5BR0VNRU5UIikpICNmaWx0ZXJpbmcgbWFuYWdlbWVudCBvY2N1cGF0aW9ucyBvbmx5Cm1hbmFnZW1lbnRfZWFybmluZ3MgPC0gbWFuYWdlbWVudCRBbGxfd2Vla2x5ICNzYXZpbmcgdGhlIHZhbHVlcyBpbiBhIHZlY3RvciBhcyByZWZlcmVuY2UKCmhpc3QobWFuYWdlbWVudCRBbGxfd2Vla2x5LCBicmVha3MgPSAxMCwgY29sID0gImxpZ2h0eWVsbG93IiwgbWFpbiA9ICJEaXN0cmlidXRpb24gb2YgRWFybmluZ3MgLSBNYW5hZ2VtZW50IiwKICAgICB4bGFiID0gIldlZWtseSBFYXJuaW5ncyIsIHlsYWIgPSAiRnJlcXVlbmN5IikKCiN0aGUgZGF0YSBwb2ludHMgYWxsIGFwcGVhciB0byBmYWxsIGludG8gdGhlIHNhbWUg
cmFuZ2Ugb2YgZnJlcXVlbmN5IQoKYGBgCgpgYGB7cn0KI0JhciBQbG90LS1pbnZlc3RpZ2F0ZXMgdGhlIGdlbmRlciBiYWxhbmNlIGFjcm9zcyBkaWZmZXJlbnQgb2NjdXBhdGlvbnMgd2l0aGluIHRoZSBjYXRlZ29yeQoKI3N1bSB0aGUgY291bnRzIG9mIGZlbWFsZXMgJiBtYWxlcwpmZW1hbGVfY291bnQgPC0gc3VtKG1hbmFnZW1lbnQkRl93b3JrZXJzKSAKbWFsZV9jb3VudCA8LSBzdW0obWFuYWdlbWVudCRNX3dvcmtlcnMpCgojY3JlYXRlIGEgZGF0YSBmcmFtZSB3aXRoIGdlbmRlciBjb3VudHMKZ2VuZGVyX2RhdGEgPC0gZGF0YS5mcmFtZShHZW5kZXIgPSBjKCJGZW1hbGUiLCAiTWFsZSIpLAogICAgICAgICAgICAgICAgICAgICAgICAgIENvdW50ID0gYyhmZW1hbGVfY291bnQsIG1hbGVfY291bnQpKQoKZ2dwbG90KGRhdGEgPSBnZW5kZXJfZGF0YSwgYWVzKHggPSBHZW5kZXIsIHkgPSBDb3VudCwgZmlsbCA9IEdlbmRlcikpICsKICBnZW9tX2JhcihzdGF0ID0gImlkZW50aXR5Iiwgd2lkdGggPSAwLjYpICsKICBsYWJzKHRpdGxlID0gIkdlbmRlciBCYWxhbmNlIGluIE1hbmFnZW1lbnQiLAogICAgICAgeCA9ICJHZW5kZXIiLCB5ID0gIkNvdW50IikgKwogIHNjYWxlX2ZpbGxfbWFudWFsKHZhbHVlcyA9IGMoInBpbmsiLCAic2t5Ymx1ZSIpKSArCiAgdGhlbWVfbWluaW1hbCgpCmBgYAo=