Load and clean health profile data

require(imputeMissings); library(factoextra)
Loading required package: imputeMissings
Loading required package: ggplot2

Attaching package: ‘ggplot2’

The following objects are masked _by_ ‘.GlobalEnv’:

    diamonds, economics, mpg

The following object is masked from ‘package:kernlab’:

    alpha
# Read the raw health profile table from the local CSV file.
profile <- read.csv("~/Documents/R_projects/profiles/profile.csv")

# Use the `area` column as row names so every row is labelled by its area.
rownames(profile) <- profile$area

# Random-forest imputation draws random numbers; fixing the seed makes the
# imputed values (and everything computed from them) identical across runs.
set.seed(123)

# Drop columns 1, 2 and 7 by position, then fill the remaining missing
# values with imputeMissings::impute() using its random-forest method.
profile <- impute(profile[, -c(1:2, 7)], method = "randomForest")

# Preview the first rows of the cleaned, imputed data.
head(profile)

Correlations

Clustering and kmeans

LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OgogIGh0bWxfbm90ZWJvb2s6IGRlZmF1bHQKICBwZGZfZG9jdW1lbnQ6CiAgICBudW1iZXJfc2VjdGlvbnM6IHllcwogICAgdG9jOiB5ZXMKLS0tCgojI0xvYWQgYW5kIGNsZWFuIGhlYWx0aCBwcm9maWxlIGRhdGEKCmBgYHtyLCBjYWNoZT1UUlVFfQpyZXF1aXJlKGltcHV0ZU1pc3NpbmdzKTsgbGlicmFyeShmYWN0b2V4dHJhKQpwcm9maWxlIDwtIHJlYWQuY3N2KCJ+L0RvY3VtZW50cy9SX3Byb2plY3RzL3Byb2ZpbGVzL3Byb2ZpbGUuY3N2IikKcm93bmFtZXMocHJvZmlsZSkgPC0gcHJvZmlsZSRhcmVhCnByb2ZpbGUgPC0gaW1wdXRlKHByb2ZpbGVbLCAtYygxOjIsNyldLCBtZXRob2QgPSAicmFuZG9tRm9yZXN0IikKCmhlYWQocHJvZmlsZSkKYGBgCiMjIENvcnJlbGF0aW9ucwoKYGBge3J9CnJlcXVpcmUoY29ycnBsb3QpCmNvcnJwbG90KGNvcihwcm9maWxlKSwgbWV0aG9kID0gJ2VsbGlwc2UnLCB0bC5jZXggPSAwLjUsIHRsLmNvbCA9ICJibGFjayIsIGFkZHJlY3QgPSA3LCBvcmRlciA9ICJoY2x1c3QiLCBhZGRncmlkLmNvbCA9IE5BKQpgYGAKCiMjQ2x1c3RlcmluZyBhbmQga21lYW5zCgpgYGB7ciwgZWNobz1GQUxTRSwgbWVzc2FnZT1GQUxTRSwgd2FybmluZz1GQUxTRX0KbGlicmFyeShGYWN0b01pbmVSKQpkZiA8LSBkYXRhLmZyYW1lKHNjYWxlKHByb2ZpbGUpKQoKZnZpel9wY2FfdmFyKFBDQShkZiksIGxhYmVsc2l6ZSA9IDIsIHJlcGVsID0gVFJVRSkKc2V0LnNlZWQoMTIzKQpyZXMgPC0gaGttZWFucyhkZiwgNCwgaXRlci5tYXggPSAyNSkKaGttZWFuc190cmVlKHJlcywgY2V4ID0gMC4zKQpmdml6X2RlbmQocmVzLCBjZXggPSAwLjI1KQpmdml6X2NsdXN0ZXIocmVzLCBmcmFtZS50eXBlID0gIm5vcm0iLCBmcmFtZS5sZXZlbCA9IDAuOCwgbGFiZWxzaXplID0gMikKYGBgCgoKCg==