df <- read.csv("cabg_perfmeasures.csv")
table(df$PerformanceMeasure)
##
## AAA Repair Endo Unrupture AAA Repair Open Unrupture
## 638 638
## Acute Stroke Acute Stroke Hemorrhagic
## 1598 1598
## Acute Stroke Ischemic Acute Stroke Subarachnoid
## 1598 1598
## AMI Carotid Endarterectomy
## 1598 1598
## Elective PCI Emergency CABG Elective PCI Mortality
## 69 69
## Elective PCI Stroke GI Hemorrhage
## 69 1598
## Heart Failure Hip Fracture
## 1598 1598
## Isolated CABG Operative Mortalit Pancreatic Resection
## 618 1598
## PCI Pneumonia
## 1598 1598
colSums(is.na(df))
## Year County Hospital
## 0 0 0
## OSHPDID system TypeofReport
## 0 0 0
## PerformanceMeasure NumberofAdverseEvents NumberofCases
## 0 5912 5912
## Risk.adjusted.Rate HospitalRatings Longitude
## 6005 0 98
## Latitude
## 98
outlier_values <- boxplot(df$NumberofAdverseEvents)$out

outlier_rows <- which(df$NumberofAdverseEvents %in% outlier_values)
print(paste("Row numbers of outliers:", paste(outlier_rows, collapse = ", ")))
## [1] "Row numbers of outliers: 66, 90, 91, 160, 204, 218, 225, 246, 352, 354, 367, 380, 386, 394, 395, 401, 410, 420, 606, 608, 618, 619, 620, 630, 631, 632, 644, 645, 646, 658, 670, 676, 682, 683, 694, 696, 700, 711, 712, 717, 728, 729, 738, 802, 1030, 1032, 1033, 1046, 1052, 1058, 1059, 1061, 1065, 1069, 1074, 1075, 1080, 1088, 1089, 1095, 1099, 1357, 1358, 1359, 1369, 1370, 1371, 1375, 1381, 1382, 1383, 1387, 1395, 1396, 1397, 1401, 1409, 1410, 1411, 1419, 1498, 1507, 1526, 1533, 1548, 1567, 1950, 1967, 1971, 2022, 2023, 2024, 2025, 2026, 2029, 2035, 2036, 2037, 2038, 2042, 2048, 2049, 2050, 2051, 2055, 2063, 2064, 2065, 2066, 2069, 2070, 2078, 2079, 2080, 2081, 2085, 2089, 2155, 2156, 2162, 2166, 2168, 2169, 2175, 2181, 2182, 2188, 2192, 2196, 2197, 2203, 2207, 2211, 2212, 2217, 2218, 2222, 2695, 2929, 2930, 2942, 2943, 2955, 2956, 2962, 2970, 2971, 2972, 2977, 2985, 2986, 2996, 3188, 3318, 3319, 3320, 3321, 3325, 3331, 3332, 3333, 3334, 3338, 3344, 3345, 3346, 3360, 3361, 3374, 3375, 3385, 3582, 3838, 3841, 3851, 3853, 3854, 3855, 3864, 3867, 3877, 3881, 3882, 3892, 3896, 3897, 3907, 3910, 3935, 3966, 4044, 4109, 4112, 4125, 4311, 4463, 4527, 4591, 4594, 4619, 4634, 4649, 4660, 4947, 4960, 4972, 4998, 5003, 5013, 5016, 5022, 5026, 5028, 5029, 5035, 5041, 5042, 5043, 5056, 5057, 5072, 5082, 5261, 5262, 5288, 5329, 5332, 5333, 5346, 5359, 5365, 5373, 5374, 5389, 5390, 5401, 5414, 5415, 5423, 5428, 5429, 5430, 5442, 5443, 5444, 5445, 5457, 5458, 5459, 5460, 5468, 5470, 5483, 5496, 5511, 5512, 5526, 5536, 5538, 5551, 5579, 5594, 5605, 5607, 5608, 5614, 5620, 5621, 5627, 5629, 5633, 5634, 5640, 5648, 5649, 5650, 5651, 5655, 5657, 5664, 5665, 5670, 5674, 5677, 5678, 5679, 5680, 5684, 5690, 5691, 5692, 5693, 5697, 5703, 5704, 5705, 5706, 5710, 5718, 5719, 5720, 5721, 5725, 5733, 5734, 5735, 5736, 5740, 5790, 5938, 5939, 5940, 5951, 5952, 5954, 5964, 5965, 5966, 5967, 5971, 5979, 5980, 5981, 5982, 5994, 5995, 6001, 6005, 6238, 6307, 6371, 6374, 6375, 6376, 6386, 6387, 6388, 6399, 6400, 6401, 6402, 6415, 6416, 6417, 6430, 6431, 6432, 6440, 6442, 6443, 6444, 6455, 6456, 6458, 6468, 6469, 6470, 6475, 6484, 6485, 6486, 6490, 6499, 6500, 6501, 6509, 6573, 6638, 6639, 6640, 6641, 6645, 6647, 6651, 6652, 6653, 6654, 6655, 6658, 6660, 6664, 6665, 6666, 6667, 6671, 6673, 6679, 6680, 6681, 6682, 6686, 6688, 6694, 6695, 6696, 6701, 6703, 6705, 6708, 6720, 6721, 6733, 6734, 6735, 6736, 6748, 6749, 6750, 6751, 6764, 6774, 6928, 6929, 6930, 6931, 6941, 6942, 6943, 6944, 6954, 6955, 6956, 6957, 6969, 6970, 6971, 6972, 6976, 6985, 6986, 6987, 6988, 6995, 6998, 6999, 7000, 7011, 7012, 7024, 7025, 7026, 7027, 7039, 7040, 7041, 7042, 7055, 7056, 7057, 7065, 7067, 7079, 7129, 7257, 7385, 7513, 7514, 7515, 7527, 7528, 7540, 7541, 7556, 7581, 7598, 7626, 7641, 7651, 7654, 7656, 7660, 7667, 7669, 7680, 7682, 7695, 7697, 7701, 7710, 7720, 7855, 7856, 7863, 7868, 7876, 7880, 7881, 7889, 7895, 7896, 7902, 7904, 7911, 7989, 8215, 8320, 8322, 8362, 8388, 8403, 8404, 8417, 8432, 8433, 8446, 8447, 8460, 8461, 8473, 8474, 8479, 8486, 8487, 8500, 8501, 8516, 8517, 8522, 8526, 8685, 8686, 8687, 8688, 8698, 8699, 8711, 8712, 8714, 8726, 8727, 8728, 8741, 8742, 8880, 8946, 9077, 9103, 9118, 9594, 9724, 9737, 9750, 9771, 9780, 9790, 9858, 9871, 9899, 9914, 9924, 10391, 10458, 10459, 10471, 10472, 10473, 10484, 10485, 10486, 10499, 10500, 10501, 10515, 10516, 10525, 10596, 10597, 10603, 10610, 10611, 10622, 10623, 10624, 10629, 10637, 10638, 10639, 10644, 10652, 10653, 10659, 10663, 10796, 10811, 10826, 10828, 10843, 10844, 10860, 10861, 10870, 10937, 10939, 10949, 10950, 10963, 10964, 10977, 10978, 10979, 10980, 10992, 10993, 10994, 10995, 11003, 11005, 11006, 11007, 11018, 11019, 11020, 11031, 11032, 11045, 11046, 11136, 11203, 11216, 11222, 11229, 11244, 11246, 11250, 11259, 11336, 11348, 11349, 11361, 11362, 11376, 11377, 11383, 11392, 11398, 11402, 11404, 11405, 11417, 11418, 11419, 11420, 11430, 11431, 11432, 11433, 11445, 11446, 11460, 11461, 11463, 11471, 11567, 11570, 11583, 11596, 11611, 11626, 11651, 11663, 11675, 11681, 11689, 11713, 11846, 11848, 11852, 11860, 11861, 11867, 11876, 11893, 11910, 11912, 11920, 11925, 11927, 11931, 11939, 11940, 11946, 11955, 11961, 11978, 11989, 11995, 11999, 12261, 12263, 12264, 12266, 12276, 12277, 12278, 12289, 12290, 12291, 12292, 12304, 12305, 12306, 12307, 12319, 12320, 12321, 12322, 12330, 12332, 12333, 12343, 12346, 12359, 12360, 12374, 12389, 12399, 12463, 12661, 12663, 12664, 12665, 12672, 12676, 12677, 12678, 12685, 12689, 12690, 12691, 12692, 12698, 12704, 12705, 12707, 12713, 12719, 12720, 12721, 12722, 12730, 13000, 13012, 13026, 13040, 13052, 13053, 13064, 13076, 13077, 13090, 13091, 13104, 13105, 13143, 13156, 13169, 13170, 13185, 13200, 13212, 13225, 13234, 13238, 13247, 13253, 13262, 13268, 13277, 13279, 13282, 13283, 13284, 13294, 13295, 13296, 13306, 13307, 13308, 13320, 13321, 13322, 13334, 13335, 13336, 13345, 13354, 13358, 13365, 13367, 13371, 13380, 13386, 13393, 13401, 13408, 13410, 13414, 13415, 13416, 13417, 13421, 13427, 13428, 13429, 13430, 13431, 13434, 13440, 13441, 13442, 13443, 13444, 13455, 13456, 13457, 13458, 13470, 13471, 13472, 13473, 13474, 13477, 13481, 13549, 13550, 13555, 13562, 13563, 13564, 13568, 13575, 13576, 13590, 13591, 13596, 13605, 13616, 13617, 13623, 13628, 13629, 13635, 13641, 13642, 13644, 13648, 13656, 13657, 13663, 13672, 13673, 13678, 13704, 13719, 13725, 13735, 13736, 13742, 13763, 14085, 14086, 14087, 14092, 14098, 14099, 14100, 14101, 14105, 14112, 14113, 14114, 14118, 14127, 14128, 14129, 14133, 14142, 14144, 14148, 14152, 14153, 14154, 14155, 14156, 14160, 14166, 14167, 14168, 14169, 14173, 14179, 14180, 14181, 14182, 14183, 14188, 14194, 14195, 14196, 14197, 14201, 14203, 14209, 14210, 14211, 14216, 14218, 14299, 14311, 14325, 14339, 14349, 14351, 14352, 14365, 14377, 14378, 14379, 14392, 14393, 14407, 14408, 14418, 14484, 14485, 14497, 14498, 14499, 14510, 14511, 14525, 14526, 14527, 14540, 14541, 14551, 14553, 14579, 14620, 14886, 14898, 14899, 14910, 14924, 14925, 14938, 14939, 14948, 15147, 15153, 15157, 15160, 15166, 15172, 15173, 15179, 15187, 15188, 15190, 15203, 15205, 15213, 15216, 15217, 15218, 15228, 15229, 15230, 15231, 15237, 15241, 15242, 15243, 15244, 15247, 15256, 15257, 15258, 15259, 15272, 15273, 15274, 15282, 15284, 15286, 15290, 15296, 15302, 15308, 15314, 15322, 15324, 15328, 15336, 15338, 15342, 15346, 15348, 15349, 15350, 15355, 15361, 15362, 15363, 15374, 15375, 15376, 15381, 15389, 15390, 15391, 15392, 15396, 15405, 15406, 15411, 15415, 15417, 15418, 15419, 15420, 15424, 15426, 15430, 15431, 15432, 15433, 15437, 15443, 15444, 15445, 15446, 15450, 15458, 15459, 15460, 15461, 15465, 15473, 15474, 15475, 15476, 15480, 15484, 15549, 15550, 15551, 15552, 15556, 15558, 15562, 15563, 15564, 15565, 15571, 15575, 15576, 15577, 15578, 15579, 15582, 15584, 15590, 15591, 15592, 15593, 15597, 15599, 15605, 15606, 15607, 15608, 15612, 15614, 15616, 15620, 15633, 15645, 15646, 15661, 15662, 15663, 15676, 15677, 15686, 15687, 15688, 15699, 15700, 15706, 15711, 15712, 15718, 15725, 15726, 15732, 15740, 15750, 15752, 15765, 15771, 15778, 15793, 15807, 15808, 15818, 16019, 16045, 16140, 16141, 16147, 16154, 16160, 16166, 16167, 16173, 16195, 16197, 16207, 16209, 16219, 16221, 16233, 16235, 16247, 16259, 16260, 16271, 16283, 16284, 16297, 16311, 16312, 16313, 16492, 16493, 16505, 16517, 16518, 16519, 16524, 16532, 16533, 16535, 16536, 16539, 16548, 16549, 16558, 16626, 16632, 16646, 16650, 16890, 16891, 16892, 16903, 16904, 16912, 16916, 16917, 16923, 16925, 16931, 16932, 16946, 16955, 17149, 17539, 17552, 17580, 17609, 17650, 17665, 17747, 17748, 17749, 17759, 17760, 17761, 17771, 17772, 17773, 17785, 17786, 17799, 17800, 17801, 17939, 17952, 18008, 18010, 18014, 18021, 18023, 18034, 18035, 18036, 18048, 18049, 18050, 18064, 18065, 18066, 18074, 18141, 18142, 18143, 18144, 18145, 18148, 18155, 18156, 18157, 18167, 18168, 18169, 18183, 18184, 18185, 18198, 18211, 18224, 18237, 18252, 18277, 18279, 18285, 18292, 18293, 18298, 18305, 18320, 18335, 18345, 18415, 18417, 18430, 18487, 18489, 18500, 18502, 18506, 18513, 18515, 18519, 18528, 18530, 18543, 18545, 18549, 18553, 18599, 18605, 18626, 18692, 18693, 18699, 18705, 18712, 18718, 18719, 18725, 18733, 18734, 18740, 18748, 18755, 18759, 18774, 18793, 19025, 19027, 19028, 19029, 19034, 19040, 19041, 19043, 19047, 19054, 19055, 19056, 19060, 19069, 19071, 19075, 19084, 19086, 19090, 19094, 19263, 19291, 19381, 19393, 19424, 19434, 19436, 19448, 19627, 19628, 19654, 19655, 19669, 19670, 19671, 19675, 19684, 19690, 19694, 19944, 19945, 19946, 19957, 19958, 19959, 19970, 19971, 19972, 19973, 19985, 19986, 19987, 19988, 19992, 20000, 20001, 20002, 20003, 20007, 20011, 20089, 20091, 20092, 20117, 20124, 20139, 20147, 20158, 20351, 20352, 20357, 20358, 20360, 20362, 20364, 20365, 20367, 20370, 20371, 20373, 20375, 20377, 20378, 20379, 20384, 20386, 20388, 20392, 20393, 20394, 20399, 20407, 20408, 20414, 20418, 20486, 20616, 20750, 20751, 20752, 20763, 20764, 20765, 20769, 20776, 20778, 20791, 20793, 20806, 20816, 21055, 21070, 21072, 21209, 21235, 21242, 21246, 21250, 21257, 21276"
count_outliers <- length(boxplot(df$NumberofAdverseEvents)$out)

duplicate_records <- df[duplicated(df), ]
if (nrow(duplicate_records) > 0) {
print("Duplicate records found:")
print(duplicate_records)
} else {
print("No duplicate records found.")
}
## [1] "No duplicate records found."
![]()
newdf <- subset(df, PerformanceMeasure == "Pneumonia")
table(newdf$PerformanceMeasure)
##
## Pneumonia
## 1598