Rows: 72
Columns: 31
$ npi <dbl> 1003042540, 1033598263, 1003009861, 1639239015, 1003012444, 1013649623, 1255577508, 1083798…
$ entity_type <int> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1…
$ first_name <chr> "VERONICA", "VERONICA", "MOUSTAFA", "JAIME", "ANDREW", "ANDREW", "ANDREW", "ANDREW", "LAKSH…
$ last_name_leg <chr> "COMBS", "COMBS", "BANNA", "MICHEL", "PICEL", "PRICE", "PRICE", "PICHLER", "SRINIVASAN", "S…
$ last_name <chr> "COMBS", "COMBS", "BANNA", "MICHEL", "PICEL", "PRICE", "PRICE", "PICHLER", "SRINIVASAN", "S…
$ org_name <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,…
$ state <chr> "AR", "AR", "AZ", "AZ", "CA", "CA", "CA", "CA", "CA", "CA", "CA", "CO", "CO", "CO", "CO", "…
$ city <chr> "HARRISON", "WEST MEMPHIS", "PEORIA", "YUMA", "STANFORD", "RIVERSIDE", "OAKLAND", "CARMICHA…
$ tax_code_1 <chr> "1041C0700X", "104100000X", "207RC0000X", "2084A0401X", "2085R0202X", "152WC0802X", "101Y00…
$ tax_code_2 <chr> NA, NA, NA, "2084P0800X", "2085R0204X", "152WL0500X", NA, NA, NA, "207Q00000X", "2085R0202X…
$ tax_code_3 <chr> NA, NA, NA, NA, NA, "152WP0200X", NA, NA, NA, NA, NA, NA, NA, NA, "363A00000X", NA, NA, NA,…
$ tax_code_4 <chr> NA, NA, NA, NA, NA, "152WS0006X", NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, N…
$ tax_code_5 <chr> NA, NA, NA, NA, NA, "152WV0400X", NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, N…
$ state_part <chr> "AR", "AR", "AZ", "AZ", "CA", "CA", "CA", "CA", "CA", "CA", "CA", "CO", "CO", "CO", "CO", "…
$ lname_initial <chr> "C", "C", "B", "M", "P", "P", "P", "P", "S", "S", "S", "B", "B", "C", "C", "H", "H", "H", "…
$ name_for_initial <chr> "COMBS", "COMBS", "BANNA", "MICHEL", "PICEL", "PRICE", "PRICE", "PICHLER", "SRINIVASAN", "S…
$ lname <chr> "COMBS", "COMBS", "BANNA", "MICHEL", "PICEL", "PRICE", "PRICE", "PICHLER", "SRINIVASAN", "S…
$ cand_first_norm <chr> "VERONICA", "VERONICA", "MOUSTAFA", "JAIME", "ANDREW", "ANDREW", "ANDREW", "ANDREW", "LAKSH…
$ cand_last_norm <chr> "COMBS", "COMBS", "BANNA", "MICHEL", "PICEL", "PRICE", "PRICE", "PICHLER", "SRINIVASAN", "S…
$ cand_full_norm <chr> "VERONICA COMBS", "VERONICA COMBS", "MOUSTAFA BANNA", "JAIME MICHEL", "ANDREW PICEL", "ANDR…
$ cand_first_initial <chr> "V", "V", "M", "J", "A", "A", "A", "A", "L", "M", "E", "J", "J", "J", "J", "D", "D", "D", "…
$ cand_city_norm <chr> "HARRISON", "WEST MEMPHIS", "PEORIA", "YUMA", "STANFORD", "RIVERSIDE", "OAKLAND", "CARMICHA…
$ input_id <int> 47, 47, 13, 10, 27, 27, 27, 27, 28, 35, 48, 2, 2, 37, 37, 23, 23, 23, 18, 21, 21, 9, 9, 9, …
$ first_norm <chr> "VERONICA", "VERONICA", "MOUSTAFA", "JAIME", "ANDREW", "ANDREW", "ANDREW", "ANDREW", "LAKSH…
$ last_norm <chr> "COMBS", "COMBS", "BANNA", "MICHAELSON", "PICEL", "PICEL", "PICEL", "PICEL", "SRINIVASAN", …
$ city_norm <chr> "HARRISON", "HARRISON", "SUN CITY WEST", "TUBA CITY", "STANFORD", "STANFORD", "STANFORD", "…
$ jaro_winkler <dbl> 1.0000000, 1.0000000, 1.0000000, 0.9500000, 1.0000000, 0.9666667, 0.9666667, 0.9547619, 1.0…
$ exact_name <lgl> TRUE, TRUE, TRUE, FALSE, TRUE, FALSE, FALSE, FALSE, TRUE, TRUE, TRUE, TRUE, TRUE, TRUE, FAL…
$ city_match <lgl> TRUE, FALSE, FALSE, FALSE, TRUE, FALSE, FALSE, FALSE, TRUE, FALSE, FALSE, TRUE, FALSE, FALS…
$ rank_num <int> 1, 2, 2, 4, 1, 4, 4, 4, 1, 2, 2, 1, 2, 2, 3, 2, 4, 4, 2, 1, 4, 1, 2, 4, 1, 4, 1, 2, 1, 4, 4…
$ rank_label <chr> "Extremely Likely Match", "Very Likely Match", "Very Likely Match", "Possible Match", "Extr…