# Packages: summarytools provides dfSummary(), data.table provides fread().
library(summarytools)
## Warning: package 'summarytools' was built under R version 3.4.3
library(data.table)
## Warning: package 'data.table' was built under R version 3.4.2

# File names used below are relative to the 2010 crash CSV directory.
setwd("/Volumes/Seagate Backup Plus Drive/DataSets/LA_Data/Crash/csv/2010")

# Read the DOT table; "NA", empty, single-space and "NaN" fields become NA.
dat1 <- fread(
  "2010DOT_TB.csv",
  na.strings = c("NA", "", " ", "NaN")
)

# Row and column counts of the table just read.
dim(dat1)

[1] 147831 40

# Column-by-column summary of dat1: grid style, no graph column.
dfSummary(
  dat1,
  style = "grid",
  plain.ascii = FALSE,
  graph.col = FALSE
)
## Warning in as.POSIXlt.POSIXct(Sys.time()): unknown timezone 'zone/tz/2017c.
## 1.0/zoneinfo/America/Chicago'

Data Frame Summary

dat1
N: 147831

No Variable Stats / Values Freqs (% of Valid) Valid Missing

1

crash_num [character]

  1. `
  2. 0
  3. 0000004
  4. 0000012
  5. 0000013
  6. 0000015
  7. 0000016
  8. 0000021
  9. 0000029
  10. 0000031
    [ 147820 others ]

1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
147820 (0.0%)

147830 (100%)

1 (0%)

2

CRASH_NUM1 [character]

  1. LA10_
  2. LA10_ 4670557
  3. LA10_`
  4. LA10_0
  5. LA10_0000004
  6. LA10_0000012
  7. LA10_0000013
  8. LA10_0000015
  9. LA10_0000016
  10. LA10_0000021
    [ 147821 others ]

1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
147821 (0.0%)

147831 (100%)

0 (0%)

3

dotd_crash_num [integer]

mean (sd) : 110519842.9 (152445720.79)
min < med < max :
0 < 100010246 < 810903004
IQR (CV) : 119825577 (1.38)

147656 distinct val.

147805 (99.98%)

26 (0.02%)

4

hwy_type_cd [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. G

14339 ( 9.8%)
24562 (16.8%)
48442 (33.1%)
17567 (12.0%)
41398 (28.3%)
161 ( 0.1%)

146469 (99.08%)

1362 (0.92%)

5

pri_hwy_num [integer]

mean (sd) : 233.83 (649.78)
min < med < max :
0 < 14 < 8000
IQR (CV) : 98 (2.78)

974 distinct val.

146959 (99.41%)

872 (0.59%)

6

bypass_cd [character]

  1. Z
  2. X
  3. 2
  4. Y
  5. 3
  6. S
  7. B
  8. 1
  9. 9
  10. 6
    [ 8 others ]

2207 (41.1%)
1361 (25.3%)
385 ( 7.2%)
294 ( 5.5%)
271 ( 5.0%)
175 ( 3.3%)
148 ( 2.8%)
145 ( 2.7%)
131 ( 2.4%)
126 ( 2.4%)
130 ( 2.4%)

5373 (3.63%)

142458 (96.37%)

7

milepost [numeric]

mean (sd) : 44.5 (150.96)
min < med < max :
0 < 2.74 < 29124
IQR (CV) : 37.85 (3.39)

18223 distinct val.

147831 (100%)

0 (0%)

8

stl_route [character]

  1. I010
  2. 0190
  3. 0090
  4. 0061
  5. 0001
  6. 0090Z
  7. 0071
  8. 0080
  9. 0182
  10. I020
    [ 1055 others ]

7420 ( 8.4%)
3577 ( 4.0%)
3546 ( 4.0%)
3452 ( 3.9%)
2757 ( 3.1%)
2211 ( 2.5%)
2160 ( 2.4%)
2012 ( 2.3%)
1995 ( 2.3%)
1993 ( 2.2%)
57269 (64.0%)

88392 (59.79%)

59439 (40.21%)

9

adt [integer]

mean (sd) : 28670.78 (30035.63)
min < med < max :
0 < 20700 < 196600
IQR (CV) : 27800 (1.05)

725 distinct val.

88392 (59.79%)

59439 (40.21%)

10

control_section [character]

  1. 450-90
  2. 450-15
  3. 450-10
  4. 283-09
  5. 007-90
  6. 283-08
  7. 000-00
  8. 080-02
  9. 053-09
  10. 809-08
    [ 2126 others ]

1666 ( 1.9%)
1418 ( 1.6%)
1394 ( 1.6%)
1232 ( 1.4%)
1111 ( 1.3%)
975 ( 1.1%)
950 ( 1.1%)
934 ( 1.1%)
779 ( 0.9%)
778 ( 0.9%)
76322 (85.6%)

87559 (59.23%)

60272 (40.77%)

11

dotd_district [integer]

mean (sd) : 20.7 (26.39)
min < med < max :
2 < 4 < 62
IQR (CV) : 59 (1.27)

2 : 41730 (28.2%)
3 : 21409 (14.5%)
4 : 16771 (11.3%)
5 : 7834 ( 5.3%)
7 : 8229 ( 5.6%)
8 : 8058 ( 5.5%)
58 : 835 ( 0.6%)
61 : 27491 (18.6%)
62 : 15459 (10.5%)

147816 (99.99%)

15 (0.01%)

12

functional_class [integer]

mean (sd) : 12.19 (4.26)
min < med < max :
0 < 14 < 19
IQR (CV) : 3 (0.35)

13 distinct val.

88392 (59.79%)

59439 (40.21%)

13

highway_class [integer]

mean (sd) : 5.52 (2.19)
min < med < max :
1 < 6 < 8
IQR (CV) : 2 (0.4)

1 : 12467 (14.4%)
2 : 248 ( 0.3%)
3 : 1677 ( 1.9%)
4 : 2740 ( 3.2%)
5 : 18906 (21.8%)
6 : 10698 (12.3%)
7 : 28301 (32.7%)
8 : 11581 (13.4%)

86618 (58.59%)

61213 (41.41%)

14

logmile [numeric]

mean (sd) : 5.27 (5.62)
min < med < max :
0 < 3.58 < 60.43
IQR (CV) : 5.72 (1.07)

3054 distinct val.

87559 (59.23%)

60272 (40.77%)

15

logmile_from [numeric]

mean (sd) : 4.61 (5.49)
min < med < max :
0 < 3 < 55.23
IQR (CV) : 5.7 (1.19)

1625 distinct val.

88392 (59.79%)

59439 (40.21%)

16

logmile_to [numeric]

mean (sd) : 5.86 (5.84)
min < med < max :
0 < 4.26 < 60.96
IQR (CV) : 6.38 (1)

1761 distinct val.

88392 (59.79%)

59439 (40.21%)

17

latitude [numeric]

mean (sd) : 30.52 (2.69)
min < med < max :
-37.6 < 30.36 < 39.94
IQR (CV) : 0.68 (0.09)

65064 distinct val.

117341 (79.38%)

30490 (20.62%)

18

longitude [numeric]

mean (sd) : -91.4 (3.45)
min < med < max :
-99.17 < -91.15 < 0
IQR (CV) : 1.76 (-0.04)

71682 distinct val.

117292 (79.34%)

30539 (20.66%)

19

median_width [integer]

mean (sd) : 27.39 (56.27)
min < med < max :
0 < 10 < 299
IQR (CV) : 32 (2.05)

75 distinct val.

88392 (59.79%)

59439 (40.21%)

20

milepoint [numeric]

mean (sd) : 64.64 (84.82)
min < med < max :
0 < 19.43 < 431.36
IQR (CV) : 99.06 (1.31)

17804 distinct val.

86618 (58.59%)

61213 (41.41%)

21

milepost_from [numeric]

mean (sd) : 70.58 (113.85)
min < med < max :
0 < 19.73 < 908.06
IQR (CV) : 94.7 (1.61)

4501 distinct val.

88392 (59.79%)

59439 (40.21%)

22

milepost_to [numeric]

mean (sd) : 72.2 (113.81)
min < med < max :
0 < 20.98 < 908.68
IQR (CV) : 93.73 (1.58)

4652 distinct val.

88392 (59.79%)

59439 (40.21%)

23

num_lanes [integer]

mean (sd) : 3.48 (1.43)
min < med < max :
0 < 4 < 8
IQR (CV) : 2 (0.41)

9 distinct val.

88392 (59.79%)

59439 (40.21%)

24

parish_cd [integer]

mean (sd) : 28.9 (15.57)
min < med < max :
0 < 28 < 64
IQR (CV) : 20 (0.54)

65 distinct val.

146980 (99.42%)

851 (0.58%)

25

pavement_type [integer]

mean (sd) : 61.44 (9.98)
min < med < max :
0 < 60 < 80
IQR (CV) : 10 (0.16)

6 distinct val.

88392 (59.79%)

59439 (40.21%)

26

pavement_width [integer]

mean (sd) : 41.97 (18.35)
min < med < max :
0 < 48 < 99
IQR (CV) : 24 (0.44)

73 distinct val.

88392 (59.79%)

59439 (40.21%)

27

section_length [numeric]

mean (sd) : 1.77 (1.91)
min < med < max :
0 < 1.13 < 17.4
IQR (CV) : 1.76 (1.08)

849 distinct val.

88392 (59.79%)

59439 (40.21%)

28

hwy_type_flag [integer]

mean (sd) : 0 (0.04)
min < med < max :
0 < 0 < 1
IQR (CV) : 0 (25.96)

2 distinct val.

147831 (100%)

0 (0%)

29

hwy_num_flag [integer]

mean (sd) : 0 (0.04)
min < med < max :
0 < 0 < 1
IQR (CV) : 0 (25.84)

2 distinct val.

147831 (100%)

0 (0%)

30

bypass_flag [integer]

mean (sd) : 0.04 (0.19)
min < med < max :
0 < 0 < 1
IQR (CV) : 0 (4.94)

2 distinct val.

147831 (100%)

0 (0%)

31

milepost_flag [integer]

mean (sd) : 2.8 (2.44)
min < med < max :
0 < 5 < 5
IQR (CV) : 5 (0.87)

3 distinct val.

147831 (100%)

0 (0%)

32

direction [character]

  1. 1
  2. 2
  3. C
  4. N
  5. E
  6. 3
  7. P
  8. 4
  9. A
  10. L
    [ 10 others ]

84850 (97.0%)
1790 ( 2.1%)
149 ( 0.2%)
111 ( 0.1%)
103 ( 0.1%)
93 ( 0.1%)
86 ( 0.1%)
72 ( 0.1%)
69 ( 0.1%)
54 ( 0.1%)
83 ( 0.1%)

87460 (59.16%)

60371 (40.84%)

33

section_oid [integer]

mean (sd) : 289416670.63 (279838654.09)
min < med < max :
1010000 < 254021077 < 864110461
IQR (CV) : 418330182 (0.97)

7396 distinct val.

86618 (58.59%)

61213 (41.41%)

34

type_acc [character]

  1. D
  2. A
  3. I
  4. E
  5. J
  6. K
  7. H
  8. C
  9. B
  10. G
    [ 1 others ]

112572 (76.1%)
17373 (11.8%)
4377 ( 3.0%)
3749 ( 2.5%)
3553 ( 2.4%)
2987 ( 2.0%)
1761 ( 1.2%)
753 ( 0.5%)
376 ( 0.2%)
262 ( 0.2%)
68 ( 0.1%)

147831 (100%)

0 (0%)

35

urban_area [integer]

mean (sd) : 2.85 (1.22)
min < med < max :
0 < 3 < 4
IQR (CV) : 2 (0.43)

5 distinct val.

88392 (59.79%)

59439 (40.21%)

36

intersection [integer]

mean (sd) : 0.36 (0.48)
min < med < max :
0 < 0 < 1
IQR (CV) : 1 (1.34)

2 distinct val.

147831 (100%)

0 (0%)

37

milepoint_from [numeric]

mean (sd) : 63.74 (84.85)
min < med < max :
0 < 18.81 < 428.96
IQR (CV) : 99.06 (1.33)

4418 distinct val.

86618 (58.59%)

61213 (41.41%)

38

milepoint_to [numeric]

mean (sd) : 65.55 (84.79)
min < med < max :
0.03 < 20.2 < 432.84
IQR (CV) : 98.86 (1.29)

4601 distinct val.

86618 (58.59%)

61213 (41.41%)

39

lrs_id [character]

  1. 450-90-2-010
  2. 450-90-1-010
  3. 451-01-1-010
  4. 450-10-2-010
  5. 007-90-2-010
  6. 450-15-2-010
  7. 283-08-2-010
  8. 004-01-1-010
  9. 450-15-1-010
  10. 007-90-1-010
    [ 3439 others ]

639 ( 1.1%)
587 ( 1.0%)
454 ( 0.8%)
428 ( 0.7%)
423 ( 0.7%)
407 ( 0.7%)
400 ( 0.7%)
396 ( 0.7%)
380 ( 0.7%)
351 ( 0.6%)
53451 (91.2%)

57916 (39.18%)

89915 (60.82%)

40

lrs_logmile [numeric]

mean (sd) : 5.22 (5.64)
min < med < max :
0 < 3.42 < 60.89
IQR (CV) : 6.07 (1.08)

2826 distinct val.

57916 (39.18%)

89915 (60.82%)

# Read the crash table with the same NA markers as the DOT table. HWY_BYPASS
# (column 124) holds non-numeric values such as "1138-2", so it is declared as
# character up front; otherwise fread guesses a narrower type from its sample
# and has to coerce mid-file, which can drop leading zeros.
dat2 <- fread(
  "2010CRASH_TB.csv",
  na.strings = c("NA", "", " ", "NaN"),
  colClasses = list(character = "HWY_BYPASS")
)
## Warning in fread("2010CRASH_TB.csv", na.strings = c("NA", "", " ", "NaN")):
## Bumped column 124 to type character on data row 1958, field contains
## '1138-2'. Coercing previously read values in this column from logical,
## integer or numeric back to character which may not be lossless; e.g., if
## '00' and '000' occurred before they will now be just '0', and there may
## be inconsistencies with treatment of ',,' and ',NA,' too (if they occurred
## in this column before the bump). If this matters please rerun and set
## 'colClasses' to 'character' for this column. Please note that column type
## detection uses a sample of 1,000 rows (100 rows at 10 points) so hopefully
## this message should be very rare. If reporting to datatable-help, please
## rerun and include the output from verbose=TRUE.

Read 94.7% of 147869 rows Read 147869 rows and 154 (of 154) columns from 0.092 GB file in 00:00:03

# Show the row and column counts of the crash table just read.
dim(dat2)

[1] 147869 154

# Column-by-column summary of dat2: grid style, no graph column.
dfSummary(
  dat2,
  style = "grid",
  plain.ascii = FALSE,
  graph.col = FALSE
)

Data Frame Summary

dat2
N: 147869

No Variable Stats / Values Freqs (% of Valid) Valid Missing

1

CRASH_NUM [character]

  1. `
  2. 0
  3. 0000004
  4. 0000012
  5. 0000013
  6. 0000015
  7. 0000016
  8. 0000021
  9. 0000029
  10. 0000031
    [ 147858 others ]

1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
147858 (0.0%)

147868 (100%)

1 (0%)

2

CRASH_NUM1 [character]

  1. LA10_
  2. LA10_ 4670557
  3. LA10_`
  4. LA10_0
  5. LA10_0000004
  6. LA10_0000012
  7. LA10_0000013
  8. LA10_0000015
  9. LA10_0000016
  10. LA10_0000021
    [ 147859 others ]

1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
1 (0.0%)
147859 (0.0%)

147869 (100%)

0 (0%)

3

ISDS_CODE [character]

  1. 0
  2. 1
  3. office
  4. 6480
  5. 4089
  6. `0
  7. 0 
  8. 3871
  9. o
  10. 1 
    [ 75 others ]

29554 (88.1%)
2842 ( 8.5%)
329 ( 1.0%)
99 ( 0.3%)
72 ( 0.2%)
41 ( 0.1%)
35 ( 0.1%)
32 ( 0.1%)
24 ( 0.1%)
19 ( 0.1%)
491 ( 1.4%)

33538 (22.68%)

114331 (77.32%)

4

CRASH_DATE [integer]

mean (sd) : 40359.83 (105.3)
min < med < max :
38310 < 40358 < 41600
IQR (CV) : 184 (0)

403 distinct val.

147869 (100%)

0 (0%)

5

CRASH_TIME [numeric]

mean (sd) : 367.54 (3.03)
min < med < max :
0.05 < 367.59 < 368
IQR (CV) : 0.31 (0.01)

1450 distinct val.

147869 (100%)

0 (0%)

6

CR_MONTH [integer]

mean (sd) : 6.5 (3.43)
min < med < max :
1 < 6 < 12
IQR (CV) : 7 (0.53)

12 distinct val.

147869 (100%)

0 (0%)

7

CR_HOUR [integer]

mean (sd) : 14.22 (5.32)
min < med < max :
1 < 15 < 24
IQR (CV) : 7 (0.37)

24 distinct val.

147869 (100%)

0 (0%)

8

LAT [numeric]

mean (sd) : 18.8 (15.56)
min < med < max :
0 < 29.98 < 98.65
IQR (CV) : 30.41 (0.83)

64838 distinct val.

147869 (100%)

0 (0%)

9

LONG [numeric]

mean (sd) : 55.31 (44.55)
min < med < max :
0 < 90.19 < 99.34
IQR (CV) : 91.2 (0.81)

66165 distinct val.

147869 (100%)

0 (0%)

10

ACCESS_CNTL_CD [character]

  1. A
  2. B
  3. C
  4. Y
  5. Z

120461 (81.7%)
10697 ( 7.2%)
15456 (10.5%)
317 ( 0.2%)
518 ( 0.4%)

147449 (99.72%)

420 (0.28%)

11

ALCOHOL [logical]

141322 (95.6%)
6547 ( 4.4%)

147869 (100%)

0 (0%)

12

ALIGNMENT_CD [character]

  1. A
  2. C
  3. B
  4. E
  5. D
  6. F
  7. G
  8. Z
  9. H
  10. I
    [ 2 others ]

125978 (85.3%)
10263 ( 7.0%)
4175 ( 2.8%)
2664 ( 1.8%)
1361 ( 0.9%)
1197 ( 0.8%)
1171 ( 0.8%)
265 ( 0.2%)
225 ( 0.1%)
182 ( 0.1%)
197 ( 0.1%)

147678 (99.87%)

191 (0.13%)

13

AMBULANCE [logical]

117366 (79.4%)
30503 (20.6%)

147869 (100%)

0 (0%)

14

AMB_SERVICE [character]

  1. ACADIAN AMBULANCE
  2. ACADIAN
  3. ACADIAN AMBULANCE SERVICE
  4. AMR
  5. NONE
  6. N/A
  7. NOT NEEDED
  8. MED EXPRESS
  9. EMS
  10. SFD
    [ 5597 others ]

6705 (22.3%)
3612 (12.0%)
879 ( 2.9%)
778 ( 2.6%)
616 ( 2.1%)
397 ( 1.3%)
395 ( 1.3%)
286 ( 0.9%)
283 ( 0.9%)
262 ( 0.9%)
15812 (40.5%)

30025 (20.31%)

117844 (79.69%)

15

BYPASS_CD [character]

  1. B
  2. W
  3. E
  4. 0
  5. S
  6. 2
  7. N
  8. 3
  9. 1
  10. 6
    [ 32 others ]

2308 (33.4%)
980 (14.2%)
748 (10.8%)
639 ( 9.3%)
480 ( 7.0%)
380 ( 5.5%)
342 ( 5.0%)
241 ( 3.5%)
213 ( 3.1%)
134 ( 1.9%)
437 ( 6.3%)

6902 (4.67%)

140967 (95.33%)

16

CITY_CD [integer]

mean (sd) : 2.62 (4.47)
min < med < max :
0 < 1 < 55
IQR (CV) : 3 (1.71)

28 distinct val.

147869 (100%)

0 (0%)

17

PRI_CONTRIB_FAC_CD [character]

  1. A
  2. B
  3. D
  4. G
  5. E
  6. C
  7. F
  8. I
  9. K
  10. M
    [ 3 others ]

111589 (75.8%)
20666 (14.0%)
8157 ( 5.5%)
2186 ( 1.5%)
1556 ( 1.1%)
761 ( 0.5%)
533 ( 0.4%)
515 ( 0.4%)
513 ( 0.4%)
484 ( 0.3%)
360 ( 0.2%)

147320 (99.63%)

549 (0.37%)

18

SEC_CONTRIB_FAC_CD [character]

  1. B
  2. A
  3. D
  4. K
  5. I
  6. C
  7. G
  8. E
  9. F
  10. H
    [ 3 others ]

95330 (72.8%)
20619 (15.8%)
7898 ( 6.0%)
1408 ( 1.1%)
1074 ( 0.8%)
1061 ( 0.8%)
880 ( 0.7%)
855 ( 0.7%)
824 ( 0.6%)
444 ( 0.3%)
525 ( 0.4%)

130918 (88.54%)

16951 (11.46%)

19

DAY_OF_WK [character]

  1. FR
  2. MO
  3. SA
  4. SU
  5. TH
  6. TU
  7. WE

25981 (17.6%)
21787 (14.7%)
19070 (12.9%)
14488 ( 9.8%)
22543 (15.2%)
22024 (14.9%)
21976 (14.9%)

147869 (100%)

0 (0%)

20

DIST_ZONE [character]

  1. 2
  2. 1
  3. 3
  4. 4
  5. 003
  6. 12
  7. 002
  8. 5
  9. 06
  10. 05
    [ 4308 others ]

2907 ( 3.0%)
2602 ( 2.7%)
2530 ( 2.6%)
2411 ( 2.5%)
1799 ( 1.8%)
1749 ( 1.8%)
1674 ( 1.7%)
1386 ( 1.4%)
1349 ( 1.4%)
1309 ( 1.3%)
77691 (76.8%)

97407 (65.87%)

50462 (34.13%)

21

PUB_PROP_DAM [logical]

142923 (96.7%)
4946 ( 3.3%)

147869 (100%)

0 (0%)

22

RR_TRAIN_INV [logical]

147762 (99.9%)
107 ( 0.1%)

147869 (100%)

0 (0%)

23

HIT_AND_RUN [logical]

131116 (88.7%)
16753 (11.3%)

147869 (100%)

0 (0%)

24

DRUGS [logical]

146094 (98.8%)
1775 ( 1.2%)

147869 (100%)

0 (0%)

25

FIRE_DEPT [character]

  1. NONE
  2. N/A
  3. NOT NEEDED
  4. SFD
  5. PINEVILLE FIRE DEPARTMENT
  6. LAFAYETTE FIRE DEPARTMENT
  7. HAMMOND FIRE
  8. NATCHITOCHES FIRE DEPARTM
  9. MONROE FD
  10. AFD
    [ 4496 others ]

637 ( 5.0%)
434 ( 3.4%)
399 ( 3.1%)
174 ( 1.4%)
136 ( 1.1%)
91 ( 0.7%)
79 ( 0.6%)
76 ( 0.6%)
66 ( 0.5%)
65 ( 0.5%)
10564 (91.5%)

12721 (8.6%)

135148 (91.4%)

26

INTER_ROAD [character]

  1. I-10
  2. I-12
  3. US 90
  4. US 190
  5. LA 182
  6. LA 1
  7. US 61
  8. LA 3246
  9. LA 42
  10. VETERANS BLVD
    [ 41258 others ]

973 ( 0.7%)
703 ( 0.5%)
464 ( 0.3%)
455 ( 0.3%)
431 ( 0.3%)
426 ( 0.3%)
408 ( 0.3%)
378 ( 0.3%)
351 ( 0.2%)
297 ( 0.2%)
134518 (59.9%)

139404 (94.28%)

8465 (5.72%)

27

INVEST_AGENCY_CD [character]

  1. A
  2. B
  3. C
  4. Z

34271 (23.2%)
84630 (57.3%)
26767 (18.1%)
2102 ( 1.4%)

147770 (99.93%)

99 (0.07%)

28

INVEST_COMP [logical]

12180 ( 8.2%)
135689 (91.8%)

147869 (100%)

0 (0%)

29

INVEST_OFFICER [character]

  1. BURGE, KARL
  2. ONEZIME, MICHAEL
  3. LEICHLITER, CHERYL
  4. MARTIN, JACK
  5. KUNAK, JARED
  6. TISDALE, MICHAEL
  7. ,
  8. JAMES, DEPUTY JOHN
  9. IDOM, FLETCHER
  10. BRUJIC, DEPUTY ZLATKO
    [ 19031 others ]

358 ( 0.2%)
358 ( 0.2%)
342 ( 0.2%)
336 ( 0.2%)
317 ( 0.2%)
317 ( 0.2%)
308 ( 0.2%)
258 ( 0.2%)
255 ( 0.2%)
252 ( 0.2%)
141490 (81.5%)

144591 (97.78%)

3278 (2.22%)

30

LIGHTING_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. F
  7. Y
  8. Z

106781 (72.6%)
12218 ( 8.3%)
20282 (13.8%)
3601 ( 2.5%)
2075 ( 1.4%)
1292 ( 0.9%)
767 ( 0.5%)
144 ( 0.1%)

147160 (99.52%)

709 (0.48%)

31

LOC_TYPE_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. F
  7. G
  8. Z

3577 ( 2.4%)
49960 (33.9%)
41254 (28.0%)
23016 (15.6%)
11605 ( 7.9%)
1122 ( 0.8%)
12930 ( 8.8%)
4091 ( 2.8%)

147555 (99.79%)

314 (0.21%)

32

MAN_COLL_CD [character]

  1. B
  2. A
  3. D
  4. Z
  5. J
  6. F
  7. E
  8. K
  9. G
  10. H
    [ 8 others ]

50541 (35.0%)
21889 (15.2%)
20036 (13.9%)
16385 (11.3%)
15837 (11.0%)
5193 ( 3.6%)
2965 ( 2.1%)
2954 ( 2.1%)
2853 ( 2.0%)
2126 ( 1.5%)
3547 ( 2.4%)

144326 (97.6%)

3543 (2.4%)

33

MILEPOST [numeric]

mean (sd) : 44.92 (1321.71)
min < med < max :
-36.8 < 0 < 394338
IQR (CV) : 12.41 (29.42)

7494 distinct val.

147868 (100%)

1 (0%)

34

NUM_DRI_IK [integer]

mean (sd) : 0.31 (0.57)
min < med < max :
0 < 0 < 6
IQR (CV) : 1 (1.87)

7 distinct val.

147869 (100%)

0 (0%)

35

NUM_DRI_INJ [integer]

mean (sd) : 0.3 (0.57)
min < med < max :
0 < 0 < 6
IQR (CV) : 1 (1.88)

7 distinct val.

147869 (100%)

0 (0%)

36

NUM_DRI_KIL [integer]

mean (sd) : 0 (0.06)
min < med < max :
0 < 0 < 3
IQR (CV) : 0 (18.22)

4 distinct val.

147869 (100%)

0 (0%)

37

NUM_OCC_IK [integer]

mean (sd) : 0.15 (0.63)
min < med < max :
0 < 0 < 40
IQR (CV) : 0 (4.08)

27 distinct val.

147869 (100%)

0 (0%)

38

NUM_OCC_INJ [integer]

mean (sd) : 0.15 (0.63)
min < med < max :
0 < 0 < 40
IQR (CV) : 0 (4.09)

27 distinct val.

147869 (100%)

0 (0%)

39

NUM_OCC_KIL [integer]

mean (sd) : 0 (0.04)
min < med < max :
0 < 0 < 3
IQR (CV) : 0 (32.99)

4 distinct val.

147869 (100%)

0 (0%)

40

NUM_PED_IK [integer]

mean (sd) : 0.01 (0.1)
min < med < max :
0 < 0 < 8
IQR (CV) : 0 (12.16)

7 distinct val.

147869 (100%)

0 (0%)

41

NUM_PED_INJ [integer]

mean (sd) : 0.01 (0.1)
min < med < max :
0 < 0 < 8
IQR (CV) : 0 (12.58)

7 distinct val.

147869 (100%)

0 (0%)

42

NUM_PED_KIL [integer]

mean (sd) : 0 (0.02)
min < med < max :
0 < 0 < 1
IQR (CV) : 0 (43.81)

2 distinct val.

147869 (100%)

0 (0%)

43

NUM_TOT_IK [integer]

mean (sd) : 0.47 (0.98)
min < med < max :
0 < 0 < 41
IQR (CV) : 1 (2.09)

30 distinct val.

147869 (100%)

0 (0%)

44

NUM_TOT_INJ [integer]

mean (sd) : 0.46 (0.97)
min < med < max :
0 < 0 < 41
IQR (CV) : 1 (2.1)

30 distinct val.

147869 (100%)

0 (0%)

45

NUM_TOT_KIL [integer]

mean (sd) : 0 (0.08)
min < med < max :
0 < 0 < 4
IQR (CV) : 0 (16.22)

5 distinct val.

147869 (100%)

0 (0%)

46

NUM_VEH [integer]

mean (sd) : 1.89 (0.53)
min < med < max :
0 < 2 < 16
IQR (CV) : 0 (0.28)

11 distinct val.

147869 (100%)

0 (0%)

47

PARISH_CD [integer]

mean (sd) : 28.91 (15.55)
min < med < max :
0 < 28 < 64
IQR (CV) : 20 (0.54)

65 distinct val.

147869 (100%)

0 (0%)

48

PRI_HWY_NUM [integer]

mean (sd) : 251.95 (696.56)
min < med < max :
0 < 12 < 9999
IQR (CV) : 104 (2.76)

1007 distinct val.

147848 (99.99%)

21 (0.01%)

49

PRI_ROAD_DIR [character]

  1. E
  2. N
  3. NE
  4. NW
  5. S
  6. SE
  7. SW
  8. W

5944 (24.4%)
6041 (24.8%)
272 ( 1.1%)
228 ( 0.9%)
4979 (20.4%)
138 ( 0.6%)
291 ( 1.2%)
6449 (26.5%)

24342 (16.46%)

123527 (83.54%)

50

PRI_ROAD_NUM [numeric]

mean (sd) : 841.02 (2602.6)
min < med < max :
0 < 0 < 104000
IQR (CV) : 0 (3.09)

3525 distinct val.

147726 (99.9%)

143 (0.1%)

51

PRI_ROAD_NAME [character]

  1. I-10
  2. AIRLINE
  3. VETERANS
  4. MAIN
  5. FLORIDA
  6. AMBASSADOR CAFFERY
  7. JOHNSTON
  8. I-20
  9. CLAIBORNE
  10. I-12
    [ 20178 others ]

2337 ( 1.7%)
1725 ( 1.2%)
1117 ( 0.8%)
1086 ( 0.8%)
946 ( 0.7%)
905 ( 0.6%)
864 ( 0.6%)
828 ( 0.6%)
825 ( 0.6%)
817 ( 0.6%)
129096 (72.0%)

140546 (95.05%)

7323 (4.95%)

52

PRI_ROAD_TYPE [character]

  1. ST
  2. RD
  3. STREET
  4. DR
  5. AVE
  6. BLVD
  7. AVENUE
  8. ROAD
  9. DRIVE
  10. BOULEVARD
    [ 197 others ]

13587 (17.4%)
10203 (13.1%)
8445 (10.8%)
6251 ( 8.0%)
6042 ( 7.8%)
4971 ( 6.4%)
4898 ( 6.3%)
3616 ( 4.6%)
3089 ( 4.0%)
2488 ( 3.2%)
14342 (18.2%)

77932 (52.7%)

69937 (47.3%)

53

PRI_DIST [numeric]

mean (sd) : 57.98 (2658.1)
min < med < max :
-2.3 < 0.5 < 999999
IQR (CV) : 30 (45.85)

1500 distinct val.

145701 (98.53%)

2168 (1.47%)

54

PRI_DIR [character]

  1. 0
  2. 1
  3. 2
  4. 4
  5. C
  6. E
  7. M
  8. N
  9. S
  10. W

20 ( 0.0%)
1 ( 0.0%)
2 ( 0.0%)
1 ( 0.0%)
2 ( 0.0%)
24058 (25.4%)
1 ( 0.0%)
22585 (23.9%)
23721 (25.1%)
24215 (25.6%)

94606 (63.98%)

53263 (36.02%)

55

REPORT_NUM [character]

  1. EBRSO
  2. STATEMENTS
  3. NOPD
  4. N.O.P.D.
  5. STATEMENT
  6. ATTACHMENTS
  7. JEFFERSON P.S.O.
  8. 760
  9. ATTACHMENT
  10. LA0500100
    [ 70232 others ]

1870 (2.4%)
1369 (1.7%)
1249 (1.6%)
634 (0.8%)
427 (0.5%)
314 (0.4%)
173 (0.2%)
145 (0.2%)
138 (0.2%)
83 (0.1%)
72292 (2.2%)

78694 (53.22%)

69175 (46.78%)

56

RESCUE_UNIT [logical]

137252 (92.8%)
10617 ( 7.2%)

147869 (100%)

0 (0%)

57

ROAD_COND_CD [character]

  1. A
  2. G
  3. L
  4. K
  5. Z
  6. B
  7. M
  8. E
  9. F
  10. C
    [ 5 others ]

140027 (94.8%)
1684 ( 1.1%)
1544 ( 1.1%)
1515 ( 1.0%)
562 ( 0.4%)
544 ( 0.4%)
478 ( 0.3%)
376 ( 0.2%)
338 ( 0.2%)
219 ( 0.1%)
378 ( 0.2%)

147665 (99.86%)

204 (0.14%)

58

ROAD_REL_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. F
  7. G
  8. Y
  9. Z

125560 (85.0%)
4149 ( 2.8%)
806 ( 0.5%)
5638 ( 3.8%)
9251 ( 6.3%)
585 ( 0.4%)
114 ( 0.1%)
227 ( 0.1%)
1337 ( 0.9%)

147667 (99.86%)

202 (0.14%)

59

ROAD_TYPE_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. Y
  6. Z

14849 (10.1%)
85651 (58.0%)
38722 (26.2%)
6769 ( 4.6%)
114 ( 0.1%)
1545 ( 1.1%)

147650 (99.85%)

219 (0.15%)

60

RPT_ORIGIN [character]

  1. IN
  2. LSU
  3. SHREVEPORTPD
  4. BATONROUGEPD
  5. LAFAYETTEPD
  6. BR
  7. JEFFERSONPSO
  8. LAKECHARLESPD
  9. KENNERPD
  10. EBRPSO
    [ 151 others ]

34034 (23.0%)
33572 (22.7%)
9202 ( 6.2%)
7727 ( 5.2%)
7365 ( 5.0%)
5778 ( 3.9%)
3996 ( 2.7%)
3423 ( 2.3%)
2086 ( 1.4%)
1964 ( 1.3%)
38722 (26.1%)

147869 (100%)

0 (0%)

61

SEC_DIST [numeric]

mean (sd) : 11 (139.73)
min < med < max :
-2.34 < 0 < 10000
IQR (CV) : 0 (12.7)

1069 distinct val.

142226 (96.18%)

5643 (3.82%)

62

SEC_DIR [character]

  1. 0
  2. E
  3. N
  4. S
  5. W

1 ( 0.0%)
5798 (24.2%)
5860 (24.5%)
6023 (25.2%)
6240 (26.1%)

23922 (16.18%)

123947 (83.82%)

63

SEC_INTERSECTION [logical]

145954 (98.7%)
1915 ( 1.3%)

147869 (100%)

0 (0%)

64

SEC_INTERSECTION_NOT [logical]

100657 (68.1%)
47212 (31.9%)

147869 (100%)

0 (0%)

65

INTERSECTION [logical]

94758 (64.1%)
53111 (35.9%)

147869 (100%)

0 (0%)

66

INTERSECTION_NOT [logical]

60411 (40.8%)
87458 (59.2%)

147869 (100%)

0 (0%)

67

SEC_INTER_ROAD [character]

  1. I-10
  2. I-610
  3. I-20
  4. HWY 14
  5. LA 45
  6. HWY 182
  7. LA 49
  8. I-12
  9. US 90B
  10. US 90
    [ 9516 others ]

352 ( 1.3%)
277 ( 1.1%)
248 ( 0.9%)
243 ( 0.9%)
223 ( 0.9%)
189 ( 0.7%)
177 ( 0.7%)
174 ( 0.7%)
153 ( 0.6%)
151 ( 0.6%)
24101 (68.2%)

26288 (17.78%)

121581 (82.22%)

68

SEVERITY_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E

636 ( 0.4%)
1228 ( 0.8%)
9082 ( 6.1%)
32048 (21.7%)
104875 (70.9%)

147869 (100%)

0 (0%)

69

SURF_COND_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. Y
  7. Z

126463 (85.6%)
20207 (13.7%)
188 ( 0.1%)
236 ( 0.2%)
123 ( 0.1%)
493 ( 0.3%)
24 ( 0.0%)

147734 (99.91%)

135 (0.09%)

70

SURF_TYPE_CD [character]

  1. B
  2. A
  3. D
  4. Z
  5. C
  6. E
  7. Y
  8. I
  9. F
  10. G
    [ 5 others ]

88378 (61.4%)
54125 (37.6%)
663 ( 0.5%)
186 ( 0.1%)
180 ( 0.1%)
133 ( 0.1%)
126 ( 0.1%)
26 ( 0.0%)
24 ( 0.0%)
11 ( 0.0%)
23 ( 0.0%)

143875 (97.3%)

3994 (2.7%)

71

TIME_AMB_ARR [numeric]

mean (sd) : 367.09 (2.71)
min < med < max :
0.05 < 367 < 368
IQR (CV) : 0 (0.01)

1448 distinct val.

147867 (100%)

2 (0%)

72

TIME_AMB_ARR_HOSP [numeric]

mean (sd) : 367.06 (2.14)
min < med < max :
0.07 < 367 < 368
IQR (CV) : 0 (0.01)

1444 distinct val.

147864 (100%)

5 (0%)

73

TIME_AMB_CALLED [numeric]

mean (sd) : 367.09 (2.87)
min < med < max :
0.05 < 367 < 368
IQR (CV) : 0 (0.01)

1449 distinct val.

147868 (100%)

1 (0%)

74

TIME_AMB_DEPART [numeric]

mean (sd) : 367.09 (2.71)
min < med < max :
0.06 < 367 < 368
IQR (CV) : 0 (0.01)

1447 distinct val.

147867 (100%)

2 (0%)

75

TIME_RESCUE_CALLED [numeric]

mean (sd) : 367.03 (2.14)
min < med < max :
0.41 < 367 < 368
IQR (CV) : 0 (0.01)

1424 distinct val.

147864 (100%)

5 (0%)

76

TIME_RESCUE_ARR [numeric]

mean (sd) : 367.03 (1.91)
min < med < max :
0.41 < 367 < 368
IQR (CV) : 0 (0.01)

1429 distinct val.

147863 (100%)

6 (0%)

77

TIME_LANES_OPEN [numeric]

mean (sd) : 367.53 (3.03)
min < med < max :
0.04 < 367.59 < 368
IQR (CV) : 0.34 (0.01)

1450 distinct val.

147869 (100%)

0 (0%)

78

TIME_POLICE_NOTE [numeric]

mean (sd) : 367.54 (3.03)
min < med < max :
0.06 < 367.6 < 368
IQR (CV) : 0.31 (0.01)

1450 distinct val.

147869 (100%)

0 (0%)

79

TIME_POLICE_ARR [numeric]

mean (sd) : 367.55 (3.03)
min < med < max :
0.09 < 367.6 < 368
IQR (CV) : 0.31 (0.01)

1450 distinct val.

147869 (100%)

0 (0%)

80

TRK_BUS_INV [logical]

143096 (96.8%)
4773 ( 3.2%)

147869 (100%)

0 (0%)

81

TROOP [character]

  1. B
  2. A
  3. I
  4. L
  5. E
  6. G
  7. C
  8. F
  9. D
  10. Q
    [ 3 others ]

10455 (20.8%)
8522 (17.0%)
6766 (13.5%)
5384 (10.7%)
4594 ( 9.1%)
4539 ( 9.0%)
4138 ( 8.2%)
3705 ( 7.4%)
2134 ( 4.2%)
2 ( 0.0%)
3 ( 0.0%)

50242 (33.98%)

97627 (66.02%)

82

WEATHER_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. F
  7. G
  8. H
  9. Y
  10. Z

108915 (73.7%)
22688 (15.4%)
14407 ( 9.8%)
568 ( 0.4%)
113 ( 0.1%)
245 ( 0.2%)
37 ( 0.0%)
12 ( 0.0%)
650 ( 0.4%)
70 ( 0.1%)

147705 (99.89%)

164 (0.11%)

83

CODE [integer]

mean (sd) : 2892.64 (1554.51)
min < med < max :
0 < 2804 < 6405
IQR (CV) : 1999 (0.54)

315 distinct val.

147869 (100%)

0 (0%)

84

EST_ALCOHOL [integer]

mean (sd) : 0.06 (0.24)
min < med < max :
0 < 0 < 3
IQR (CV) : 0 (4.2)

3 distinct val.

147869 (100%)

0 (0%)

85

WHO_ENTERED [character]

  1. entry
  2. aclark1
  3. jlebl61
  4. bcrist1
  5. sregne1
  6. barbaradavis
  7. bstrin2
  8. cdougl6
  9. kforbe1
  10. asanso1
    [ 4597 others ]

9202 ( 6.6%)
6761 ( 4.9%)
4129 ( 3.0%)
4073 ( 2.9%)
2504 ( 1.8%)
2467 ( 1.8%)
2113 ( 1.5%)
1397 ( 1.0%)
1333 ( 1.0%)
1108 ( 0.8%)
103798 (72.7%)

138885 (93.92%)

8984 (6.08%)

86

DATE_CHANGED [numeric]

mean (sd) : 40405.49 (299.53)
min < med < max :
367 < 40414 < 43842
IQR (CV) : 190 (0.01)

487 distinct val.

147869 (100%)

0 (0%)

87

PROCESS_DATE [integer]

mean (sd) : 40061.16 (3816.58)
min < med < max :
367 < 40363 < 369202
IQR (CV) : 178 (0.1)

708 distinct val.

147869 (100%)

0 (0%)

88

CITY [character]

  1. NEW ORLEANS
  2. BATON ROUGE
  3. SHREVEPORT
  4. LAFAYETTE
  5. RURAL
  6. LAKE CHARLES
  7. BOSSIER CITY
  8. MONROE
  9. KENNER
  10. HOUMA
    [ 543 others ]

16315 (16.8%)
14567 (15.0%)
9216 ( 9.5%)
7382 ( 7.6%)
4695 ( 4.9%)
3557 ( 3.7%)
3091 ( 3.2%)
2494 ( 2.6%)
2089 ( 2.2%)
1546 ( 1.6%)
31905 (32.6%)

96857 (65.5%)

51012 (34.5%)

89

CONST_MAINT_ZN [logical]

146012 (98.7%)
1857 ( 1.3%)

147869 (100%)

0 (0%)

90

FATALITY [logical]

147213 (99.6%)
656 ( 0.4%)

147869 (100%)

0 (0%)

91

HWY_TYPE_CD [character]

  1. A
  2. B
  3. C
  4. D
  5. E
  6. G

15039 (10.3%)
23846 (16.3%)
48386 (33.1%)
17993 (12.3%)
40960 (28.0%)
161 ( 0.1%)

146385 (99%)

1484 (1%)

92

INJURY [logical]

120323 (81.4%)
27546 (18.6%)

147869 (100%)

0 (0%)

93

INTER_ROAD_DIR [character]

  1. E
  2. N
  3. NE
  4. NW
  5. S
  6. SE
  7. SW
  8. W

4425 (25.3%)
4710 (26.9%)
102 ( 0.6%)
119 ( 0.7%)
3919 (22.4%)
53 ( 0.3%)
111 ( 0.6%)
4075 (23.3%)

17514 (11.84%)

130355 (88.16%)

94

INTER_ROAD_NAME [character]

  1. I-10
  2. I-12
  3. AIRLINE
  4. VETERANS
  5. US 90
  6. MAIN
  7. US 190
  8. LA 1
  9. LA 182
  10. CANAL
    [ 25857 others ]

1159 ( 0.8%)
821 ( 0.6%)
586 ( 0.4%)
514 ( 0.4%)
496 ( 0.3%)
494 ( 0.3%)
479 ( 0.3%)
470 ( 0.3%)
451 ( 0.3%)
439 ( 0.3%)
138959 (71.9%)

144868 (97.97%)

3001 (2.03%)

95

INTER_ROAD_NUM [numeric]

mean (sd) : 232.87 (1207.18)
min < med < max :
-49 < 0 < 111000
IQR (CV) : 0 (5.18)

961 distinct val.

142279 (96.22%)

5590 (3.78%)

96

INTER_ROAD_TYPE [character]

  1. ST
  2. STREET
  3. RD
  4. DR
  5. AVE
  6. AVENUE
  7. BLVD
  8. DRIVE
  9. ROAD
  10. HWY
    [ 209 others ]

15650 (20.8%)
10315 (13.7%)
8968 (11.9%)
7752 (10.3%)
6191 ( 8.2%)
3769 ( 5.0%)
3537 ( 4.7%)
2862 ( 3.8%)
2730 ( 3.6%)
1976 ( 2.6%)
11298 (14.9%)

75048 (50.75%)

72821 (49.25%)

97

INVEST_AGENCY_NAME [character]

  1. LADPS
  2. NEW ORLEANS PD
  3. BATON ROUGE POLICE
  4. LAFAYETTE CITY POLICE
  5. SPD
  6. city
  7. JEFFERSON PARISH SHERIFF’
  8. LAKE CHARLES PD
  9. NOPD
  10. SHREVEPORT POLICE DEPT
    [ 1486 others ]

34030 (23.0%)
9036 ( 6.1%)
7742 ( 5.2%)
7363 ( 5.0%)
6610 ( 4.5%)
5697 ( 3.9%)
4269 ( 2.9%)
3507 ( 2.4%)
2684 ( 1.8%)
2491 ( 1.7%)
64373 (42.3%)

147802 (99.95%)

67 (0.05%)

98

INVEST_OFFICER_BADGENUM [character]

  1. 102630
  2. 225
  3. 474
  4. 2512
  5. 102333
  6. 96367
  7. 106928
  8. 13233
  9. 27097
  10. 113071
    [ 6240 others ]

424 ( 0.3%)
400 ( 0.3%)
381 ( 0.3%)
366 ( 0.2%)
347 ( 0.2%)
334 ( 0.2%)
326 ( 0.2%)
316 ( 0.2%)
304 ( 0.2%)
302 ( 0.2%)
142078 (94.3%)

145578 (98.45%)

2291 (1.55%)

99

PARISH [character]

  1. EBR
  2. ORLNS
  3. JEFF
  4. CADDO
  5. LAFYT
  6. CALC
  7. STTAM
  8. OUACH
  9. RAPDS
  10. BOSS
    [ 55 others ]

20336 (13.8%)
16451 (11.1%)
15471 (10.5%)
10316 ( 7.0%)
9982 ( 6.8%)
6267 ( 4.2%)
5823 ( 3.9%)
5183 ( 3.5%)
4344 ( 2.9%)
4035 ( 2.7%)
49661 (33.6%)

147869 (100%)

0 (0%)

100

PEDESTRIAN [logical]

146942 (99.4%)
927 ( 0.6%)

147869 (100%)

0 (0%)

101

PHOTOS_MADE [logical]

128838 (87.1%)
19031 (12.9%)

147869 (100%)

0 (0%)

102

PRI_ROAD [character]

  1. I-10
  2. I-20
  3. LA 1
  4. VETERANS BLVD
  5. I-12
  6. AIRLINE DRIVE
  7. INTERSTATE 10
  8. MAIN ST
  9. Interstate 10
  10. US 90
    [ 40164 others ]

1348 ( 1.0%)
761 ( 0.6%)
694 ( 0.5%)
632 ( 0.5%)
535 ( 0.4%)
525 ( 0.4%)
519 ( 0.4%)
441 ( 0.3%)
433 ( 0.3%)
413 ( 0.3%)
128623 (58.7%)

134924 (91.25%)

12945 (8.75%)

103

QUADRANT_NE [logical]

147385 (99.7%)
484 ( 0.3%)

147869 (100%)

0 (0%)

104

QUADRANT_NW [logical]

147250 (99.6%)
619 ( 0.4%)

147869 (100%)

0 (0%)

105

QUADRANT_SE [logical]

147430 (99.7%)
439 ( 0.3%)

147869 (100%)

0 (0%)

106

QUADRANT_SW [logical]

147378 (99.7%)
491 ( 0.3%)

147869 (100%)

0 (0%)

107

REPORT_NUM_2 [character]

  1. NOPD
  2. N.O.P.D.
  3. MONROE PD
  4. LA0510000
  5. CADDO SO
  6. MONROE CITY P.D.
  7. 760
  8. MONROE
  9. LA0500100
  10. BOSSIER CITY P.D.
    [ 79923 others ]

1250 (1.5%)
621 (0.7%)
271 (0.3%)
249 (0.3%)
154 (0.2%)
141 (0.2%)
105 (0.1%)
88 (0.1%)
75 (0.1%)
57 (0.1%)
82541 (0.8%)

85552 (57.86%)

62317 (42.14%)

108

SEC_INTER_ROAD_DIR [character]

  1. E
  2. N
  3. NE
  4. NW
  5. S
  6. SE
  7. SW
  8. W

1004 (33.8%)
617 (20.7%)
18 ( 0.6%)
23 ( 0.8%)
538 (18.1%)
15 ( 0.5%)
29 ( 1.0%)
731 (24.6%)

2975 (2.01%)

144894 (97.99%)

109

SEC_INTER_ROAD_NAME [character]

  1. I-10
  2. MAIN
  3. HWY 14
  4. HWY 182
  5. WILLIAMS
  6. I-20
  7. HWY 674
  8. AMBASSADOR CAFFERY
  9. JOHNSTON
  10. INTERSTATE
    [ 5012 others ]

407 ( 2.1%)
284 ( 1.5%)
260 ( 1.3%)
260 ( 1.3%)
253 ( 1.3%)
246 ( 1.3%)
192 ( 1.0%)
177 ( 0.9%)
172 ( 0.9%)
148 ( 0.8%)
17068 (105.3%)

19467 (13.17%)

128402 (86.83%)

110

SEC_INTER_ROAD_NUM [numeric]

mean (sd) : 31.01 (363.09)
min < med < max :
0 < 0 < 42000
IQR (CV) : 0 (11.71)

443 distinct val.

142167 (96.14%)

5702 (3.86%)

111

SEC_INTER_ROAD_TYPE [character]

  1. ST
  2. RD
  3. HIGHWAY
  4. HWY
  5. STREET
  6. DR
  7. AVE
  8. BLVD
  9. ROAD
  10. DRIVE
    [ 81 others ]

2147 (19.2%)
1858 (16.6%)
937 ( 8.4%)
865 ( 7.7%)
854 ( 7.6%)
835 ( 7.5%)
746 ( 6.7%)
659 ( 5.9%)
437 ( 3.9%)
254 ( 2.3%)
1585 (14.2%)

11177 (7.56%)

136692 (92.44%)

112

SERVICE_ROAD_N [logical]

147500 (99.8%)
369 ( 0.2%)

147869 (100%)

0 (0%)

113

SERVICE_ROAD_S [logical]

147496 (99.8%)
373 ( 0.2%)

147869 (100%)

0 (0%)

114

SERVICE_ROAD_E [logical]

147717 (99.9%)
152 ( 0.1%)

147869 (100%)

0 (0%)

115

SERVICE_ROAD_W [logical]

147730 (99.9%)
139 ( 0.1%)

147869 (100%)

0 (0%)

116

SERVICE_ROAD [logical]

All NA’s

0 (0%)

147869 (100%)

117

PRI_MEASUREMENT_MILES [logical]

104686 (70.8%)
43183 (29.2%)

147869 (100%)

0 (0%)

118

PRI_MEASUREMENT_FEET [logical]

94718 (64.1%)
53151 (35.9%)

147869 (100%)

0 (0%)

119

SEC_MEASUREMENT_FEET [logical]

143858 (97.3%)
4011 ( 2.7%)

147869 (100%)

0 (0%)

120

SEC_MEASUREMENT_MILES [logical]

127553 (86.3%)
20316 (13.7%)

147869 (100%)

0 (0%)

121

DATE_ENTERED [numeric]

mean (sd) : 40327.63 (1662.23)
min < med < max :
367 < 40399 < 40848
IQR (CV) : 179 (0.04)

492 distinct val.

147869 (100%)

0 (0%)

122

DISTRICT [integer]

mean (sd) : 20.76 (26.41)
min < med < max :
2 < 4 < 62
IQR (CV) : 59 (1.27)

2 : 41608 (28.1%)
3 : 21431 (14.5%)
4 : 16786 (11.3%)
5 : 7841 ( 5.3%)
7 : 8205 ( 5.5%)
8 : 8042 ( 5.4%)
58 : 828 ( 0.6%)
61 : 27570 (18.6%)
62 : 15542 (10.5%)

147853 (99.99%)

16 (0.01%)

123

CRASH_YEAR [integer]

mean (sd) : 2010 (0.03)
min < med < max :
2004 < 2010 < 2013
IQR (CV) : 0 (0)

2004 : 1 ( 0.0%)
2007 : 2 ( 0.0%)
2008 : 12 ( 0.0%)
2009 : 13 ( 0.0%)
2010 : 147831 (100.0%)
2011 : 8 ( 0.0%)
2012 : 1 ( 0.0%)
2013 : 1 ( 0.0%)

147869 (100%)

0 (0%)

124

HWY_BYPASS [character]

  1. 182
  2. 674
  3. 90
  4. 14
  5. 10
  6. 675
  7. 1
  8. 57
  9. 3040
  10. 84
    [ 208 others ]

230 (10.7%)
212 ( 9.9%)
194 ( 9.0%)
110 ( 5.1%)
66 ( 3.1%)
56 ( 2.6%)
42 ( 2.0%)
42 ( 2.0%)
41 ( 1.9%)
40 ( 1.9%)
1113 (52.1%)

2146 (1.45%)

145723 (98.55%)

125

STATE_RPT_NUM [integer]

mean (sd) : 0 (0)
min < med < max :
0 < 0 < 0
IQR (CV) : 0 (NaN)

1 distinct val.

6 (0%)

147863 (100%)

126

REV_NUM [integer]

mean (sd) : 0.08 (0.33)
min < med < max :
-1 < 0 < 7
IQR (CV) : 0 (4.34)

9 distinct val.

147869 (100%)

0 (0%)

127

CURR_STAT [logical]

147869 (100.0%)

147869 (100%)

0 (0%)

128

REV_STAT [integer]

mean (sd) : 0.01 (0.12)
min < med < max :
0 < 0 < 5
IQR (CV) : 0 (9.41)

6 distinct val.

146724 (99.23%)

1145 (0.77%)

129

GLOB_STAT [logical]

147869 (100.0%)

147869 (100%)

0 (0%)

130

OUT [character]

  1. DE
  2. OF

86156 (60.6%)
55911 (39.4%)

142067 (96.08%)

5802 (3.92%)

131

PAGE_OWNER [character]

  1. User, Test
  2. Etienne, Chris
  3. MALLENAHALLI, SUDHA
  4. HAMILTON, LONNIE
  5. Parker, Gerald
  6. Ledoux, Ashley
  7. Kreamer, Michael
  8. Poirier, Donald
  9. Rachal, Michael
  10. Bedwell, Sgt. Ray
    [ 557 others ]

438 (24.5%)
173 ( 9.7%)
91 ( 5.1%)
38 ( 2.1%)
27 ( 1.5%)
25 ( 1.4%)
23 ( 1.3%)
22 ( 1.2%)
21 ( 1.2%)
16 ( 0.9%)
915 (52.6%)

1789 (1.21%)

146080 (98.79%)

132

REV_DATE [integer]

mean (sd) : 10445.77 (17366.44)
min < med < max :
367 < 367 < 40637
IQR (CV) : 39819 (1.66)

411 distinct val.

142155 (96.14%)

5714 (3.86%)

133

PAGE_OWNER_APPROVER [character]

  1. User, Test
  2. Jones, James
  3. Mallenahalli, Sudha
  4. Parker, Gerald
  5. Hamilton, Lonnie
  6. Rachal, Michael
  7. Kreamer, Michael
  8. Michel, Sgt. Shawn
  9. Viney, James
  10. Poirier, Donald
    [ 309 others ]

438 (24.5%)
152 ( 8.5%)
90 ( 5.0%)
42 ( 2.4%)
39 ( 2.2%)
38 ( 2.1%)
29 ( 1.6%)
29 ( 1.6%)
28 ( 1.6%)
25 ( 1.4%)
879 (49.6%)

1789 (1.21%)

146080 (98.79%)

134

VERSION_ORIGINAL [character]

  1. 1.9.2217.21241
  2. 1.9.867.5309

605 ( 0.7%)
84951 (99.3%)

85556 (57.86%)

62313 (42.14%)

135

VERSION_CURRENT [character]

  1. 1.9.2217.21241
  2. 1.9.867.5309

427 ( 0.5%)
87762 (99.5%)

88189 (59.64%)

59680 (40.36%)

136

num_tot_inj_b_veh [integer]

mean (sd) : 0.01 (0.11)
min < med < max :
0 < 0 < 5
IQR (CV) : 0 (11.74)

6 distinct val.

147705 (99.89%)

164 (0.11%)

137

num_tot_inj_c_veh [integer]

mean (sd) : 0.08 (0.35)
min < med < max :
0 < 0 < 11
IQR (CV) : 0 (4.45)

11 distinct val.

147705 (99.89%)

164 (0.11%)

138

num_tot_inj_d_veh [integer]

mean (sd) : 0.37 (0.88)
min < med < max :
0 < 0 < 41
IQR (CV) : 0 (2.38)

29 distinct val.

147705 (99.89%)

164 (0.11%)

139

num_tot_inj_b_ped [integer]

mean (sd) : 0 (0.03)
min < med < max :
0 < 0 < 3
IQR (CV) : 0 (37.67)

4 distinct val.

147869 (100%)

0 (0%)

140

num_tot_inj_c_ped [integer]

mean (sd) : 0 (0.06)
min < med < max :
0 < 0 < 6
IQR (CV) : 0 (18.32)

4 distinct val.

147869 (100%)

0 (0%)

141

num_tot_inj_d_ped [integer]

mean (sd) : 0 (0.06)
min < med < max :
0 < 0 < 4
IQR (CV) : 0 (17.99)

5 distinct val.

147869 (100%)

0 (0%)

142

num_tot_inj_b [integer]

mean (sd) : 0.01 (0.11)
min < med < max :
0 < 0 < 5
IQR (CV) : 0 (11.23)

6 distinct val.

147705 (99.89%)

164 (0.11%)

143

num_tot_inj_c [integer]

mean (sd) : 0.08 (0.35)
min < med < max :
0 < 0 < 11
IQR (CV) : 0 (4.33)

11 distinct val.

147705 (99.89%)

164 (0.11%)

144

num_tot_inj_d [integer]

mean (sd) : 0.37 (0.88)
min < med < max :
0 < 0 < 41
IQR (CV) : 0 (2.36)

29 distinct val.

147705 (99.89%)

164 (0.11%)

145

num_occ [integer]

mean (sd) : 2.72 (1.88)
min < med < max :
1 < 2 < 65
IQR (CV) : 1 (0.69)

56 distinct val.

147705 (99.89%)

164 (0.11%)

146

num_occ_no_seatb [integer]

mean (sd) : 0.1 (1.13)
min < med < max :
0 < 0 < 60
IQR (CV) : 0 (11)

52 distinct val.

147705 (99.89%)

164 (0.11%)

147

violation [integer]

mean (sd) : 1 (0.37)
min < med < max :
0 < 1 < 6
IQR (CV) : 0 (0.37)

7 distinct val.

147705 (99.89%)

164 (0.11%)

148

speed [integer]

mean (sd) : 0 (0)
min < med < max :
0 < 0 < 0
IQR (CV) : 0 (NaN)

1 distinct val.

6 (0%)

147863 (100%)

149

num_hospitalized_veh [integer]

mean (sd) : 0.22 (0.65)
min < med < max :
0 < 0 < 29
IQR (CV) : 0 (2.97)

18 distinct val.

147705 (99.89%)

164 (0.11%)

150

num_hospitalized_ped [integer]

mean (sd) : 0.01 (0.08)
min < med < max :
0 < 0 < 6
IQR (CV) : 0 (14.7)

5 distinct val.

147869 (100%)

0 (0%)

151

num_tot_hospitalized [integer]

mean (sd) : 0.23 (0.66)
min < med < max :
0 < 0 < 29
IQR (CV) : 0 (2.91)

18 distinct val.

147705 (99.89%)

164 (0.11%)

152

agressive [integer]

mean (sd) : 0.7 (0.48)
min < med < max :
0 < 1 < 5
IQR (CV) : 1 (0.69)

6 distinct val.

147705 (99.89%)

164 (0.11%)

153

distraction [integer]

mean (sd) : 0.58 (0.52)
min < med < max :
0 < 1 < 5
IQR (CV) : 1 (0.91)

6 distinct val.

147705 (99.89%)

164 (0.11%)

154

HSRG_DATE [integer]

mean (sd) : 40407.52 (117.45)
min < med < max :
40007 < 40414 < 40763
IQR (CV) : 195 (0)

462 distinct val.

147869 (100%)

0 (0%)

# Visual data-profiling step using DataExplorer. Lines beginning with "## " in
# this section are console output captured when the report was rendered; they
# are kept verbatim and are not explanatory comments.
library(DataExplorer)
## Warning: package 'DataExplorer' was built under R version 3.4.3
# Missing-value profile for dat1 (the table read with fread() at the top of
# the file).
plot_missing(dat1)

# Same profile for dat2.
# NOTE(review): dat2 is not created in this part of the file; the category
# counts reported below (e.g. CRASH_NUM: 147869) suggest it is the wider
# 147869-row table summarised above -- confirm where it is built.
plot_missing(dat2)

# Bar charts of the discrete columns of dat2. As the captured message below
# shows, columns with more than 50 categories are skipped (27 of them here).
plot_bar(dat2)
## 27 columns ignored with more than 50 categories.
## CRASH_NUM: 147869 categories
## CRASH_NUM1: 147869 categories
## ISDS_CODE: 86 categories
## AMB_SERVICE: 5608 categories
## DIST_ZONE: 4319 categories
## FIRE_DEPT: 4507 categories
## INTER_ROAD: 41269 categories
## INVEST_OFFICER: 19042 categories
## PRI_ROAD_NAME: 20189 categories
## PRI_ROAD_TYPE: 208 categories
## REPORT_NUM: 70243 categories
## RPT_ORIGIN: 161 categories
## SEC_INTER_ROAD: 9527 categories
## WHO_ENTERED: 4608 categories
## CITY: 554 categories
## INTER_ROAD_NAME: 25868 categories
## INTER_ROAD_TYPE: 220 categories
## INVEST_AGENCY_NAME: 1497 categories
## INVEST_OFFICER_BADGENUM: 6251 categories
## PARISH: 65 categories
## PRI_ROAD: 40175 categories
## REPORT_NUM_2: 79934 categories
## SEC_INTER_ROAD_NAME: 5023 categories
## SEC_INTER_ROAD_TYPE: 92 categories
## HWY_BYPASS: 219 categories
## PAGE_OWNER: 568 categories
## PAGE_OWNER_APPROVER: 320 categories

# Correlation plot for dat2. The warning at the end of the captured output
# names cor(final_data, ...), so `use = "pairwise.complete.obs"` is presumably
# forwarded to stats::cor() -- confirm against the DataExplorer docs.
# The category cut-off reported here is 20 rather than 50, which is why
# BYPASS_CD (43 categories) is dropped in addition to the 27 columns above.
plot_correlation(dat2, use = "pairwise.complete.obs")
## 28 features with more than 20 categories ignored!
## CRASH_NUM: 147869 categories
## CRASH_NUM1: 147869 categories
## ISDS_CODE: 86 categories
## AMB_SERVICE: 5608 categories
## BYPASS_CD: 43 categories
## DIST_ZONE: 4319 categories
## FIRE_DEPT: 4507 categories
## INTER_ROAD: 41269 categories
## INVEST_OFFICER: 19042 categories
## PRI_ROAD_NAME: 20189 categories
## PRI_ROAD_TYPE: 208 categories
## REPORT_NUM: 70243 categories
## RPT_ORIGIN: 161 categories
## SEC_INTER_ROAD: 9527 categories
## WHO_ENTERED: 4608 categories
## CITY: 554 categories
## INTER_ROAD_NAME: 25868 categories
## INTER_ROAD_TYPE: 220 categories
## INVEST_AGENCY_NAME: 1497 categories
## INVEST_OFFICER_BADGENUM: 6251 categories
## PARISH: 65 categories
## PRI_ROAD: 40175 categories
## REPORT_NUM_2: 79934 categories
## SEC_INTER_ROAD_NAME: 5023 categories
## SEC_INTER_ROAD_TYPE: 92 categories
## HWY_BYPASS: 219 categories
## PAGE_OWNER: 568 categories
## PAGE_OWNER_APPROVER: 320 categories
## Warning in cor(final_data, ...): the standard deviation is zero
# NOTE(review): the zero-standard-deviation warning presumably comes from
# columns with a single distinct value (the summary table earlier in this file
# lists STATE_RPT_NUM and speed with "1 distinct val."). Correlations involving
# such columns would be undefined -- confirm, and consider dropping constant
# columns before this call.