This data set contains crime records from Los Angeles, covering 2020 to the present.
library(dplyr)
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
# Show the working directory; the relative CSV path below is resolved against it.
getwd()
## [1] "/Users/elyssa/Desktop"
# Read the CSV file (first row holds the column names) into a data frame.
data <- read.csv(file = "dataset.csv", header = TRUE)
Summary statistics for every column of the data set:
# Print per-column summary statistics for the loaded data frame.
summary(object = data)
## DR_NO Date.Rptd DATE.OCC TIME.OCC
## Min. : 817 Length:978628 Length:978628 Min. : 1
## 1st Qu.:210607328 Class :character Class :character 1st Qu.: 900
## Median :220811628 Mode :character Mode :character Median :1420
## Mean :219656430 Mean :1339
## 3rd Qu.:230911028 3rd Qu.:1900
## Max. :249925282 Max. :2359
##
## AREA AREA.NAME Rpt.Dist.No Part.1.2
## Min. : 1.0 Length:978628 Min. : 101 Min. :1.000
## 1st Qu.: 5.0 Class :character 1st Qu.: 589 1st Qu.:1.000
## Median :11.0 Mode :character Median :1141 Median :1.000
## Mean :10.7 Mean :1117 Mean :1.405
## 3rd Qu.:16.0 3rd Qu.:1617 3rd Qu.:2.000
## Max. :21.0 Max. :2199 Max. :2.000
##
## Crm.Cd Crm.Cd.Desc Mocodes Vict.Age
## Min. :110.0 Length:978628 Length:978628 Min. : -4.00
## 1st Qu.:331.0 Class :character Class :character 1st Qu.: 0.00
## Median :442.0 Mode :character Mode :character Median : 30.00
## Mean :500.8 Mean : 29.12
## 3rd Qu.:626.0 3rd Qu.: 44.00
## Max. :956.0 Max. :120.00
##
## Vict.Sex Vict.Descent Premis.Cd Premis.Desc
## Length:978628 Length:978628 Min. :101.0 Length:978628
## Class :character Class :character 1st Qu.:101.0 Class :character
## Mode :character Mode :character Median :203.0 Mode :character
## Mean :306.2
## 3rd Qu.:501.0
## Max. :976.0
## NA's :15
## Weapon.Used.Cd Weapon.Desc Status Status.Desc
## Min. :101.0 Length:978628 Length:978628 Length:978628
## 1st Qu.:311.0 Class :character Class :character Class :character
## Median :400.0 Mode :character Mode :character Mode :character
## Mean :363.8
## 3rd Qu.:400.0
## Max. :516.0
## NA's :652669
## Crm.Cd.1 Crm.Cd.2 Crm.Cd.3 Crm.Cd.4
## Min. :110.0 Min. :210.0 Min. :310.0 Min. :821.0
## 1st Qu.:331.0 1st Qu.:998.0 1st Qu.:998.0 1st Qu.:998.0
## Median :442.0 Median :998.0 Median :998.0 Median :998.0
## Mean :500.6 Mean :958.2 Mean :984.2 Mean :991.2
## 3rd Qu.:626.0 3rd Qu.:998.0 3rd Qu.:998.0 3rd Qu.:998.0
## Max. :956.0 Max. :999.0 Max. :999.0 Max. :999.0
## NA's :11 NA's :909812 NA's :976319 NA's :978564
## LOCATION Cross.Street LAT LON
## Length:978628 Length:978628 Min. : 0.00 Min. :-118.7
## Class :character Class :character 1st Qu.:34.01 1st Qu.:-118.4
## Mode :character Mode :character Median :34.06 Median :-118.3
## Mean :34.00 Mean :-118.1
## 3rd Qu.:34.16 3rd Qu.:-118.3
## Max. :34.33 Max. : 0.0
##
Histogram of the TIME.OCC column (time of occurrence):
# Histogram of TIME.OCC with one bin per clock hour.
# NOTE(review): TIME.OCC appears to be 24-hour HHMM time stored as an integer
# (summary() reports a range of 1 to 2359) — confirm against the data dictionary.
# Breaks every 100 give one bin per hour. right = FALSE makes the bins
# left-closed, [h00, (h+1)00), so on-the-hour values such as 1200 are counted
# in their own hour; hist()'s default right-closed bins would put them in the
# previous hour's bar.
hist(
  data$TIME.OCC,
  breaks = seq(0, 2400, by = 100),
  right = FALSE,
  main = "Records by hour of TIME.OCC",
  xlab = "TIME.OCC (24-hour HHMM)",
  ylab = "Number of records"
)
Scatter plot of Crm.Cd against TIME.OCC (drawn with base R `plot()`, not ggplot2):
# Scatter plot with TIME.OCC on the x-axis and Crm.Cd on the y-axis (base graphics).
plot(x = data$TIME.OCC, y = data$Crm.Cd)
Correlation between TIME.OCC and Crm.Cd:
# Correlation coefficient between TIME.OCC and Crm.Cd, using cor()'s default method.
# NOTE(review): Crm.Cd looks like a categorical code rather than a measured
# quantity, so this coefficient may not be meaningful — confirm intent.
with(data, cor(x = TIME.OCC, y = Crm.Cd))
## [1] 0.01186739