beaver <- read.csv(file="/Users/domin/OneDrive/Desktop/beaver.csv", header=TRUE, sep=",")
# 1. Use the summary function to gain an overview of the data set. Then display the mean and median for at least two attributes.
# Load the beaver measurements from the local CSV export. The first row of
# the file supplies the column names and fields are comma-separated.
beaver <- read.csv(
  file = "/Users/domin/OneDrive/Desktop/beaver.csv",
  header = TRUE,
  sep = ","
)

# Print summary statistics for every column of the loaded data frame.
summary(beaver)
## X day time temp activ
## Min. : 1.00 Min. :307.0 Min. : 0 Min. :36.58 Min. :0.00
## 1st Qu.: 25.75 1st Qu.:307.0 1st Qu.:1128 1st Qu.:37.15 1st Qu.:0.00
## Median : 50.50 Median :307.0 Median :1535 Median :37.73 Median :1.00
## Mean : 50.50 Mean :307.1 Mean :1446 Mean :37.60 Mean :0.62
## 3rd Qu.: 75.25 3rd Qu.:307.0 3rd Qu.:1942 3rd Qu.:37.98 3rd Qu.:1.00
## Max. :100.00 Max. :308.0 Max. :2350 Max. :38.35 Max. :1.00
# Mean and median of the `time` column, reported rounded to two decimals.
# The four statistics below stay as top-level variables because later
# comparisons reuse them.
time_mean <- mean(beaver[["time"]])
time_median <- median(beaver[["time"]])
print(
  paste0(
    "time mean is ", round(time_mean, digits = 2),
    ", time median is ", round(time_median, digits = 2)
  )
)
## [1] "time mean is 1446.2, time median is 1535"

# Same report for the `temp` column.
temp_mean <- mean(beaver[["temp"]])
temp_median <- median(beaver[["temp"]])
print(
  paste0(
    "temp mean is ", round(temp_mean, digits = 2),
    ", temp median is ", round(temp_median, digits = 2)
  )
)
## [1] "temp mean is 37.6, temp median is 37.74"
# Keep only the observations whose time is strictly above the median time and
# whose temperature is at or above the median temperature.
#
# The thresholds are the medians computed earlier (`time_median`,
# `temp_median`) rather than hand-copied literals, so the filter stays correct
# if the input data changes.
# NOTE(review): the previous literals were 1535 and 37.74 (the rounded
# medians). For temperatures recorded to two decimals the unrounded median
# should select the same rows -- confirm against the summary below.
#
# `subset()` already returns a data frame, so no extra `data.frame()` wrapper
# is needed.
animals <- subset(beaver, time > time_median & temp >= temp_median)

# Tag every column with a "_new" suffix so the subset's columns are easy to
# tell apart from the original data. Deriving the names from the existing
# ones avoids a length mismatch if the column set ever changes.
colnames(animals) <- paste0(colnames(animals), "_new")

# Print summary statistics for every column of the subset.
summary(animals)
## X_new day_new time_new temp_new activ_new
## Min. :39.00 Min. :307 Min. :1550 Min. :37.74 Min. :1
## 1st Qu.:49.75 1st Qu.:307 1st Qu.:1738 1st Qu.:37.84 1st Qu.:1
## Median :60.50 Median :307 Median :1925 Median :37.99 Median :1
## Mean :61.82 Mean :307 Mean :1946 Mean :37.99 Mean :1
## 3rd Qu.:73.50 3rd Qu.:307 3rd Qu.:2135 3rd Qu.:38.11 3rd Qu.:1
## Max. :86.00 Max. :307 Max. :2340 Max. :38.35 Max. :1
# Compare each statistic of the full data set with the same statistic of the
# `animals` subset. Every value is rounded to two decimals for display, and
# each subset statistic is computed right before the line that reports it.

# Mean of time: full data vs. subset.
ntime_mean <- mean(animals[["time_new"]])
print(
  paste0(
    "time mean is ", round(time_mean, digits = 2),
    ", time_new mean is ", round(ntime_mean, digits = 2)
  )
)
## [1] "time mean is 1446.2, time_new mean is 1946.36"

# Median of time: full data vs. subset.
ntime_median <- median(animals[["time_new"]])
print(
  paste0(
    "time median is ", round(time_median, digits = 2),
    ", time_new median is ", round(ntime_median, digits = 2)
  )
)
## [1] "time median is 1535, time_new median is 1925"

# Mean of temp: full data vs. subset.
ntemp_mean <- mean(animals[["temp_new"]])
print(
  paste0(
    "temp mean is ", round(temp_mean, digits = 2),
    ", temp_new mean is ", round(ntemp_mean, digits = 2)
  )
)
## [1] "temp mean is 37.6, temp_new mean is 37.99"

# Median of temp: full data vs. subset.
ntemp_median <- median(animals[["temp_new"]])
print(
  paste0(
    "temp median is ", round(temp_median, digits = 2),
    ", temp_new median is ", round(ntemp_median, digits = 2)
  )
)
## [1] "temp median is 37.74, temp_new median is 37.99"
# Recode the activity flag as text: convert the column to character and
# relabel the value "1" as "ACTIVE"; any other value keeps its character
# form. `local()` keeps the intermediate vector out of the workspace.
animals[["activ_new"]] <- local({
  flags <- as.character(animals[["activ_new"]])
  replace(flags, flags == "1", "ACTIVE")
})

# Show the first ten rows of the recoded subset.
head(animals, n = 10)
## X_new day_new time_new temp_new activ_new
## 39 39 307 1550 37.98 ACTIVE
## 40 40 307 1600 38.02 ACTIVE
## 41 41 307 1610 38.00 ACTIVE
## 42 42 307 1620 38.24 ACTIVE
## 43 43 307 1630 38.10 ACTIVE
## 44 44 307 1640 38.24 ACTIVE
## 45 45 307 1650 38.11 ACTIVE
## 46 46 307 1700 38.02 ACTIVE
## 47 47 307 1710 38.11 ACTIVE
## 48 48 307 1720 38.01 ACTIVE