beaver <- read.csv(file="/Users/domin/OneDrive/Desktop/beaver.csv", header=TRUE, sep=",")

1. Use the summary function to gain an overview of the data set. Then display the mean and median for at least two attributes.

  # Load the beaver readings from the CSV export. The first line of the file
  # supplies the column names and fields are separated by commas.
  beaver <- read.csv(
    file = "/Users/domin/OneDrive/Desktop/beaver.csv",
    header = TRUE,
    sep = ","
  )
  # Per-column overview (min, quartiles, median, mean, max) of the raw data.
  summary(beaver)
##        X               day             time           temp           activ     
##  Min.   :  1.00   Min.   :307.0   Min.   :   0   Min.   :36.58   Min.   :0.00  
##  1st Qu.: 25.75   1st Qu.:307.0   1st Qu.:1128   1st Qu.:37.15   1st Qu.:0.00  
##  Median : 50.50   Median :307.0   Median :1535   Median :37.73   Median :1.00  
##  Mean   : 50.50   Mean   :307.1   Mean   :1446   Mean   :37.60   Mean   :0.62  
##  3rd Qu.: 75.25   3rd Qu.:307.0   3rd Qu.:1942   3rd Qu.:37.98   3rd Qu.:1.00  
##  Max.   :100.00   Max.   :308.0   Max.   :2350   Max.   :38.35   Max.   :1.00
# Mean and median of the two attributes under study (time and temp),
# computed over the full data set.
time_mean <- mean(beaver[["time"]])
temp_mean <- mean(beaver[["temp"]])
time_median <- median(beaver[["time"]])
temp_median <- median(beaver[["temp"]])

# Report the time statistics, rounded to two decimals.
print(
  paste0(
    "time mean is ", round(time_mean, 2),
    ", time median is ", round(time_median, 2)
  )
)
## [1] "time mean is 1446.2, time median is 1535"
# Report the temp statistics, rounded to two decimals.
print(
  paste0(
    "temp mean is ", round(temp_mean, 2),
    ", temp median is ", round(temp_median, 2)
  )
)
## [1] "temp mean is 37.6, temp median is 37.74"
  2. Create a new data frame with a subset of the columns and rows. Make sure to rename it.
# Keep only the readings with time above 1535 and temp of at least 37.74
# (these thresholds equal the overall medians printed earlier, rounded to two
# decimals). All columns are retained. which() drops rows whose condition is
# NA, so missing readings are excluded rather than kept as NA rows.
animals <- data.frame(
  beaver[which(beaver$time > 1535 & beaver$temp >= 37.74), , drop = FALSE]
)
  3. Create new column names for the new data frame.
# Give every column of the filtered data frame a "_new" suffix. Names are
# assigned by position, so the order must match the columns of `animals`.
names(animals) <- c(
  "X_new",
  "day_new",
  "time_new",
  "temp_new",
  "activ_new"
)
  4. Use the summary function to create an overview of your new data frame. Then print the mean and median for the same two attributes. Please compare.
# Overview of the filtered, renamed data frame, for comparison with the
# summary of the full data set.
summary(animals)
##      X_new          day_new       time_new       temp_new       activ_new
##  Min.   :39.00   Min.   :307   Min.   :1550   Min.   :37.74   Min.   :1  
##  1st Qu.:49.75   1st Qu.:307   1st Qu.:1738   1st Qu.:37.84   1st Qu.:1  
##  Median :60.50   Median :307   Median :1925   Median :37.99   Median :1  
##  Mean   :61.82   Mean   :307   Mean   :1946   Mean   :37.99   Mean   :1  
##  3rd Qu.:73.50   3rd Qu.:307   3rd Qu.:2135   3rd Qu.:38.11   3rd Qu.:1  
##  Max.   :86.00   Max.   :307   Max.   :2340   Max.   :38.35   Max.   :1
# Same statistics as for the full data set, now computed on the filtered
# data frame (the "n" prefix marks the new values).
ntime_mean <- mean(animals[["time_new"]])
ntemp_mean <- mean(animals[["temp_new"]])
ntime_median <- median(animals[["time_new"]])
ntemp_median <- median(animals[["temp_new"]])

# Mean of time: full data set versus filtered subset (two decimals).
print(
  paste0(
    "time mean is ", round(time_mean, 2),
    ", time_new mean is ", round(ntime_mean, 2)
  )
)
## [1] "time mean is 1446.2, time_new mean is 1946.36"
# Median of time: full data set versus filtered subset.
print(
  paste0(
    "time median is ", round(time_median, 2),
    ", time_new median is ", round(ntime_median, 2)
  )
)
## [1] "time median is 1535, time_new median is 1925"
# Mean of temp: full data set versus filtered subset.
print(
  paste0(
    "temp mean is ", round(temp_mean, 2),
    ", temp_new mean is ", round(ntemp_mean, 2)
  )
)
## [1] "temp mean is 37.6, temp_new mean is 37.99"
# Median of temp: full data set versus filtered subset.
print(
  paste0(
    "temp median is ", round(temp_median, 2),
    ", temp_new median is ", round(ntemp_median, 2)
  )
)
## [1] "temp median is 37.74, temp_new median is 37.99"
  5. Rename at least 3 values in a column so that every value in that column is renamed.
# Replace the numeric activity codes with readable labels. The column is
# converted to character first so it can hold text. %in% is used instead of
# == because it never yields NA, so missing values simply stay NA.
animals$activ_new <- as.character(animals$activ_new)
animals$activ_new[animals$activ_new %in% "1"] <- "ACTIVE"
# Relabel the other code as well, so that no raw "0" survives if the row
# filter is ever changed to let such rows through (the current filter keeps
# only rows whose code is 1).
# NOTE(review): assumes 0 means "not active" - confirm against the data source.
animals$activ_new[animals$activ_new %in% "0"] <- "INACTIVE"
  6. Display enough rows to see examples of the results of all of steps 1-5 above.
# Show the first ten rows so the filtered rows, the renamed columns and the
# relabelled activity values are all visible.
head(animals, n = 10)
##    X_new day_new time_new temp_new activ_new
## 39    39     307     1550    37.98    ACTIVE
## 40    40     307     1600    38.02    ACTIVE
## 41    41     307     1610    38.00    ACTIVE
## 42    42     307     1620    38.24    ACTIVE
## 43    43     307     1630    38.10    ACTIVE
## 44    44     307     1640    38.24    ACTIVE
## 45    45     307     1650    38.11    ACTIVE
## 46    46     307     1700    38.02    ACTIVE
## 47    47     307     1710    38.11    ACTIVE
## 48    48     307     1720    38.01    ACTIVE