Reading the Excel file
# Attach readxl so read_excel() is available, then read the workbook
# "diamonds.xlsx" (resolved relative to the working directory) into
# `mydiamonds`. No sheet is specified, so read_excel() picks its default.
library(readxl)
mydiamonds <- read_excel(path = "diamonds.xlsx")
Names of variables
# Print the column (variable) names of the data set.
colnames(mydiamonds)
## [1] "carat" "cut" "color" "clarity" "depth" "table" "price"
## [8] "x" "y" "z"
Top 6 observations
# Print the first six rows of the data set (six is head()'s default).
head(mydiamonds, n = 6L)
## # A tibble: 6 x 10
## carat cut color clarity depth table price x y z
## <dbl> <chr> <chr> <chr> <dbl> <dbl> <dbl> <dbl> <dbl> <dbl>
## 1 0.23 Ideal E SI2 61.5 55 326 3.95 3.98 2.43
## 2 0.21 Premium E SI1 59.8 61 326 3.89 3.84 2.31
## 3 0.23 Good E VS1 56.9 65 327 4.05 4.07 2.31
## 4 0.290 Premium I VS2 62.4 58 334 4.2 4.23 2.63
## 5 0.31 Good J SI2 63.3 58 335 4.34 4.35 2.75
## 6 0.24 Very Good J VVS2 62.8 57 336 3.94 3.96 2.48
Creating a new variable
# Add a `pricetable` column holding the element-wise sum of the `price`
# and `table` columns, then preview its first values.
mydiamonds[["pricetable"]] <- mydiamonds[["price"]] + mydiamonds[["table"]]
head(mydiamonds[["pricetable"]])
## [1] 381 387 392 392 393 393
# Print summary statistics (min, quartiles, median, mean, max) for the
# `pricetable` column.
summary(mydiamonds[["pricetable"]])
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## 381 1007 2459 3990 5383 18883