Base R has many built in functions that can be used to create different type of plots. Some of them are discussed here.

Get help on your problems from experienced statisticians at homeworkhelponline.net.


Pie Chart

> food <- c("Burger","Pasta","Pizza","Rice","Chicken")
> price <- c(200,150,600,100,90)
> # to find percentage amount
> par <- round(price/sum(price)*100)    
> # to define Food object in pie chart with percentage sign and value
> labs <- paste(food,par,"%")
> pie(price,
+     labels = labs, 
+     col=1:5,
+     main="Pie Chart of Food Price")

> pie(price,
+     labels = labs, col=1:5,
+     main="Pie Chart of Food Price",
+     radius=0.4)

Barplot

> barplot(price,main="Barplot", xlab="Food", ylab="Price",
+         names.arg=food)

> barplot(price,main="Barplot", xlab="Price", ylab="Food Item",
+         names.arg=food,col=1:5)

> barplot(price, ylab="Food", xlab="Price", main="Barplot of Foods",
+         horiz=F, names.arg=food,
+         border="blue",
+         col="lightblue",
+         density=30)

Using legend -

> barplot(price,
+         main="Barplot", xlab="Price", ylab="Food Item",
+         col=1:5)
> legend(x = "topright",food,lty="solid",col=1:5, bg = "gray90", text.col = "blue4")

Histogram

> N <- 100
> set.seed(11)
> x <- rnorm(1000, 10, 3)   # to draw 1000 normal random numebrs
> hist(x, breaks=N,
+      main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")

Reducing the number of breaks -

> N <- 30
> hist(x, breaks=N,
+      main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")

Increasing the number of breaks -

> N <- 200
> hist(x, breaks=N,
+      main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")

Sturges formula can be used for breaks using “Sturges” -

> hist(x, breaks="Sturges",
+      main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")

To set probabilities in the y-axis set probability=T -

> hist(x, breaks="Sturges",
+      main="Histogram of Sampling Distribution",xlab="Samples Range",ylab="Probability",
+      probability = T)

Y and X axis’s range can be changed using xlim and ylim -

> hist(x, breaks=100,
+      main="Histogram of Sampling Distribution",xlab="Samples Range",ylab="Probability",
+      probability = T, xlim=c(-5,25), ylim= c(0,0.2))

Density Plot

Using the function density() we can find kernal density -

> set.seed(11)
> a <- rnorm(1000, 10, 3)   # to draw 1000 normal random numbers
> x <- density(a)
> plot(x,
+      main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")

Using polygon() we can customize it-

> plot(x,
+      main="Histogram of Sampling DIstribution",
+      xlab="Samples Range",ylab="Frequency")
> polygon(x, col = "steelblue", border="black")

Boxplot

> set.seed(10)
> norm.number <- rnorm(100, 10, 3)
> pois.number <- rpois(10, 10)
> unif.number <- runif(n = 100, min = 0, max = 20)
> boxplot(norm.number, pois.number, unif.number,
+         main="Boxplot of different distributions")

Passing data frame to boxplot and using horizontal = T-

> dists <- data.frame(Normal=norm.number,
+                     Poisson=pois.number,
+                     Uniform=unif.number)
> boxplot(dists,
+         main="Boxplot of different distributions", horizontal = T)

> boxplot(dists,
+         main="Boxplot of different distributions", horizontal = T,
+         xlab="Frequiency", ylab="Distributions", col=1:3, las=1)

Scatter plot

This is the simplest way to graph a scatter plot -

> x <- 1:20
> y <- log10(x)*10
> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis")

Changing the type of points -

> x <- 1:20
> y <- log10(x)*10
> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      pch=20)

> x <- 1:20
> y <- log10(x)*10
> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      pch=10)

See the effect of using the argument las=1. It rotates the value of y-axis when las=1, rotates the value of x-axis when las=2 and rotates both when las=3. las=1 is pretty good to see:

> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      las=1)

Adding a fitted line to the graph -

> x <- 1:20
> y <- log10(x)*10
> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      pch=20)
> abline(lm(y ~ x), col="red")  # regression line
> lines(lowess(x,y), col="blue")  # draws a smooth line through the plot

Using cex to change the size of dots:

> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      cex=0.55)

> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis",
+      cex=1.4)

Let’s use the built-in USArrests data set-

> head(USArrests)
           Murder Assault UrbanPop Rape
Alabama      13.2     236       58 21.2
Alaska       10.0     263       48 44.5
Arizona       8.1     294       80 31.0
Arkansas      8.8     190       50 19.5
California    9.0     276       91 40.6
Colorado      7.9     204       78 38.7

Now -

> plot(USArrests$Murder, USArrests$Assault,
+      main="Relationship between Assault and Murder",
+      xlab="No. of Murder", ylab="Np. of Assault")
> abline(lm(USArrests$Assault ~ USArrests$Murder), col="red")
> lines(lowess(USArrests$Murder, USArrests$Assault), col="blue")

Multiple Scatterplots

Let’s use the built-in USArrests data set-

> head(USArrests)
           Murder Assault UrbanPop Rape
Alabama      13.2     236       58 21.2
Alaska       10.0     263       48 44.5
Arizona       8.1     294       80 31.0
Arkansas      8.8     190       50 19.5
California    9.0     276       91 40.6
Colorado      7.9     204       78 38.7

Let’s see the relationships through graph and correlation matrix -

> pairs(~Murder+UrbanPop+Rape,data=USArrests,
+    main="Simple Scatterplot Matrix")

> round(cor(USArrests[,c(1,3,4)]),2)
         Murder UrbanPop Rape
Murder     1.00     0.07 0.56
UrbanPop   0.07     1.00 0.41
Rape       0.56     0.41 1.00

Line plot

In plot() the argument type takes the values: “p” for points
“l” for lines
“b” for both points and lines
“c” for empty points joined by lines
“o” for overplotted points and lines
“s” and “S” for stair steps
“n” does not produce any points or lines

lty is for line type. Line types can either be specified as an integer (0=blank, 1=solid (default), 2=dashed, 3=dotted, 4=dotdash, 5=longdash, 6=twodash) or as one of the character strings “blank”, “solid”, “dashed”, “dotted”, “dotdash”, “longdash”, or “twodash” -

> x <- 1:20
> y <- log10(x)*10
> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis", 
+      type="l",lty=1)

Using type=b and pch=20 -

> plot(x,y,
+      main="Relationship between X and Y",
+      xlab="X-axis", ylab="Y-axis", 
+      type="b",lty=1, pch=20)

---
title: "Basic Plotting"
author: "MD AHSANUL ISLAM"
output: 
  html_document:
    toc: false
    toc_float: true
    toc_depth: 2
    theme: cerulean
    code_download: true
---

---

```{r, include=FALSE}
knitr::opts_chunk$set(
  comment = "", prompt = TRUE, message=F, warning = F
)
```
## {.tabset .tabset-fade .tabset-pills}

Base R has many built in functions that can be used to create different type of plots. Some of them are discussed here.

Get help on your problems from experienced statisticians at [homeworkhelponline.net](https://www.homeworkhelponline.net/programming/r-programming).

------

### Pie Chart

```{r}
food <- c("Burger","Pasta","Pizza","Rice","Chicken")
price <- c(200,150,600,100,90)
# to find percentage amount
par <- round(price/sum(price)*100)	
# to define Food object in pie chart with percentage sign and value
labs <- paste(food,par,"%")
pie(price,
    labels = labs, 
    col=1:5,
    main="Pie Chart of Food Price")
```


```{r}
pie(price,
    labels = labs, col=1:5,
    main="Pie Chart of Food Price",
    radius=0.4)
```



### Barplot

```{r}
barplot(price,main="Barplot", xlab="Food", ylab="Price",
        names.arg=food)
```

```{r}
barplot(price,main="Barplot", xlab="Price", ylab="Food Item",
        names.arg=food,col=1:5)
```
```{r}
barplot(price, ylab="Food", xlab="Price", main="Barplot of Foods",
        horiz=F, names.arg=food,
        border="blue",
        col="lightblue",
        density=30)
```

Using legend -
```{r}
barplot(price,
        main="Barplot", xlab="Price", ylab="Food Item",
        col=1:5)
legend(x = "topright",food,lty="solid",col=1:5, bg = "gray90", text.col = "blue4")
```


### Histogram

```{r}
N <- 100
set.seed(11)
x <- rnorm(1000, 10, 3)	# to draw 1000 normal random numebrs
hist(x, breaks=N,
     main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")
```

Reducing the number of breaks -
```{r}
N <- 30
hist(x, breaks=N,
     main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")
```

Increasing the number of breaks -
```{r}
N <- 200
hist(x, breaks=N,
     main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")
```

Sturges formula can be used for breaks using "Sturges" -
```{r}
hist(x, breaks="Sturges",
     main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")
```

To set probabilities in the y-axis set `probability=T` -
```{r}
hist(x, breaks="Sturges",
     main="Histogram of Sampling Distribution",xlab="Samples Range",ylab="Probability",
     probability = T)
```

Y and X axis's range can be changed using `xlim` and `ylim` -
```{r}
hist(x, breaks=100,
     main="Histogram of Sampling Distribution",xlab="Samples Range",ylab="Probability",
     probability = T, xlim=c(-5,25), ylim= c(0,0.2))
```


### Density Plot

Using the function `density()` we can find kernal density -
```{r}
set.seed(11)
a <- rnorm(1000, 10, 3)	# to draw 1000 normal random numbers
x <- density(a)
plot(x,
     main="Histogram of Sampling DIstribution",xlab="Samples Range",ylab="Frequency")
```

Using `polygon()` we can customize it-
```{r}
plot(x,
     main="Histogram of Sampling DIstribution",
     xlab="Samples Range",ylab="Frequency")
polygon(x, col = "steelblue", border="black")
```

### Boxplot

```{r}
set.seed(10)
norm.number <- rnorm(100, 10, 3)
pois.number <- rpois(10, 10)
unif.number <- runif(n = 100, min = 0, max = 20)
boxplot(norm.number, pois.number, unif.number,
        main="Boxplot of different distributions")
```

Passing data frame to boxplot and using `horizontal = T`-
```{r}
dists <- data.frame(Normal=norm.number,
                    Poisson=pois.number,
                    Uniform=unif.number)
boxplot(dists,
        main="Boxplot of different distributions", horizontal = T)
```

```{r}
boxplot(dists,
        main="Boxplot of different distributions", horizontal = T,
        xlab="Frequiency", ylab="Distributions", col=1:3, las=1)
```

### Scatter plot

This is the simplest way to graph a scatter plot -
```{r}
x <- 1:20
y <- log10(x)*10
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis")
```

Changing the type of points -
```{r}
x <- 1:20
y <- log10(x)*10
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     pch=20)
```

```{r}
x <- 1:20
y <- log10(x)*10
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     pch=10)
```


See the effect of using the argument `las=1`. It rotates the value of y-axis when `las=1`, rotates the value of x-axis when `las=2` and rotates both when `las=3`. `las=1` is pretty good to see:
```{r}
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     las=1)
```

Adding a fitted line to the graph - 
```{r}
x <- 1:20
y <- log10(x)*10
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     pch=20)
abline(lm(y ~ x), col="red")  # regression line
lines(lowess(x,y), col="blue")  # draws a smooth line through the plot
```

Using `cex` to change the size of dots:
```{r}
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     cex=0.55)
```

```{r}
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis",
     cex=1.4)
```


Let's use the built-in USArrests data set-
```{r}
head(USArrests)
```

Now -
```{r}
plot(USArrests$Murder, USArrests$Assault,
     main="Relationship between Assault and Murder",
     xlab="No. of Murder", ylab="Np. of Assault")
abline(lm(USArrests$Assault ~ USArrests$Murder), col="red")
lines(lowess(USArrests$Murder, USArrests$Assault), col="blue")
```

### Multiple Scatterplots

Let's use the built-in USArrests data set-
```{r}
head(USArrests)
```

Let's see the relationships through graph and correlation matrix -
```{r}
pairs(~Murder+UrbanPop+Rape,data=USArrests,
   main="Simple Scatterplot Matrix")
round(cor(USArrests[,c(1,3,4)]),2)
```

### Line plot 

In `plot()` the argument `type` takes the values: 
“p” for points   
“l” for lines   
“b” for both points and lines   
“c” for empty points joined by lines   
“o” for overplotted points and lines   
“s” and “S” for stair steps   
“n” does not produce any points or lines   

`lty` is for line type. Line types can either be specified as an integer (0=blank, 1=solid (default), 2=dashed, 3=dotted, 4=dotdash, 5=longdash, 6=twodash) or as one of the character strings “blank”, “solid”, “dashed”, “dotted”, “dotdash”, “longdash”, or “twodash” -
```{r}
x <- 1:20
y <- log10(x)*10
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis", 
     type="l",lty=1)
```

Using type=b and pch=20 -
```{r}
plot(x,y,
     main="Relationship between X and Y",
     xlab="X-axis", ylab="Y-axis", 
     type="b",lty=1, pch=20)
```

















