Project description: https://www.coursera.org/learn/exploratory-data-analysis/peer/ylVFo/course-project-1
Import data from txt file
# Path of the semicolon-separated input file, relative to the working directory.
file_name <- "household_power_consumption.txt"
# Read the whole file; "?" marks a missing value. Column types are declared
# explicitly so they do not depend on type inference or on the R version's
# stringsAsFactors default: columns 1-2 (date and time strings) stay character,
# and the columns plotted later (3, 4, 5, 7, 8, 9) are numeric. Column 6 is not
# used by the code below, so its type is left to read.table() (NA).
data <- read.table(
  file_name,
  header = TRUE,
  sep = ";",
  dec = ".",
  na.strings = "?",
  colClasses = c(
    "character", "character",
    "numeric", "numeric", "numeric",
    NA,
    "numeric", "numeric", "numeric"
  ),
  stringsAsFactors = FALSE
)
Subset the data to the dates 2007-02-01 and 2007-02-02
# Keep only the rows whose Date string (day/month/year, no zero padding) is
# one of the two days of interest.
data <- data[
  is.element(data$Date, c("1/2/2007", "2/2/2007")),
]
Plot the histogram of global active power
# Histogram of the third column, drawn with red bars and an explicit title
# and x-axis label.
hist(
  data[[3]],
  main = "Global Active Power",
  xlab = "Global Active Power (kilowatts)",
  col = "red"
)
Set the time locale to English so that the weekday labels on the x-axis are printed in English
# Switch the time locale to the portable "C" locale so that weekday
# abbreviations on the time axis are English (Thu, Fri, Sat) on every
# platform. The locale name "English" is only recognised on Windows; on other
# systems the request is refused with a warning and the labels stay in the
# system language.
Sys.setlocale("LC_TIME", "C")
## [1] "C"
Build the date-time vector used as the x-axis
# Parse the day/month/year strings in column 1 into Date objects.
date_converted <- as.Date(data[, 1], format = "%d/%m/%Y")
# Parse the clock times in column 2. The format has no date fields, so
# strptime() fills in the current date; this value is not referenced by the
# plotting code below.
time_converted <- strptime(data[, 2], format = "%H:%M:%S")
# Combine the raw date and time strings and parse them with an explicit
# format, instead of relying on as.POSIXct() guessing the layout. The result
# is one POSIXct timestamp per row, in the session's time zone.
time_axis <- as.POSIXct(
  paste(data[, 1], data[, 2]),
  format = "%d/%m/%Y %H:%M:%S"
)
Plot global active power against the time vector, then plot the three energy sub-metering series against the same time vector
# Line chart of column 3 over time; the x-axis title is left blank.
plot(
  x = time_axis,
  y = data[[3]],
  type = "l",
  xlab = "",
  ylab = "Global Active Power (kilowatts)"
)
# Line chart of column 7 over time (default colour, black); this first call
# also sets up the axes for the two series added afterwards.
plot(
  x = time_axis,
  y = data[[7]],
  type = "l",
  xlab = "",
  ylab = "Energy sub metering"
)
# Overlay columns 8 and 9 on the same axes in red and blue.
lines(x = time_axis, y = data[[8]], col = "red")
lines(x = time_axis, y = data[[9]], col = "blue")
# Legend in the top-right corner, with line colours matching the three series.
legend(
  "topright",
  legend = c("Sub_metering_1", "Sub_metering_2", "Sub_metering_3"),
  lty = 1,
  col = c("black", "red", "blue")
)
Plot four graphs in a 2x2 layout
# Draw the next four plots on a 2 x 2 grid (filled row by row). par() returns
# the previous setting, which is kept so the layout can be restored afterwards
# instead of leaking into later plots in the same session.
old_par <- par(mfrow = c(2, 2))

# Top-left: column 3 over time.
plot(
  time_axis, data[, 3],
  type = "l",
  xlab = "",
  ylab = "Global Active Power (kilowatts)"
)

# Top-right: column 5 over time.
plot(
  time_axis, data[, 5],
  type = "l",
  xlab = "datetime",
  ylab = "Voltage"
)

# Bottom-left: columns 7, 8 and 9 on shared axes (black, red, blue).
plot(
  time_axis, data[, 7],
  type = "l",
  xlab = "",
  ylab = "Energy sub metering"
)
lines(time_axis, data[, 8], col = "red")
lines(time_axis, data[, 9], col = "blue")
# Smaller text and no box so the legend fits inside the reduced panel.
legend(
  "topright",
  legend = c("Sub_metering_1", "Sub_metering_2", "Sub_metering_3"),
  col = c("black", "red", "blue"),
  cex = 0.8,
  lty = 1,
  bty = "n"
)

# Bottom-right: column 4 over time.
plot(
  time_axis, data[, 4],
  type = "l",
  xlab = "datetime",
  ylab = "Global_reactive_power"
)

# Restore the layout that was active before this panel was drawn.
par(old_par)