First we bring in the data file and rename the columns to be more usable names
kickstart <- read.csv("A2_kickstart.csv", stringsAsFactors = FALSE)
colnames(kickstart) <- c("Project", "num_launched", "num_successful", "dol_pleged", "num_pleged", "success_rate", "avg_pleged")
Convert the dollars pleged into millions
library(dplyr)
## Warning: package 'dplyr' was built under R version 3.4.3
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
kickstart2 <- kickstart %>% arrange(dol_pleged) %>% mutate(mdol_pleged = round(dol_pleged / 1000000, digits = 0))
## Warning: package 'bindrcpp' was built under R version 3.4.4
Create graphic
library(ggplot2)
library(ggthemes)
## Warning: package 'ggthemes' was built under R version 3.4.4
library(scales)
## Warning: package 'scales' was built under R version 3.4.4
ggplot(kickstart2, aes(x = reorder(Project, mdol_pleged), fill = success_rate)) +
geom_bar(stat = "identity", aes(y = mdol_pleged)) +
geom_text(aes(label=dollar(mdol_pleged), y = mdol_pleged),hjust = -0.05, color="grey", size = 3) +
coord_flip() +
xlab("Project Category") +
ylab("Total Pledged (M)") +
ggtitle("Kickstarter 2012 Crowdfunded Projects") +
labs(fill='*Success Rate (%)', caption = "Source: Company Reports *Fully funded projects as a % of all projects", subtitle = "Author: Sean McGowan") +
scale_y_continuous(labels = scales :: dollar, limits=c(0, 90))+
scale_fill_gradient(low="blue", high="red") +
theme_few()
