Who Will Win the 2016 Presidential Election?

##   polarity subjectivity pos_refs_per_ref neg_refs_per_ref
## 1       -1    0.6666667        0.0000000        0.6666667
## 2        1    0.5000000        0.5000000        0.0000000
## 3        0    0.3333333        0.1666667        0.1666667
##   senti_diffs_per_ref
## 1          -0.6666667
## 2           0.5000000
## 3           0.0000000

##   polarity subjectivity pos_refs_per_ref neg_refs_per_ref
## 1       -1          0.5              0.0              0.5
## 2        1          0.5              0.5              0.0
##   senti_diffs_per_ref
## 1                -0.5
## 2                 0.5

##       polarity subjectivity pos_refs_per_ref neg_refs_per_ref
## 1   1.00000000   0.09803922       0.09803922       0.00000000
## 2   0.09090909   0.25581395       0.13953488       0.11627907
## 3   0.50000000   0.12500000       0.09375000       0.03125000
## 4   1.00000000   0.07317073       0.07317073       0.00000000
## 5   1.00000000   0.08333333       0.08333333       0.00000000
## 6   0.60000000   0.07352941       0.05882353       0.01470588
## 7  -0.14285714   0.14893617       0.06382979       0.08510638
## 8  -1.00000000   0.06666667       0.00000000       0.06666667
## 9   1.00000000   0.06122449       0.06122449       0.00000000
## 10  0.25000000   0.23529412       0.14705882       0.08823529
## 11  0.00000000   0.10526316       0.05263158       0.05263158
## 12  0.00000000   0.05555556       0.02777778       0.02777778
## 13  0.60000000   0.09259259       0.07407407       0.01851852
## 14  1.00000000   0.03030303       0.03030303       0.00000000
## 15 -0.33333333   0.09375000       0.03125000       0.06250000
## 16  1.00000000   0.03703704       0.03703704       0.00000000
## 17  0.00000000   0.07547170       0.03773585       0.03773585
## 18  0.60000000   0.17857143       0.14285714       0.03571429
## 19  0.33333333   0.11111111       0.07407407       0.03703704
## 20  0.00000000   0.00000000       0.00000000       0.00000000
## 21  1.00000000   0.06250000       0.06250000       0.00000000
## 22  1.00000000   0.10000000       0.10000000       0.00000000
## 23 -0.60000000   0.19230769       0.03846154       0.15384615
## 24  0.60000000   0.15151515       0.12121212       0.03030303
## 25  1.00000000   0.12500000       0.12500000       0.00000000
## 26  0.00000000   0.07142857       0.03571429       0.03571429
## 27  0.00000000   0.21052632       0.10526316       0.10526316
## 28  0.33333333   0.09090909       0.06060606       0.03030303
## 29  0.00000000   0.06451613       0.03225806       0.03225806
## 30 -0.33333333   0.10714286       0.03571429       0.07142857
##    senti_diffs_per_ref
## 1           0.09803922
## 2           0.02325581
## 3           0.06250000
## 4           0.07317073
## 5           0.08333333
## 6           0.04411765
## 7          -0.02127660
## 8          -0.06666667
## 9           0.06122449
## 10          0.05882353
## 11          0.00000000
## 12          0.00000000
## 13          0.05555556
## 14          0.03030303
## 15         -0.03125000
## 16          0.03703704
## 17          0.00000000
## 18          0.10714286
## 19          0.03703704
## 20          0.00000000
## 21          0.06250000
## 22          0.10000000
## 23         -0.11538462
## 24          0.09090909
## 25          0.12500000
## 26          0.00000000
## 27          0.00000000
## 28          0.03030303
## 29          0.00000000
## 30         -0.03571429

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.0000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.: 0.0000   1st Qu.:0.06786   1st Qu.:0.03604   1st Qu.:0.00000  
##  Median : 0.3333   Median :0.09317   Median :0.06186   Median :0.03078  
##  Mean   : 0.3499   Mean   :0.10588   Mean   :0.06811   Mean   :0.03778  
##  3rd Qu.: 1.0000   3rd Qu.:0.12500   3rd Qu.:0.09697   3rd Qu.:0.06003  
##  Max.   : 1.0000   Max.   :0.25581   Max.   :0.14706   Max.   :0.15385  
##  senti_diffs_per_ref
##  Min.   :-0.11538   
##  1st Qu.: 0.00000   
##  Median : 0.03367   
##  Mean   : 0.03033   
##  3rd Qu.: 0.06250   
##  Max.   : 0.12500

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-0.3333   Min.   :0.03030   Min.   :0.02778   Min.   :0.00000  
##  1st Qu.: 0.0000   1st Qu.:0.06970   1st Qu.:0.03571   1st Qu.:0.00000  
##  Median : 0.3333   Median :0.09175   Median :0.06720   Median :0.03030  
##  Mean   : 0.4296   Mean   :0.10619   Mean   :0.07334   Mean   :0.03285  
##  3rd Qu.: 1.0000   3rd Qu.:0.11458   3rd Qu.:0.10383   3rd Qu.:0.03721  
##  Max.   : 1.0000   Max.   :0.25581   Max.   :0.14706   Max.   :0.11628  
##  senti_diffs_per_ref
##  Min.   :-0.03571   
##  1st Qu.: 0.00000   
##  Median : 0.03367   
##  Mean   : 0.04049   
##  3rd Qu.: 0.06421   
##  Max.   : 0.12500

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.0000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.:-0.1071   1st Qu.:0.06838   1st Qu.:0.03739   1st Qu.:0.00000  
##  Median : 0.2500   Median :0.09688   Median :0.06066   Median :0.03348  
##  Mean   : 0.2588   Mean   :0.10553   Mean   :0.06212   Mean   :0.04341  
##  3rd Qu.: 0.9000   3rd Qu.:0.14295   3rd Qu.:0.09115   3rd Qu.:0.06563  
##  Max.   : 1.0000   Max.   :0.21053   Max.   :0.14286   Max.   :0.15385  
##  senti_diffs_per_ref
##  Min.   :-0.11538   
##  1st Qu.:-0.01596   
##  Median : 0.01852   
##  Mean   : 0.01872   
##  3rd Qu.: 0.06250   
##  Max.   : 0.10714

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :0.00000   Min.   :0.06452   Min.   :0.03226   Min.   :0.03030  
##  1st Qu.:0.08333   1st Qu.:0.07111   1st Qu.:0.03935   1st Qu.:0.03079  
##  Median :0.16667   Median :0.07771   Median :0.04643   Median :0.03128  
##  Mean   :0.16667   Mean   :0.07771   Mean   :0.04643   Mean   :0.03128  
##  3rd Qu.:0.25000   3rd Qu.:0.08431   3rd Qu.:0.05352   3rd Qu.:0.03177  
##  Max.   :0.33333   Max.   :0.09091   Max.   :0.06061   Max.   :0.03226  
##  senti_diffs_per_ref
##  Min.   :0.000000   
##  1st Qu.:0.007576   
##  Median :0.015152   
##  Mean   :0.015152   
##  3rd Qu.:0.022727   
##  Max.   :0.030303

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.0000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.: 0.0000   1st Qu.:0.07186   1st Qu.:0.03792   1st Qu.:0.00000  
##  Median : 0.4167   Median :0.09589   Median :0.06850   Median :0.03078  
##  Mean   : 0.3653   Mean   :0.11065   Mean   :0.07222   Mean   :0.03843  
##  3rd Qu.: 1.0000   3rd Qu.:0.14295   3rd Qu.:0.09951   3rd Qu.:0.06003  
##  Max.   : 1.0000   Max.   :0.25581   Max.   :0.14706   Max.   :0.15385  
##  senti_diffs_per_ref
##  Min.   :-0.11538   
##  1st Qu.: 0.00000   
##  Median : 0.04058   
##  Mean   : 0.03378   
##  3rd Qu.: 0.07050   
##  Max.   : 0.12500

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-0.3333   Min.   :0.03704   Min.   :0.03571   Min.   :0.00000  
##  1st Qu.: 0.0000   1st Qu.:0.05456   1st Qu.:0.03604   1st Qu.:0.01786  
##  Median : 0.3333   Median :0.07209   Median :0.03638   Median :0.03571  
##  Mean   : 0.3333   Mean   :0.07209   Mean   :0.03638   Mean   :0.03571  
##  3rd Qu.: 0.6667   3rd Qu.:0.08962   3rd Qu.:0.03671   3rd Qu.:0.05357  
##  Max.   : 1.0000   Max.   :0.10714   Max.   :0.03704   Max.   :0.07143  
##  senti_diffs_per_ref 
##  Min.   :-0.0357143  
##  1st Qu.:-0.0175265  
##  Median : 0.0006614  
##  Mean   : 0.0006614  
##  3rd Qu.: 0.0188492  
##  Max.   : 0.0370370

## [1] "Using direct authentication"

## [1] 1

## [1] "Rate limited .... blocking for a minute and retrying up to 119 times ..."

##     polarity      subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.00   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.: 0.00   1st Qu.:0.00000   1st Qu.:0.00000   1st Qu.:0.00000  
##  Median : 0.00   Median :0.06066   Median :0.00000   Median :0.00000  
##  Mean   : 0.01   Mean   :0.07348   Mean   :0.03633   Mean   :0.03715  
##  3rd Qu.: 0.00   3rd Qu.:0.12500   3rd Qu.:0.07280   3rd Qu.:0.07280  
##  Max.   : 1.00   Max.   :0.33333   Max.   :0.16667   Max.   :0.21429  
##  senti_diffs_per_ref 
##  Min.   :-0.1428571  
##  1st Qu.: 0.0000000  
##  Median : 0.0000000  
##  Mean   :-0.0008273  
##  3rd Qu.: 0.0000000  
##  Max.   : 0.1538461

By comparing the top two Democratic and Republican candidates, I predict that Doanld Trump will win the election because he has the second highest network density, the most mentions on twitter around Washington, realtively equal positive and neutral remarks composing tweets he is mentioned in, and positive mean polarity and mean sentiment.

## [1] "Using direct authentication"

## [1] 1

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref
##  Min.   :-1.0000   Min.   :0.00000   Min.   :0.00000   Min.   :0.0000  
##  1st Qu.: 0.0000   1st Qu.:0.00000   1st Qu.:0.00000   1st Qu.:0.0000  
##  Median : 0.0000   Median :0.07143   Median :0.00000   Median :0.0000  
##  Mean   : 0.1144   Mean   :0.07288   Mean   :0.04388   Mean   :0.0290  
##  3rd Qu.: 1.0000   3rd Qu.:0.12500   3rd Qu.:0.07692   3rd Qu.:0.0625  
##  Max.   : 1.0000   Max.   :0.46154   Max.   :0.40000   Max.   :0.2500  
##  senti_diffs_per_ref
##  Min.   :-0.25000   
##  1st Qu.: 0.00000   
##  Median : 0.00000   
##  Mean   : 0.01489   
##  3rd Qu.: 0.06667   
##  Max.   : 0.40000

##     polarity        subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.0000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.: 0.0000   1st Qu.:0.05000   1st Qu.:0.00000   1st Qu.:0.00000  
##  Median : 0.3333   Median :0.08333   Median :0.06458   Median :0.00000  
##  Mean   : 0.1801   Mean   :0.10513   Mean   :0.06938   Mean   :0.03575  
##  3rd Qu.: 1.0000   3rd Qu.:0.20000   3rd Qu.:0.13333   3rd Qu.:0.06667  
##  Max.   : 1.0000   Max.   :0.55556   Max.   :0.55556   Max.   :0.20000  
##  senti_diffs_per_ref
##  Min.   :-0.20000   
##  1st Qu.: 0.00000   
##  Median : 0.05556   
##  Mean   : 0.03362   
##  3rd Qu.: 0.06667   
##  Max.   : 0.55556

##     polarity         subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.00000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.:-0.33333   1st Qu.:0.00000   1st Qu.:0.00000   1st Qu.:0.00000  
##  Median : 0.00000   Median :0.07692   Median :0.00000   Median :0.00000  
##  Mean   : 0.02102   Mean   :0.09039   Mean   :0.04466   Mean   :0.04573  
##  3rd Qu.: 0.60000   3rd Qu.:0.13333   3rd Qu.:0.07692   3rd Qu.:0.07692  
##  Max.   : 1.00000   Max.   :0.75000   Max.   :0.50000   Max.   :0.40000  
##  senti_diffs_per_ref
##  Min.   :-0.400000  
##  1st Qu.:-0.052632  
##  Median : 0.000000  
##  Mean   :-0.001066  
##  3rd Qu.: 0.066667  
##  Max.   : 0.400000

##     polarity         subjectivity     pos_refs_per_ref  neg_refs_per_ref 
##  Min.   :-1.00000   Min.   :0.00000   Min.   :0.00000   Min.   :0.00000  
##  1st Qu.: 0.00000   1st Qu.:0.00000   1st Qu.:0.00000   1st Qu.:0.00000  
##  Median : 0.00000   Median :0.08333   Median :0.00000   Median :0.00000  
##  Mean   : 0.03962   Mean   :0.08621   Mean   :0.04855   Mean   :0.03766  
##  3rd Qu.: 0.50000   3rd Qu.:0.12500   3rd Qu.:0.07692   3rd Qu.:0.07692  
##  Max.   : 1.00000   Max.   :0.36364   Max.   :0.28571   Max.   :0.25000  
##  senti_diffs_per_ref
##  Min.   :-0.25000   
##  1st Qu.: 0.00000   
##  Median : 0.00000   
##  Mean   : 0.01089   
##  3rd Qu.: 0.06250   
##  Max.   : 0.28571

polarityMeans = c(-0.08503, 0.337, 0.03197, 0.2528)
barplot(polarityMeans, main="Comparing Mean Polarities of Top Presidential Candidates", names.arg=c("Hillary Clinton", "Bernie Sanders", "Donald Trump", "Ben Carson"))

Bernie Sanders appears to have the most positive remarks made about him, while most remarks about Hillary Clinton seem to lean towards the negative side of things. Ben Carson was also the subject of mostly positive remarks, while thoughts on Donald Trump seem to almost be neutral.

sentimentMeans = c(-0.009639, 0.02218, 0.007444, 0.03925)
barplot(sentimentMeans, main="Comparing Mean Sentiments Towards Top Presidential Candidates", names.arg=c("Hillary Clinton", "Bernie Sanders", "Donald Trump", "Ben Carson"))

In this comparison, Ben Carson had the most positive remarks in relation to negative ones. On the other hand, negative remarks made about Hillary Clinton seem to outnumber the positive ones.

Words Most Commonly Associated with Hillary Clinton

comparison.cloud(ctdm, colors = brewer.pal(3, "Dark2"), scale = c(3,.5),random.order = FALSE)

Hillary’s wordcloud seems to be equal parts positive, negative, and neutral. Just like in Bernie’s below, negative remarks focus around “raise,” while her positive remarks focus around her “strategy.”

Words Most Commonly Associated with Bernie Sanders

comparison.cloud(stdm, colors = brewer.pal(3, "Dark2"), scale = c(3,.5),random.order = FALSE)

In Sanders’ wordcloud, the amount of negative and neutral words seems to be about equal. Remarks focused on topics surrounding the words “raise,” “untold,” and “1987.”

Words Most Commonly Associated with Donald Trump

comparison.cloud(ttdm, colors = brewer.pal(3, "Dark2"), scale = c(3,.5),random.order = FALSE)

As you can see, “hate” is the most commonly used negative word associated with Trump and his campaign. However, it is used significantly less than other positive and neutral words such as “military” and “like.”

Words Most Commonly Associated with Ben Carson

comparison.cloud(btdm, colors = brewer.pal(3, "Dark2"), scale = c(3,.5),random.order = FALSE)

Carson’s wordcloud had the most reused words out of all his competitors. Positive remarks surround topics like “refugees” and “terrorists.” Neutral and negative remarks take a broader view and involve frequently used words including “wellness,” “poll,” and “meek.”

Hillary Clinton’s Support Around Washington, D.C.

qmplot(longitude, latitude, data = cgeoDF_noNA, colour = I('red'),source="google")

Bernie Sanders’ Support Around Washington, D.C.

qmplot(longitude, latitude, data = sgeoDF_noNA, colour = I('red'),source="google")

Donald Trump’s Support Around Washington, D.C.

qmplot(longitude, latitude, data = tgeoDF_noNA, colour = I('red'),source="google")

Ben Carson’s Support Around Washington, D.C.

qmplot(longitude, latitude, data = bgeoDF_noNA, colour = I('red'),source="google")

When looking over all the candidates’geographical support maps, we see that Trump was tweeted about the most around the D.C. area and Sanders was tweeted about the least. Mentions of Clinton seem to focus more on the inner cities of D.C. and Baltimore as opposed to her competitors mentions, whose also include the outlying suburbs.

## [1] "Using direct authentication"

## [1] 1

The Twitter Network of Hillary Clinton

plot(MyGraph,
     layout=layout.fruchterman.reingold,
     main='Twitter Network',
     vertex.color = 'green',
     vertex.label.dist=0.25,
     vertex.frame.color='blue',
     vertex.label.color='black',
     vertex.label.font=0.1,
     vertex.label.cex=0.5,
     vertex.size = 0.5,
     vertex.shape = "circle",
     edge.arrow.size = 0,
     edge.lty = 6,
     edge.curved=0.5
)

The Twitter Network of Bernie Sanders

plot(sMyGraph,
     layout=layout.fruchterman.reingold,
     main='Twitter Network',
     vertex.color = 'green',
     vertex.label.dist=0.25,
     vertex.frame.color='blue',
     vertex.label.color='black',
     vertex.label.font=0.1,
     vertex.label.cex=0.5,
     vertex.size = 0.5,
     vertex.shape = "circle",
     edge.arrow.size = 0,
     edge.lty = 6,
     edge.curved=0.5
)

The Twitter Network of Donald Trump

plot(tMyGraph,
     layout=layout.fruchterman.reingold,
     main='Twitter Network',
     vertex.color = 'green',
     vertex.label.dist=0.25,
     vertex.frame.color='blue',
     vertex.label.color='black',
     vertex.label.font=0.1,
     vertex.label.cex=0.5,
     vertex.size = 0.5,
     vertex.shape = "circle",
     edge.arrow.size = 0,
     edge.lty = 6,
     edge.curved=0.5
)

The Twitter Network of Ben Carson

plot(bMyGraph,
     layout=layout.fruchterman.reingold,
     main='Twitter Network',
     vertex.color = 'green',
     vertex.label.dist=0.25,
     vertex.frame.color='blue',
     vertex.label.color='black',
     vertex.label.font=0.1,
     vertex.label.cex=0.5,
     vertex.size = 0.5,
     vertex.shape = "circle",
     edge.arrow.size = 0,
     edge.lty = 6,
     edge.curved=0.5
)

## [1] 0

## [1] 0.009679371

## [1] 0

## [1] 0.01585624

## [1] 0

## [1] 0.008928571

## [1] 0

## [1] 0.008751903

networkDensities = c(0.01295097, 0.010181, 0.01245791, 0.008249497)
barplot(networkDensities, main="Comparing Network Densities of Top Presidential Candidates", names.arg=c("Hillary Clinton", "Bernie Sanders", "Donald Trump", "Ben Carson"))

When comparing candidates’ twitter networks and the network densities, Hillary Clinton has the most dense network of mentions about her and her campaign, with Donald Trump close behind. *Analysis may be a little off because the tweets change daily and therefore affect what words appear in the word clouds.