This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.

Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Ctrl+Shift+Enter.

## Clean Data
# Keep only the rows of imbd_rating whose year is greater than 2005.
imbdclean <- imbd_rating[imbd_rating$year > 2005, ]
# Strip the stray "Â" character from titles BEFORE finalimbd is derived, so the
# cleaned titles carry over into finalimbd and actionmovies. (Previously the
# clean-up ran on imbdclean after finalimbd had already been copied from it,
# so the data actually analysed kept the uncleaned titles.)
imbdclean$title <- gsub("Â", "", imbdclean$title)
# Drop every row that has a missing value in any column.
finalimbd <- imbdclean[complete.cases(imbdclean), ]
# Same clean-up for director names.
finalimbd$director <- gsub("Â", "", finalimbd$director)
# Keep movies whose genres string contains "Action". The call is namespaced
# because a bare filter() resolves to stats::filter() when dplyr is not attached.
actionmovies <- dplyr::filter(finalimbd, grepl("Action", genres))
# Restrict to the 2.35 aspect ratio. The comparison is against the string
# "2.35", so the column is compared by its character representation.
actionmovies <- actionmovies[actionmovies$aspect_ratio == "2.35", ]
# Bar plot of how often each aspect ratio occurs among the post-2005 rows.
imbdclean$aspect_ratio <- as.factor(imbdclean$aspect_ratio)
# Per-level counts as a data frame; the variable is kept for inspection but is
# not used by the plot below.
count <- dplyr::count(imbdclean, aspect_ratio)
counts <- table(imbdclean$aspect_ratio)
barplot(counts, main = "Aspect Ratio", xlab = "Dimensions")

# Multiple linear regression: gross explained by budget, score and the number
# of critic reviews, fitted on the filtered action movies.
reg <- lm(
  formula = actionmovies$gross ~
    actionmovies$budget + actionmovies$score + actionmovies$critic_reviews
)
# Coefficient table, residual summary and fit statistics for the model.
summary(object = reg)

Call:
lm(formula = actionmovies$gross ~ actionmovies$budget + actionmovies$score + 
    actionmovies$critic_reviews)

Residuals:
       Min         1Q     Median         3Q        Max 
-320804488  -30651992   -5086208   23817116  252130825 

Coefficients:
                              Estimate Std. Error t value Pr(>|t|)    
(Intercept)                 -1.398e+08  2.248e+07  -6.217 1.39e-09 ***
actionmovies$budget          5.410e-01  5.269e-02  10.268  < 2e-16 ***
actionmovies$score           1.589e+07  3.945e+06   4.028 6.84e-05 ***
actionmovies$critic_reviews  2.758e+05  2.962e+04   9.312  < 2e-16 ***
---
Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

Residual standard error: 59470000 on 364 degrees of freedom
Multiple R-squared:  0.6166,    Adjusted R-squared:  0.6135 
F-statistic: 195.2 on 3 and 364 DF,  p-value: < 2.2e-16
# Scatter plot of gross against budget for the filtered action movies, with the
# simple least-squares line overlaid. The line comes from a model fitted here
# rather than from hand-copied, rounded coefficients, so it always matches the
# data currently held in actionmovies.
plot(actionmovies$budget, actionmovies$gross, xlab = "Budget of Action movies with 2.35 AR", ylab = "Gross of Action movies with 2.35 AR")
abline(lm(gross ~ budget, data = actionmovies))

# Simple regression of gross on budget; printing it shows intercept and slope.
lm(formula = actionmovies$gross ~ actionmovies$budget)

Call:
lm(formula = actionmovies$gross ~ actionmovies$budget)

Coefficients:
        (Intercept)  actionmovies$budget  
          9.892e+06            8.960e-01  
# Column-by-column summary of the filtered action-movie data frame.
summary(object = actionmovies)
    title              genres            director            actor1             actor2             actor3         
 Length:368         Length:368         Length:368         Length:368         Length:368         Length:368        
 Class :character   Class :character   Class :character   Class :character   Class :character   Class :character  
 Mode  :character   Mode  :character   Mode  :character   Mode  :character   Mode  :character   Mode  :character  
                                                                                                                  
                                                                                                                  
                                                                                                                  
     length          budget          director_fb_likes actor1_fb_likes    actor2_fb_likes   actor3_fb_likes  
 Min.   : 81.0   Min.   :  2000000   Min.   :    0.0   Min.   :    21.0   Min.   :   17.0   Min.   :    7.0  
 1st Qu.:101.0   1st Qu.: 35000000   1st Qu.:   25.0   1st Qu.:   966.8   1st Qu.:  551.8   1st Qu.:  308.8  
 Median :110.5   Median : 65000000   Median :  135.0   Median : 11000.0   Median :  899.5   Median :  559.0  
 Mean   :114.5   Mean   : 89085685   Mean   :  730.5   Mean   : 11583.1   Mean   : 3475.1   Mean   : 1258.9  
 3rd Qu.:123.0   3rd Qu.:140000000   3rd Qu.:  340.5   3rd Qu.: 18000.0   3rd Qu.: 3000.0   3rd Qu.:  903.0  
 Max.   :215.0   Max.   :553632000   Max.   :22000.0   Max.   :137000.0   Max.   :27000.0   Max.   :23000.0  
 total_cast_likes    fb_likes      critic_reviews  users_reviews     users_votes          score        aspect_ratio 
 Min.   :    58   Min.   :     0   Min.   : 30.0   Min.   :  23.0   Min.   :   2508   Min.   :2.700   Min.   :2.35  
 1st Qu.:  2908   1st Qu.:     0   1st Qu.:188.8   1st Qu.: 178.8   1st Qu.:  54076   1st Qu.:5.875   1st Qu.:2.35  
 Median : 14968   Median : 15000   Median :265.0   Median : 342.5   Median : 119483   Median :6.400   Median :2.35  
 Mean   : 17760   Mean   : 24942   Mean   :290.3   Mean   : 497.3   Mean   : 174112   Mean   :6.371   Mean   :2.35  
 3rd Qu.: 25210   3rd Qu.: 38000   3rd Qu.:372.0   3rd Qu.: 637.0   3rd Qu.: 229681   3rd Qu.:6.925   3rd Qu.:2.35  
 Max.   :137712   Max.   :197000   Max.   :813.0   Max.   :4667.0   Max.   :1676169   Max.   :9.000   Max.   :2.35  
     gross                year     
 Min.   :      162   Min.   :2006  
 1st Qu.: 23047736   1st Qu.:2009  
 Median : 56114221   Median :2011  
 Mean   : 89708090   Mean   :2011  
 3rd Qu.:126248948   3rd Qu.:2014  
 Max.   :533316061   Max.   :2016  
# Simple regression of gross on score; printing it shows intercept and slope.
lm(formula = actionmovies$gross ~ actionmovies$score)

Call:
lm(formula = actionmovies$gross ~ actionmovies$score)

Coefficients:
       (Intercept)  actionmovies$score  
        -218685712            48408514  
# Simple regression of gross on the number of critic reviews; printing it shows
# intercept and slope.
lm(formula = actionmovies$gross ~ actionmovies$critic_reviews)

Call:
lm(formula = actionmovies$gross ~ actionmovies$critic_reviews)

Coefficients:
                (Intercept)  actionmovies$critic_reviews  
                  -48611078                       476463  
# Scatter plot of gross against score for the filtered action movies, with the
# simple least-squares line overlaid. The line is drawn from a model fitted
# here instead of hard-coded coefficients, so it stays correct if the data
# behind actionmovies change.
plot(actionmovies$score, actionmovies$gross, xlab = "Score of Action movies with 2.35 AR", ylab = "Gross of Action movies with 2.35 AR")
abline(lm(gross ~ score, data = actionmovies))

# Scatter plot of gross against the number of critic reviews for the filtered
# action movies, with the simple least-squares line overlaid. The line is drawn
# from a model fitted here instead of hard-coded coefficients, so it stays
# correct if the data behind actionmovies change.
plot(actionmovies$critic_reviews, actionmovies$gross, xlab = "Critics Reviews of Action movies with 2.35 AR", ylab = "Gross of Action movies with 2.35 AR")
abline(lm(gross ~ critic_reviews, data = actionmovies))

# Min, quartiles, median, mean and max of gross.
summary(actionmovies[["gross"]])
     Min.   1st Qu.    Median      Mean   3rd Qu.      Max. 
      162  23047736  56114221  89708090 126248948 533316061 
# Min, quartiles, median, mean and max of budget.
summary(actionmovies[["budget"]])
     Min.   1st Qu.    Median      Mean   3rd Qu.      Max. 
  2000000  35000000  65000000  89085685 140000000 553632000 
# Min, quartiles, median, mean and max of score.
summary(actionmovies[["score"]])
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  2.700   5.875   6.400   6.371   6.925   9.000 
# Min, quartiles, median, mean and max of the number of critic reviews.
summary(actionmovies[["critic_reviews"]])
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   30.0   188.8   265.0   290.3   372.0   813.0 

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Ctrl+Alt+I.

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Ctrl+Shift+K to preview the HTML file).

LS0tDQp0aXRsZTogIlIgTm90ZWJvb2siDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQpUaGlzIGlzIGFuIFtSIE1hcmtkb3duXShodHRwOi8vcm1hcmtkb3duLnJzdHVkaW8uY29tKSBOb3RlYm9vay4gV2hlbiB5b3UgZXhlY3V0ZSBjb2RlIHdpdGhpbiB0aGUgbm90ZWJvb2ssIHRoZSByZXN1bHRzIGFwcGVhciBiZW5lYXRoIHRoZSBjb2RlLiANCg0KVHJ5IGV4ZWN1dGluZyB0aGlzIGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqUnVuKiBidXR0b24gd2l0aGluIHRoZSBjaHVuayBvciBieSBwbGFjaW5nIHlvdXIgY3Vyc29yIGluc2lkZSBpdCBhbmQgcHJlc3NpbmcgKkN0cmwrU2hpZnQrRW50ZXIqLiANCg0KYGBge3J9DQojI0NsZWFuIERhdGENCiNGaWx0ZXIgeWVhcnMgLSBncmVhdGVyIDIwMDUNCg0KaW1iZGNsZWFuIDwtIGltYmRfcmF0aW5nW2ltYmRfcmF0aW5nJHllYXIgPiAyMDA1LCBdDQpgYGANCg0KYGBge3J9DQojR2V0IHJpZCBvZiBudWxsIHJvd3MNCmZpbmFsaW1iZCA8LSBpbWJkY2xlYW5bY29tcGxldGUuY2FzZXMoaW1iZGNsZWFuKSwgXQ0KI0NsZWFuIHRpdGxlDQppbWJkY2xlYW4kdGl0bGUgPC0gZ3N1YigiwiIsICcnLCBpbWJkY2xlYW4kdGl0bGUpDQojQ2xlYW4gRGlyZWN0b3IgDQpmaW5hbGltYmQkZGlyZWN0b3IgPC0gZ3N1YigiwiIsICcnLCBmaW5hbGltYmQkZGlyZWN0b3IpDQoNCmBgYA0KDQpgYGB7cn0NCiNmaWx0ZXIgZ2VucmUNCmFjdGlvbm1vdmllcyA8LSBmaWx0ZXIoZmluYWxpbWJkLCBncmVwbCgnQWN0aW9uJywgZ2VucmVzKSkNCmBgYA0KDQpgYGB7cn0NCiNmaWx0ZXIgYXNwZWN0IHJhdGlvDQphY3Rpb25tb3ZpZXMgPC0gYWN0aW9ubW92aWVzW2FjdGlvbm1vdmllcyRhc3BlY3RfcmF0aW8gPT0gIjIuMzUiLCBdDQpgYGANCg0KYGBge3J9DQojaGlzdG9ncmFtDQppbWJkY2xlYW4kYXNwZWN0X3JhdGlvIDwtIGFzLmZhY3RvcihpbWJkY2xlYW4kYXNwZWN0X3JhdGlvKQ0KY291bnQgPC0gY291bnQoaW1iZGNsZWFuLCBhc3BlY3RfcmF0aW8pDQpjb3VudHMgPC0gdGFibGUoaW1iZGNsZWFuJGFzcGVjdF9yYXRpbykNCmJhcnBsb3QoY291bnRzLCBtYWluID0gIkFzcGVjdCBSYXRpbyIsIHhsYWIgPSAiRGltZW5zaW9ucyIpDQpgYGANCg0KYGBge3J9DQojcmVncmVzc2lvbiBtb2RlbA0KcmVnIDwtIGxtKGFjdGlvbm1vdmllcyRncm9zcyB+IGFjdGlvbm1vdmllcyRidWRnZXQgKyBhY3Rpb25tb3ZpZXMkc2NvcmUgKyBhY3Rpb25tb3ZpZXMkY3JpdGljX3Jldmlld3MpDQpzdW1tYXJ5KHJlZykNCg0KYGBgDQoNCmBgYHtyfQ0KcGxvdChhY3Rpb25tb3ZpZXMkYnVkZ2V0LCBhY3Rpb25tb3ZpZXMkZ3Jvc3MsIHhsYWIgPSAiQnVkZ2V0IG9mIEFjdGlvbiBtb3ZpZXMgd2l0aCAyLjM1IEFSIiwgeWxhYiA9ICJHcm9zcyBvZiBBY3Rpb24gbW92aWVzIHdpdGggMi4zNSBBUiIpDQphYmxpbmUoOS44OTJlKzA2LCA4Ljk2MGUtMDEpDQpgYGANCg0KYGBge3J9DQoNCmxtKGFjdGlvbm1vdmllcyRncm9zcyB+IGFjdGlv
bm1vdmllcyRidWRnZXQpDQpgYGANCg0KYGBge3J9DQpzdW1tYXJ5KGFjdGlvbm1vdmllcykNCmBgYA0KDQpgYGB7cn0NCmxtKGFjdGlvbm1vdmllcyRncm9zcyB+IGFjdGlvbm1vdmllcyRzY29yZSkNCmBgYA0KDQpgYGB7cn0NCmxtKGFjdGlvbm1vdmllcyRncm9zcyB+IGFjdGlvbm1vdmllcyRjcml0aWNfcmV2aWV3cykNCmBgYA0KDQpgYGB7cn0NCnBsb3QoYWN0aW9ubW92aWVzJHNjb3JlLCBhY3Rpb25tb3ZpZXMkZ3Jvc3MsIHhsYWIgPSAiU2NvcmUgb2YgQWN0aW9uIG1vdmllcyB3aXRoIDIuMzUgQVIiLCB5bGFiID0gIkdyb3NzIG9mIEFjdGlvbiBtb3ZpZXMgd2l0aCAyLjM1IEFSIikNCmFibGluZSgtMjE4Njg1NzEyLCA0ODQwODUxNCkNCmBgYA0KDQpgYGB7cn0NCnBsb3QoYWN0aW9ubW92aWVzJGNyaXRpY19yZXZpZXdzLCBhY3Rpb25tb3ZpZXMkZ3Jvc3MsIHhsYWIgPSAiQ3JpdGljcyBSZXZpZXdzIG9mIEFjdGlvbiBtb3ZpZXMgd2l0aCAyLjM1IEFSIiwgeWxhYiA9ICJHcm9zcyBvZiBBY3Rpb24gbW92aWVzIHdpdGggMi4zNSBBUiIpDQphYmxpbmUoLTQ4NjExMDc4LCA0NzY0NjMpDQpgYGANCg0KYGBge3J9DQpzdW1tYXJ5KGFjdGlvbm1vdmllcyRncm9zcykNCmBgYA0KDQpgYGB7cn0NCnN1bW1hcnkoYWN0aW9ubW92aWVzJGJ1ZGdldCkNCmBgYA0KDQpgYGB7cn0NCnN1bW1hcnkoYWN0aW9ubW92aWVzJHNjb3JlKQ0KYGBgDQoNCmBgYHtyfQ0Kc3VtbWFyeShhY3Rpb25tb3ZpZXMkY3JpdGljX3Jldmlld3MpDQpgYGANCg0KDQoNCkFkZCBhIG5ldyBjaHVuayBieSBjbGlja2luZyB0aGUgKkluc2VydCBDaHVuayogYnV0dG9uIG9uIHRoZSB0b29sYmFyIG9yIGJ5IHByZXNzaW5nICpDdHJsK0FsdCtJKi4NCg0KV2hlbiB5b3Ugc2F2ZSB0aGUgbm90ZWJvb2ssIGFuIEhUTUwgZmlsZSBjb250YWluaW5nIHRoZSBjb2RlIGFuZCBvdXRwdXQgd2lsbCBiZSBzYXZlZCBhbG9uZ3NpZGUgaXQgKGNsaWNrIHRoZSAqUHJldmlldyogYnV0dG9uIG9yIHByZXNzICpDdHJsK1NoaWZ0K0sqIHRvIHByZXZpZXcgdGhlIEhUTUwgZmlsZSkuDQo=