Text sentiment analysis

# Text cleaning pipeline for the corpus `TextDoc`.
# Every tm_map() call applies one transformation to each document and its
# result feeds the next call, so the order of the steps matters.

# Helper transformer: replace every match of the regular expression `pattern`
# with a single space.
toSpace <- content_transformer(function(x, pattern) gsub(pattern, " ", x))

# Helper transformer: map typographic (curly) quotes to their ASCII forms.
# Why: removePunctuation() with default arguments only strips ASCII
# punctuation, and the custom stop word "s" below relies on the apostrophe
# being removed afterwards. If curly quotes are left in place, tokens ending
# in a curly apostrophe survive the cleaning and show up as separate terms.
straightenQuotes <- content_transformer(function(x) {
  x <- gsub("[\u2018\u2019]", "'", x)
  gsub("[\u201C\u201D]", "\"", x)
})

# Normalise quotes first so every later step only has to deal with ASCII
# apostrophes and double quotes.
TextDoc <- tm_map(TextDoc, straightenQuotes)

# Replace "/", "@" and "|" with a space ("|" is escaped because the pattern
# is a regular expression).
TextDoc <- tm_map(TextDoc, toSpace, "/")
TextDoc <- tm_map(TextDoc, toSpace, "@")
TextDoc <- tm_map(TextDoc, toSpace, "\\|")

# Convert the text to lower case
TextDoc <- tm_map(TextDoc, content_transformer(tolower))

# Remove numbers
TextDoc <- tm_map(TextDoc, removeNumbers)

# Remove common English stop words. This runs before punctuation removal so
# that contractions still contain their apostrophe when they are matched.
TextDoc <- tm_map(TextDoc, removeWords, stopwords("english"))

# Remove custom stop words, given as a character vector.
# "s" drops the possessive suffix that remains after an apostrophe.
TextDoc <- tm_map(TextDoc, removeWords, c("s", "company", "team"))

# Remove punctuation
TextDoc <- tm_map(TextDoc, removePunctuation)

# Collapse the extra white space left behind by the removals above
TextDoc <- tm_map(TextDoc, stripWhitespace)

# Text stemming - reduces words to their root form
TextDoc <- tm_map(TextDoc, stemDocument)
##                      word freq
## martin             martin  154
## trayvon           trayvon  150
## shoot               shoot  107
## case                 case  102
## fla                   fla  100
## zimmerman       zimmerman   76
## teen                 teen   70
## death               death   52
## florida           florida   38
## watch               watch   32
## law                   law   29
## shooter           shooter   28
## polic               polic   25
## charg               charg   24
## neighborhood neighborhood   23
## attorney         attorney   23
## hoodi               hoodi   23
## ralli               ralli   22
## new                   new   22
## prosecutor     prosecutor   22
## say                   say   21
## arrest             arrest   20
## ground             ground   19
## stand               stand   19
## gun                   gun   19
## kill                 kill   18
## group               group   17
## miami               miami   16
## shot                 shot   16
## famili             famili   15
## black               black   14
## want                 want   13
## chief               chief   13
## sanford           sanford   13
## protest           protest   13
## lawyer             lawyer   13
## make                 make   13
## nra                   nra   13
## call                 call   12
## turn                 turn   12
## justic             justic   12
## judg                 judg   12
## media               media   12
## offici             offici   12
## race                 race   12
## apolog             apolog   12
## court               court   12
## answer             answer   11
## march               march   11
## comment           comment   11
## support           support   11
## trial               trial   11
## romney             romney   11
## student           student   10
## dead                 dead   10
## racial             racial   10
## georg               georg   10
## leader             leader    9
## parent             parent    9
## slain               slain    9
## nyc                   nyc    9
## right               right    9
## center             center    9
## photo               photo    9
## show                 show    9
## obama               obama    9
## fight               fight    9
## speak               speak    9
## defens             defens    9
## skittl             skittl    9
## brand               brand    9
## known               known    9
## key                   key    9
## captain           captain    8
## hear                 hear    8
## appear             appear    8
## citi                 citi    8
## teenag             teenag    8
## activist         activist    8
## look                 look    8
## fox                   fox    8
## wade                 wade    8
## heat                 heat    8
## wear                 wear    8
## may                   may    8
## old                   old    8
## town                 town    8
## legal               legal    8
## give                 give    8
## releas             releas    8
## son                   son    7
## good                 good    7
## vigilant         vigilant    7
## expert             expert    7
## step                 step    7
## aid                   aid    7
## church             church    7
## tulsa               tulsa    7
## lawmak             lawmak    7
## video               video    7
## forc                 forc    7
## get                   get    7
## take                 take    7
## murder             murder    7
## grand               grand    7
## juri                 juri    7
## file                 file    7
## sought             sought    6
## investig         investig    6
## sharpton         sharpton    6
## selfdefens     selfdefens    6
## probe               probe    6
## neighbor         neighbor    6
## nation             nation    6
## hundr               hundr    6
## die                   die    6
## social             social    6
## rivera             rivera    6
## join                 join    6
## man                   man    6
## argument         argument    6
## bring               bring    6
## hate                 hate    6
## anthoni           anthoni    6
## address           address    6
## lee                   lee    6
## retweet           retweet    6
## spike               spike    6
## contact           contact    6
## rais                 rais    6
## review             review    6
## event               event    6
## resid               resid    6
## advoc               advoc    6
## food                 food    6
## conserv           conserv    6
## bail                 bail    6
## cosbi               cosbi    6
## jail                 jail    6
## crime               crime    5
## fatal               fatal    5
## fed                   fed    5
## white               white    5
## angst               angst    5
## set                   set    5
## histori           histori    5
## school             school    5
## role                 role    5
## question         question    5
## hous                 hous    5

## $answer
## suburb 
##   0.42 
## 
## $death
## numeric(0)
## 
## $famili
##     info     leak  countri     home identifi 
##     0.36     0.36     0.36     0.36     0.36 
## 
## $teen
## numeric(0)
## 
## $want
## background 
##       0.39 
## 
## $fla
## numeric(0)
## 
## $sought
##   suburb  postpon independ     venu 
##     0.58     0.47     0.41     0.41 
## 
## $captain
## client 
##    0.5 
## 
## $crime
##   baltimor      local        tie        can    citizen      sevag  tateosian 
##       0.45       0.45       0.45       0.45       0.45       0.45       0.45 
##       evid   american blackblack       wide 
##       0.45       0.45       0.45       0.45 
## 
## $kill
## shock  burn 
##  0.47  0.40 
## 
## $shoot
## numeric(0)
## 
## $watch
## numeric(0)
## 
## $call
## horribl   sourc 
##     0.4     0.4 
## 
## $neighborhood
##  volunt    pull     arm postpon 
##    0.41    0.41    0.35    0.35 
## 
## $attorney
## numeric(0)
## 
## $chief
## temporarili     embattl 
##        0.55        0.48 
## 
## $miami
##   gather thousand 
##     0.43     0.37 
## 
## $sanford
## threaten 
##     0.39 
## 
## $turn
##      inc     amid backlash    focus 
##     0.57     0.57     0.57     0.57 
## 
## $arrest
## numeric(0)
## 
## $group
##   advocaci  complaint     common        woo       amid   backlash      focus 
##       0.48       0.48       0.46       0.45       0.45       0.45       0.45 
##       alec        bid   gunright presidenti 
##       0.39       0.39       0.39       0.39 
## 
## $leader
## baptist pressur 
##    0.50    0.38 
## 
## $black
## tension    code    male 
##    0.53    0.46    0.46 
## 
## $investig
##      fbi   depart   provok independ 
##     0.41     0.41     0.41     0.41 
## 
## $parent
## react eager 
##  0.47  0.47 
## 
## $slain
## friend  never 
##   0.50   0.47 
## 
## $martin
## numeric(0)
## 
## $shooter
## numeric(0)
## 
## $trayvon
## numeric(0)
## 
## $ralli
##   hold  naacp gather 
##   0.42   0.42   0.36 
## 
## $sharpton
##  mother     rev alabama headlin 
##    0.71    0.71    0.41    0.41 
## 
## $shot
## numeric(0)
## 
## $student
## numeric(0)
## 
## $law
## numeric(0)
## 
## $selfdefens
##   bush    jeb hamper secret    wit   spur statut  cover 
##   0.47   0.47   0.41   0.41   0.41   0.41   0.41   0.40 
## 
## $protest
## numeric(0)
## 
## $fatal
##  depart atlanta 
##    0.45    0.45 
## 
## $fed
## numeric(0)
## 
## $florida
## numeric(0)
## 
## $justic
## numeric(0)
## 
## $say
## accid   mom 
##  0.37  0.37 
## 
## $ground
## confus   told 
##   0.39   0.39 
## 
## $hear
##  extens     yet    seal   senat   heart   heavi    atti    next    week schedul 
##    0.50    0.50    0.50    0.35    0.35    0.35    0.35    0.35    0.35    0.35 
## 
## $stand
## confus   told 
##   0.39   0.39 
## 
## $lawyer
## numeric(0)
## 
## $probe
##     alleg   plagiar   possibl     laugh newsbreak   sheriff 
##      0.41      0.41      0.41      0.41      0.41      0.41 
## 
## $son
## code male like word hand 
## 0.65 0.65 0.53 0.38 0.38 
## 
## $white
##    word    dade  spread    care conting  health   peopl 
##    0.45    0.45    0.45    0.45    0.45    0.45    0.45 
## 
## $appear
## numeric(0)
## 
## $dead
## numeric(0)
## 
## $march
## numeric(0)
## 
## $nyc
## mother    rev 
##   0.57   0.57 
## 
## $right
##   civil pressur   owner 
##    0.57    0.38    0.38 
## 
## $good
##    morn buffalo 
##    0.43    0.43 
## 
## $neighbor
##  bandag    nose     saw swollen 
##    0.41    0.41    0.41    0.41 
## 
## $vigilant
##  cleaver      end missouri      rep     mike    tyson 
##     0.38     0.38     0.38     0.38     0.38     0.38 
## 
## $nation
##      brief      world     licens       took     galvan      studi    deepwat 
##       0.58       0.58       0.41       0.41       0.41       0.41       0.41 
##    horizon    rookeri      spill comparison     hitler     vandal    martinx 
##       0.41       0.41       0.41       0.41       0.41       0.41       0.40 
## 
## $citi
##  tension     slam    carol    ethic longview   return 
##     0.70     0.35     0.35     0.35     0.35     0.35 
## 
## $polic
## temporarili 
##        0.39 
## 
## $hundr
## numeric(0)
## 
## $teenag
##   horribl oklahoman      hand 
##      0.50      0.35      0.35 
## 
## $expert
##     arm opinion   shape     cri  forens     lay     low    talk  plight 
##    0.65    0.38    0.38    0.38    0.38    0.38    0.38    0.38    0.38 
## 
## $center
## numeric(0)
## 
## $case
## numeric(0)
## 
## $judg
##     cite conflict 
##     0.57     0.57 
## 
## $activist
##     mother        rev      civil    alabama   american blackblack       wide 
##       0.61       0.61       0.40       0.35       0.35       0.35       0.35 
##   challeng 
##       0.35 
## 
## $die
##     mother        rev    alabama      crash  snowmobil   stockton       taho 
##       0.71       0.71       0.41       0.41       0.41       0.41       0.41 
## exgovernor  venezuela       hand 
##       0.41       0.41       0.41 
## 
## $step
## temporarili     embattl        asid      enough 
##        0.75        0.65        0.65        0.38 
## 
## $aid
## react 
##  0.53 
## 
## $angst
## numeric(0)
## 
## $media
## policelik 
##       0.4 
## 
## $social
## galvan 
##   0.41 
## 
## $hoodi
##    mani geraldo 
##    0.35    0.35 
## 
## $photo
## onlin 
##  0.38 
## 
## $show
## tweet typic onlin 
##  0.47  0.47  0.38 
## 
## $new
## gunman 
##   0.36 
## 
## $prosecutor
## numeric(0)
## 
## $set
##   encamp  oakland   occupi     park     furi maryland 
##     0.45     0.45     0.45     0.45     0.45     0.45 
## 
## $offici
## come 
## 0.57 
## 
## $histori
## tension 
##    0.89 
## 
## $racial
##   tension      slur    profil affidavit 
##      0.63      0.47      0.44      0.44 
## 
## $look
##    like  extens     yet rebound forward 
##    0.50    0.50    0.50    0.35    0.35 
## 
## $obama
##  like react owner 
##  0.47  0.47  0.38 
## 
## $comment
## geraldo   sorri 
##    0.52    0.45 
## 
## $school
##   continu      high miamiarea      dade    spread  approach      pant   princip 
##      0.45      0.45      0.45      0.45      0.45      0.45      0.45      0.45 
##     saggi     steve   struggl  tennesse       tri     urkel      dash      grad 
##      0.45      0.45      0.45      0.45      0.45      0.45      0.45      0.45 
##     bulli     south 
##      0.45      0.45 
## 
## $fox
##  geraldo    sorri      ben     movi  stiller  trailer judgment     rush 
##     0.61     0.53     0.35     0.35     0.35     0.35     0.35     0.35 
## 
## $rivera
## geraldo   sorri 
##    0.71    0.61 
## 
## $role
## policelik 
##      0.63 
## 
## $fight
## never 
##  0.47 
## 
## $speak
## fear 
## 0.57 
## 
## $wade
##  nephew   wound chicago   dwyan respond   heart   heavi 
##    0.50    0.50    0.40    0.35    0.35    0.35    0.35 
## 
## $question
## guid quot 
## 0.63 0.63 
## 
## $defens
##   fund   real websit 
##   0.47   0.47   0.38 
## 
## $race
## complic  matter 
##     0.4     0.4 
## 
## $heat
##  piston  athlet     win     dad   thank   dwyan    dade  spread  fourth  messag 
##    0.50    0.50    0.40    0.40    0.40    0.35    0.35    0.35    0.35    0.35 
##    send     nba villain  closur 
##    0.35    0.35    0.35    0.35 
## 
## $support
## fear 
## 0.52 
## 
## $hous
## chastis    dade  spread    care conting  health 
##    0.67    0.45    0.45    0.45    0.45    0.45 
## 
## $join
## numeric(0)
## 
## $use
##         slur    affidavit     bootcamp     playbook        press animalwelfar 
##         0.67         0.63         0.45         0.45         0.45         0.45 
##     grapevin         lamb         lion         live      pastor’       sermon 
##         0.45         0.45         0.45         0.45         0.45         0.45 
## 
## $man
##       accus     disrupt      servic  shotguntot       crash   snowmobil 
##        0.41        0.41        0.41        0.41        0.41        0.41 
##    stockton        taho      manson paternovill        sign       theft 
##        0.41        0.41        0.41        0.41        0.41        0.41 
## 
## $argument
## numeric(0)
## 
## $make
## numeric(0)
## 
## $skittl
##   artist    creat portrait 
##     0.47     0.47     0.47 
## 
## $bring
##   evid closur 
##   0.41   0.41 
## 
## $charg
## come 
##  0.4 
## 
## $hate
##       evid photograph      pursu     speech 
##       0.41       0.41       0.41       0.41 
## 
## $church
##       mani    amplifi    disrupt     servic shotguntot        bia        lds 
##       0.43       0.38       0.38       0.38       0.38       0.38       0.38 
##      blain     christ midwestern       name     pastor       unit    plagiar 
##       0.38       0.38       0.38       0.38       0.38       0.38       0.38 
##    possibl     rememb 
##       0.38       0.37 
## 
## $wear
## chastis  rememb    mani congreg  tribut 
##    0.70    0.53    0.40    0.35    0.35 
## 
## $earli
##  class  learn   rise   film   pull colleg  offer 
##   0.76   0.76   0.76   0.56   0.56   0.43   0.37 
## 
## $trial
## postpon   begin 
##    0.52    0.42 
## 
## $anthoni
## craven 
##   0.41 
## 
## $tulsa
##  rampag  craven  reveng penalti 
##    0.75    0.38    0.38    0.38 
## 
## $lawmak
## chastis  tribut   domin  explor     gov    rick  scottx 
##    0.75    0.38    0.38    0.38    0.38    0.38    0.38 
## 
## $georg
## numeric(0)
## 
## $video
##   gunman    doubt    stori  handcuf    night  surveil   bloodi handcuff 
##     0.65     0.56     0.56     0.53     0.38     0.38     0.38     0.38 
##      add 
##     0.38 
## 
## $zimmerman
## numeric(0)
## 
## $brand
##  inc 
## 0.66 
## 
## $forc
##  confus    told justifi     air  former   domin  explor     gov    rick  scottx 
##    0.65    0.65    0.38    0.38    0.38    0.38    0.38    0.38    0.38    0.38 
## 
## $address
## settl coupl 
##  0.71  0.41 
## 
## $apolog
##   excerpt testimoni 
##       0.5       0.5 
## 
## $lee
## settl coupl 
##  0.71  0.41 
## 
## $retweet
## settl coupl 
##  0.71  0.41 
## 
## $spike
## settl coupl 
##  0.71  0.41 
## 
## $wrong
## settl 
##  0.51 
## 
## $contact
##   worker judgment     rush 
##     0.41     0.41     0.41 
## 
## $rais
##  gunman   doubt   stori   first    full    mack quarter 
##    0.71    0.61    0.61    0.41    0.41    0.41    0.41 
## 
## $known
## victim 
##    0.5 
## 
## $decept
## numeric(0)
## 
## $may
##     opinion       shape      reveng seconddegre 
##        0.35        0.35        0.35        0.35 
## 
## $old
## opinion   shape  manson content    safe    solv 
##    0.35    0.35    0.35    0.35    0.35    0.35 
## 
## $get
##    attent       men  landlord   sentenc    tenant disappear 
##      0.53      0.43      0.38      0.38      0.38      0.37 
## 
## $gun
## owner 
##  0.39 
## 
## $key
##  woo guid quot 
## 0.66 0.47 0.47 
## 
## $town
##    crisi mismanag    small    brace     badg     lose  content     safe 
##     0.35     0.35     0.35     0.35     0.35     0.35     0.35     0.35 
##     solv     meet 
##     0.35     0.35 
## 
## $tough
## numeric(0)
## 
## $take
## policelik       bia       lds     canxt    herald    reader  backdrop      blow 
##      0.53      0.38      0.38      0.38      0.38      0.38      0.38      0.38 
##      imag  sanfordx     bulli     south 
##      0.38      0.38      0.38      0.38 
## 
## $defend
##    air former  bench    opt 
##   0.45   0.45   0.45   0.45 
## 
## $romney
##        woo        bid   gunright presidenti 
##       0.60       0.52       0.52       0.52 
## 
## $review
## thorough      vow    ideal 
##     0.71     0.61     0.41 
## 
## $event
##   woo  lead organ 
##  0.82  0.41  0.41 
## 
## $murder
## congresswoman     frederica      trayvonx        wilson   seconddegre 
##          0.38          0.38          0.38          0.38          0.38 
##       brought         crowd         weigh 
##          0.38          0.38          0.38 
## 
## $task
## confus   told  domin explor    gov   rick scottx 
##   0.77   0.77   0.45   0.45   0.45   0.45   0.45 
## 
## $nra
##  woo 
## 0.55 
## 
## $fire
##      nbc   produc    sourc  teacher     edit     tape    organ fundrais 
##     0.77     0.77     0.63     0.63     0.45     0.45     0.45     0.45 
##     mich 
##     0.45 
## 
## $news
## guid quot edit tape  edt open 
## 0.63 0.63 0.45 0.45 0.45 0.45 
## 
## $court
##        bid   gunright presidenti 
##        0.5        0.5        0.5 
## 
## $grand
## numeric(0)
## 
## $juri
## numeric(0)
## 
## $withdraw
## zimmerman’ 
##       0.45 
## 
## $resid
##   shock    burn penalti   along  engulf   flame   trail forward 
##    0.82    0.71    0.41    0.41    0.41    0.41    0.41    0.41 
## 
## $advoc
##       victim        inmat          row        swing animalwelfar     grapevin 
##         0.61         0.58         0.58         0.58         0.41         0.41 
##         lamb         lion         live      pastor’       sermon         keep 
##         0.41         0.41         0.41         0.41         0.41         0.40 
## 
## $hanniti
## judgment     rush 
##     0.45     0.45 
## 
## $face
##       hurdl paternovill        sign       theft     british      racism 
##        0.63        0.45        0.45        0.45        0.45        0.45 
## 
## $legal
##    plight      data       edg enterpris   unclear 
##      0.35      0.35      0.35      0.35      0.35 
## 
## $casey
## numeric(0)
## 
## $food
##   drink koolaid  twinki 
##    0.41    0.41    0.41 
## 
## $tragedi
## numeric(0)
## 
## $give
##    extens       yet      data       edg enterpris   unclear 
##      0.50      0.50      0.35      0.35      0.35      0.35 
## 
## $conserv
##     woo protect  common 
##    0.82    0.41    0.41 
## 
## $bail
##   atti   next   week  avoid  freed prepar 
##   0.41   0.41   0.41   0.41   0.41   0.41 
## 
## $chanc
## numeric(0)
## 
## $extra
## numeric(0)
## 
## $sensation
## numeric(0)
## 
## $cosbi
## numeric(0)
## 
## $file
##  advocaci complaint      seal      alec      open     claim  pasadena    common 
##      0.53      0.53      0.53      0.43      0.38      0.38      0.38      0.38 
##   schedul 
##      0.38 
## 
## $ask
##     cite conflict 
##     0.44     0.44 
## 
## $releas
##    await      eye    delay document     rape    locat 
##     0.50     0.50     0.40     0.40     0.35     0.35 
## 
## $legisl
##     amid backlash    focus     away   common 
##     0.89     0.89     0.89     0.45     0.45 
## 
## $jail
##         await           eye leavesflorida          fade           now 
##          0.58          0.58          0.41          0.41          0.41 
##         sight 
##          0.41
## [1]  0.00 -0.75 -0.75 -0.75 -0.75 -0.75
##    Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
## -2.9500 -0.8000 -0.2500 -0.3506  0.0000  1.7500
## [1]  0 -1 -1 -1 -1 -1
##    Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
## -3.0000 -1.0000  0.0000 -0.3299  0.0000  3.0000
## [1]  0 -2 -2 -2 -2 -2
##    Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
## -7.0000 -2.0000  0.0000 -0.7868  0.0000  5.0000
##      [,1] [,2] [,3] [,4] [,5] [,6]
## [1,]    0   -1   -1   -1   -1   -1
## [2,]    0   -1   -1   -1   -1   -1
## [3,]    0   -1   -1   -1   -1   -1
##    anger anticipation disgust fear joy sadness surprise trust negative positive
## 1      0            0       0    0   0       0        0     1        0        1
## 2      1            1       1    1   0       1        1     0        1        0
## 3      1            1       1    1   0       1        1     0        1        0
## 4      1            1       1    1   0       1        1     0        1        0
## 5      1            1       1    1   0       1        1     0        1        0
## 6      1            1       1    1   0       1        1     0        1        0
## 7      2            2       0    2   0       0        1     0        2        1
## 8      0            3       0    1   0       0        0     1        1        1
## 9      3            1       1    3   0       1        1     1        2        1
## 10     1            0       0    1   0       1        0     0        1        0