# Text sentiment analysis
# ---- Corpus clean-up before term counting and sentiment scoring ----
# `TextDoc` is expected to be a tm corpus built before this point (its
# construction is not shown here -- confirm against the loading code).
# Every step overwrites `TextDoc` with the transformed corpus, so the
# order of the steps matters.

# Replace "/", "@" and "|" with a space, so the words they join are split
# apart rather than fused together when punctuation is stripped later on.
toSpace <- content_transformer(function(x, pattern) gsub(pattern, " ", x))
TextDoc <- tm_map(TextDoc, toSpace, "/")
TextDoc <- tm_map(TextDoc, toSpace, "@")
# "|" is the regex alternation operator, hence the escape.
TextDoc <- tm_map(TextDoc, toSpace, "\\|")

# Convert the text to lower case. tolower() is a plain character function,
# so it is wrapped with content_transformer() for use in tm_map().
TextDoc <- tm_map(TextDoc, content_transformer(tolower))

# Remove numbers
TextDoc <- tm_map(TextDoc, removeNumbers)

# Remove common English stopwords. This runs before punctuation removal so
# that apostrophes are still in place when the stopword list is matched.
TextDoc <- tm_map(TextDoc, removeWords, stopwords("english"))

# Remove project-specific stopwords, given as a character vector.
TextDoc <- tm_map(TextDoc, removeWords, c("s", "company", "team"))

# Remove punctuation.
# The default pass strips only the ASCII [[:punct:]] class, which leaves
# typographic marks such as the curly apostrophe in place; tokens like
# "zimmerman’" or "pastor’" then end up as separate terms. The second pass
# (ucp = TRUE) also removes every character in Unicode category P. Both
# passes are kept because category P alone does not cover ASCII symbols
# such as "$", "+" or "~".
TextDoc <- tm_map(TextDoc, removePunctuation)
TextDoc <- tm_map(TextDoc, removePunctuation, ucp = TRUE)

# Collapse runs of whitespace left behind by the removals above.
TextDoc <- tm_map(TextDoc, stripWhitespace)

# Text stemming - reduces words to their root form (e.g. "police" -> "polic").
TextDoc <- tm_map(TextDoc, stemDocument)
## word freq
## martin martin 154
## trayvon trayvon 150
## shoot shoot 107
## case case 102
## fla fla 100
## zimmerman zimmerman 76
## teen teen 70
## death death 52
## florida florida 38
## watch watch 32
## law law 29
## shooter shooter 28
## polic polic 25
## charg charg 24
## neighborhood neighborhood 23
## attorney attorney 23
## hoodi hoodi 23
## ralli ralli 22
## new new 22
## prosecutor prosecutor 22
## say say 21
## arrest arrest 20
## ground ground 19
## stand stand 19
## gun gun 19
## kill kill 18
## group group 17
## miami miami 16
## shot shot 16
## famili famili 15
## black black 14
## want want 13
## chief chief 13
## sanford sanford 13
## protest protest 13
## lawyer lawyer 13
## make make 13
## nra nra 13
## call call 12
## turn turn 12
## justic justic 12
## judg judg 12
## media media 12
## offici offici 12
## race race 12
## apolog apolog 12
## court court 12
## answer answer 11
## march march 11
## comment comment 11
## support support 11
## trial trial 11
## romney romney 11
## student student 10
## dead dead 10
## racial racial 10
## georg georg 10
## leader leader 9
## parent parent 9
## slain slain 9
## nyc nyc 9
## right right 9
## center center 9
## photo photo 9
## show show 9
## obama obama 9
## fight fight 9
## speak speak 9
## defens defens 9
## skittl skittl 9
## brand brand 9
## known known 9
## key key 9
## captain captain 8
## hear hear 8
## appear appear 8
## citi citi 8
## teenag teenag 8
## activist activist 8
## look look 8
## fox fox 8
## wade wade 8
## heat heat 8
## wear wear 8
## may may 8
## old old 8
## town town 8
## legal legal 8
## give give 8
## releas releas 8
## son son 7
## good good 7
## vigilant vigilant 7
## expert expert 7
## step step 7
## aid aid 7
## church church 7
## tulsa tulsa 7
## lawmak lawmak 7
## video video 7
## forc forc 7
## get get 7
## take take 7
## murder murder 7
## grand grand 7
## juri juri 7
## file file 7
## sought sought 6
## investig investig 6
## sharpton sharpton 6
## selfdefens selfdefens 6
## probe probe 6
## neighbor neighbor 6
## nation nation 6
## hundr hundr 6
## die die 6
## social social 6
## rivera rivera 6
## join join 6
## man man 6
## argument argument 6
## bring bring 6
## hate hate 6
## anthoni anthoni 6
## address address 6
## lee lee 6
## retweet retweet 6
## spike spike 6
## contact contact 6
## rais rais 6
## review review 6
## event event 6
## resid resid 6
## advoc advoc 6
## food food 6
## conserv conserv 6
## bail bail 6
## cosbi cosbi 6
## jail jail 6
## crime crime 5
## fatal fatal 5
## fed fed 5
## white white 5
## angst angst 5
## set set 5
## histori histori 5
## school school 5
## role role 5
## question question 5
## hous hous 5


## $answer
## suburb
## 0.42
##
## $death
## numeric(0)
##
## $famili
## info leak countri home identifi
## 0.36 0.36 0.36 0.36 0.36
##
## $teen
## numeric(0)
##
## $want
## background
## 0.39
##
## $fla
## numeric(0)
##
## $sought
## suburb postpon independ venu
## 0.58 0.47 0.41 0.41
##
## $captain
## client
## 0.5
##
## $crime
## baltimor local tie can citizen sevag tateosian
## 0.45 0.45 0.45 0.45 0.45 0.45 0.45
## evid american blackblack wide
## 0.45 0.45 0.45 0.45
##
## $kill
## shock burn
## 0.47 0.40
##
## $shoot
## numeric(0)
##
## $watch
## numeric(0)
##
## $call
## horribl sourc
## 0.4 0.4
##
## $neighborhood
## volunt pull arm postpon
## 0.41 0.41 0.35 0.35
##
## $attorney
## numeric(0)
##
## $chief
## temporarili embattl
## 0.55 0.48
##
## $miami
## gather thousand
## 0.43 0.37
##
## $sanford
## threaten
## 0.39
##
## $turn
## inc amid backlash focus
## 0.57 0.57 0.57 0.57
##
## $arrest
## numeric(0)
##
## $group
## advocaci complaint common woo amid backlash focus
## 0.48 0.48 0.46 0.45 0.45 0.45 0.45
## alec bid gunright presidenti
## 0.39 0.39 0.39 0.39
##
## $leader
## baptist pressur
## 0.50 0.38
##
## $black
## tension code male
## 0.53 0.46 0.46
##
## $investig
## fbi depart provok independ
## 0.41 0.41 0.41 0.41
##
## $parent
## react eager
## 0.47 0.47
##
## $slain
## friend never
## 0.50 0.47
##
## $martin
## numeric(0)
##
## $shooter
## numeric(0)
##
## $trayvon
## numeric(0)
##
## $ralli
## hold naacp gather
## 0.42 0.42 0.36
##
## $sharpton
## mother rev alabama headlin
## 0.71 0.71 0.41 0.41
##
## $shot
## numeric(0)
##
## $student
## numeric(0)
##
## $law
## numeric(0)
##
## $selfdefens
## bush jeb hamper secret wit spur statut cover
## 0.47 0.47 0.41 0.41 0.41 0.41 0.41 0.40
##
## $protest
## numeric(0)
##
## $fatal
## depart atlanta
## 0.45 0.45
##
## $fed
## numeric(0)
##
## $florida
## numeric(0)
##
## $justic
## numeric(0)
##
## $say
## accid mom
## 0.37 0.37
##
## $ground
## confus told
## 0.39 0.39
##
## $hear
## extens yet seal senat heart heavi atti next week schedul
## 0.50 0.50 0.50 0.35 0.35 0.35 0.35 0.35 0.35 0.35
##
## $stand
## confus told
## 0.39 0.39
##
## $lawyer
## numeric(0)
##
## $probe
## alleg plagiar possibl laugh newsbreak sheriff
## 0.41 0.41 0.41 0.41 0.41 0.41
##
## $son
## code male like word hand
## 0.65 0.65 0.53 0.38 0.38
##
## $white
## word dade spread care conting health peopl
## 0.45 0.45 0.45 0.45 0.45 0.45 0.45
##
## $appear
## numeric(0)
##
## $dead
## numeric(0)
##
## $march
## numeric(0)
##
## $nyc
## mother rev
## 0.57 0.57
##
## $right
## civil pressur owner
## 0.57 0.38 0.38
##
## $good
## morn buffalo
## 0.43 0.43
##
## $neighbor
## bandag nose saw swollen
## 0.41 0.41 0.41 0.41
##
## $vigilant
## cleaver end missouri rep mike tyson
## 0.38 0.38 0.38 0.38 0.38 0.38
##
## $nation
## brief world licens took galvan studi deepwat
## 0.58 0.58 0.41 0.41 0.41 0.41 0.41
## horizon rookeri spill comparison hitler vandal martinx
## 0.41 0.41 0.41 0.41 0.41 0.41 0.40
##
## $citi
## tension slam carol ethic longview return
## 0.70 0.35 0.35 0.35 0.35 0.35
##
## $polic
## temporarili
## 0.39
##
## $hundr
## numeric(0)
##
## $teenag
## horribl oklahoman hand
## 0.50 0.35 0.35
##
## $expert
## arm opinion shape cri forens lay low talk plight
## 0.65 0.38 0.38 0.38 0.38 0.38 0.38 0.38 0.38
##
## $center
## numeric(0)
##
## $case
## numeric(0)
##
## $judg
## cite conflict
## 0.57 0.57
##
## $activist
## mother rev civil alabama american blackblack wide
## 0.61 0.61 0.40 0.35 0.35 0.35 0.35
## challeng
## 0.35
##
## $die
## mother rev alabama crash snowmobil stockton taho
## 0.71 0.71 0.41 0.41 0.41 0.41 0.41
## exgovernor venezuela hand
## 0.41 0.41 0.41
##
## $step
## temporarili embattl asid enough
## 0.75 0.65 0.65 0.38
##
## $aid
## react
## 0.53
##
## $angst
## numeric(0)
##
## $media
## policelik
## 0.4
##
## $social
## galvan
## 0.41
##
## $hoodi
## mani geraldo
## 0.35 0.35
##
## $photo
## onlin
## 0.38
##
## $show
## tweet typic onlin
## 0.47 0.47 0.38
##
## $new
## gunman
## 0.36
##
## $prosecutor
## numeric(0)
##
## $set
## encamp oakland occupi park furi maryland
## 0.45 0.45 0.45 0.45 0.45 0.45
##
## $offici
## come
## 0.57
##
## $histori
## tension
## 0.89
##
## $racial
## tension slur profil affidavit
## 0.63 0.47 0.44 0.44
##
## $look
## like extens yet rebound forward
## 0.50 0.50 0.50 0.35 0.35
##
## $obama
## like react owner
## 0.47 0.47 0.38
##
## $comment
## geraldo sorri
## 0.52 0.45
##
## $school
## continu high miamiarea dade spread approach pant princip
## 0.45 0.45 0.45 0.45 0.45 0.45 0.45 0.45
## saggi steve struggl tennesse tri urkel dash grad
## 0.45 0.45 0.45 0.45 0.45 0.45 0.45 0.45
## bulli south
## 0.45 0.45
##
## $fox
## geraldo sorri ben movi stiller trailer judgment rush
## 0.61 0.53 0.35 0.35 0.35 0.35 0.35 0.35
##
## $rivera
## geraldo sorri
## 0.71 0.61
##
## $role
## policelik
## 0.63
##
## $fight
## never
## 0.47
##
## $speak
## fear
## 0.57
##
## $wade
## nephew wound chicago dwyan respond heart heavi
## 0.50 0.50 0.40 0.35 0.35 0.35 0.35
##
## $question
## guid quot
## 0.63 0.63
##
## $defens
## fund real websit
## 0.47 0.47 0.38
##
## $race
## complic matter
## 0.4 0.4
##
## $heat
## piston athlet win dad thank dwyan dade spread fourth messag
## 0.50 0.50 0.40 0.40 0.40 0.35 0.35 0.35 0.35 0.35
## send nba villain closur
## 0.35 0.35 0.35 0.35
##
## $support
## fear
## 0.52
##
## $hous
## chastis dade spread care conting health
## 0.67 0.45 0.45 0.45 0.45 0.45
##
## $join
## numeric(0)
##
## $use
## slur affidavit bootcamp playbook press animalwelfar
## 0.67 0.63 0.45 0.45 0.45 0.45
## grapevin lamb lion live pastor’ sermon
## 0.45 0.45 0.45 0.45 0.45 0.45
##
## $man
## accus disrupt servic shotguntot crash snowmobil
## 0.41 0.41 0.41 0.41 0.41 0.41
## stockton taho manson paternovill sign theft
## 0.41 0.41 0.41 0.41 0.41 0.41
##
## $argument
## numeric(0)
##
## $make
## numeric(0)
##
## $skittl
## artist creat portrait
## 0.47 0.47 0.47
##
## $bring
## evid closur
## 0.41 0.41
##
## $charg
## come
## 0.4
##
## $hate
## evid photograph pursu speech
## 0.41 0.41 0.41 0.41
##
## $church
## mani amplifi disrupt servic shotguntot bia lds
## 0.43 0.38 0.38 0.38 0.38 0.38 0.38
## blain christ midwestern name pastor unit plagiar
## 0.38 0.38 0.38 0.38 0.38 0.38 0.38
## possibl rememb
## 0.38 0.37
##
## $wear
## chastis rememb mani congreg tribut
## 0.70 0.53 0.40 0.35 0.35
##
## $earli
## class learn rise film pull colleg offer
## 0.76 0.76 0.76 0.56 0.56 0.43 0.37
##
## $trial
## postpon begin
## 0.52 0.42
##
## $anthoni
## craven
## 0.41
##
## $tulsa
## rampag craven reveng penalti
## 0.75 0.38 0.38 0.38
##
## $lawmak
## chastis tribut domin explor gov rick scottx
## 0.75 0.38 0.38 0.38 0.38 0.38 0.38
##
## $georg
## numeric(0)
##
## $video
## gunman doubt stori handcuf night surveil bloodi handcuff
## 0.65 0.56 0.56 0.53 0.38 0.38 0.38 0.38
## add
## 0.38
##
## $zimmerman
## numeric(0)
##
## $brand
## inc
## 0.66
##
## $forc
## confus told justifi air former domin explor gov rick scottx
## 0.65 0.65 0.38 0.38 0.38 0.38 0.38 0.38 0.38 0.38
##
## $address
## settl coupl
## 0.71 0.41
##
## $apolog
## excerpt testimoni
## 0.5 0.5
##
## $lee
## settl coupl
## 0.71 0.41
##
## $retweet
## settl coupl
## 0.71 0.41
##
## $spike
## settl coupl
## 0.71 0.41
##
## $wrong
## settl
## 0.51
##
## $contact
## worker judgment rush
## 0.41 0.41 0.41
##
## $rais
## gunman doubt stori first full mack quarter
## 0.71 0.61 0.61 0.41 0.41 0.41 0.41
##
## $known
## victim
## 0.5
##
## $decept
## numeric(0)
##
## $may
## opinion shape reveng seconddegre
## 0.35 0.35 0.35 0.35
##
## $old
## opinion shape manson content safe solv
## 0.35 0.35 0.35 0.35 0.35 0.35
##
## $get
## attent men landlord sentenc tenant disappear
## 0.53 0.43 0.38 0.38 0.38 0.37
##
## $gun
## owner
## 0.39
##
## $key
## woo guid quot
## 0.66 0.47 0.47
##
## $town
## crisi mismanag small brace badg lose content safe
## 0.35 0.35 0.35 0.35 0.35 0.35 0.35 0.35
## solv meet
## 0.35 0.35
##
## $tough
## numeric(0)
##
## $take
## policelik bia lds canxt herald reader backdrop blow
## 0.53 0.38 0.38 0.38 0.38 0.38 0.38 0.38
## imag sanfordx bulli south
## 0.38 0.38 0.38 0.38
##
## $defend
## air former bench opt
## 0.45 0.45 0.45 0.45
##
## $romney
## woo bid gunright presidenti
## 0.60 0.52 0.52 0.52
##
## $review
## thorough vow ideal
## 0.71 0.61 0.41
##
## $event
## woo lead organ
## 0.82 0.41 0.41
##
## $murder
## congresswoman frederica trayvonx wilson seconddegre
## 0.38 0.38 0.38 0.38 0.38
## brought crowd weigh
## 0.38 0.38 0.38
##
## $task
## confus told domin explor gov rick scottx
## 0.77 0.77 0.45 0.45 0.45 0.45 0.45
##
## $nra
## woo
## 0.55
##
## $fire
## nbc produc sourc teacher edit tape organ fundrais
## 0.77 0.77 0.63 0.63 0.45 0.45 0.45 0.45
## mich
## 0.45
##
## $news
## guid quot edit tape edt open
## 0.63 0.63 0.45 0.45 0.45 0.45
##
## $court
## bid gunright presidenti
## 0.5 0.5 0.5
##
## $grand
## numeric(0)
##
## $juri
## numeric(0)
##
## $withdraw
## zimmerman’
## 0.45
##
## $resid
## shock burn penalti along engulf flame trail forward
## 0.82 0.71 0.41 0.41 0.41 0.41 0.41 0.41
##
## $advoc
## victim inmat row swing animalwelfar grapevin
## 0.61 0.58 0.58 0.58 0.41 0.41
## lamb lion live pastor’ sermon keep
## 0.41 0.41 0.41 0.41 0.41 0.40
##
## $hanniti
## judgment rush
## 0.45 0.45
##
## $face
## hurdl paternovill sign theft british racism
## 0.63 0.45 0.45 0.45 0.45 0.45
##
## $legal
## plight data edg enterpris unclear
## 0.35 0.35 0.35 0.35 0.35
##
## $casey
## numeric(0)
##
## $food
## drink koolaid twinki
## 0.41 0.41 0.41
##
## $tragedi
## numeric(0)
##
## $give
## extens yet data edg enterpris unclear
## 0.50 0.50 0.35 0.35 0.35 0.35
##
## $conserv
## woo protect common
## 0.82 0.41 0.41
##
## $bail
## atti next week avoid freed prepar
## 0.41 0.41 0.41 0.41 0.41 0.41
##
## $chanc
## numeric(0)
##
## $extra
## numeric(0)
##
## $sensation
## numeric(0)
##
## $cosbi
## numeric(0)
##
## $file
## advocaci complaint seal alec open claim pasadena common
## 0.53 0.53 0.53 0.43 0.38 0.38 0.38 0.38
## schedul
## 0.38
##
## $ask
## cite conflict
## 0.44 0.44
##
## $releas
## await eye delay document rape locat
## 0.50 0.50 0.40 0.40 0.35 0.35
##
## $legisl
## amid backlash focus away common
## 0.89 0.89 0.89 0.45 0.45
##
## $jail
## await eye leavesflorida fade now
## 0.58 0.58 0.41 0.41 0.41
## sight
## 0.41
## [1] 0.00 -0.75 -0.75 -0.75 -0.75 -0.75
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## -2.9500 -0.8000 -0.2500 -0.3506 0.0000 1.7500
## [1] 0 -1 -1 -1 -1 -1
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## -3.0000 -1.0000 0.0000 -0.3299 0.0000 3.0000
## [1] 0 -2 -2 -2 -2 -2
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## -7.0000 -2.0000 0.0000 -0.7868 0.0000 5.0000
## [,1] [,2] [,3] [,4] [,5] [,6]
## [1,] 0 -1 -1 -1 -1 -1
## [2,] 0 -1 -1 -1 -1 -1
## [3,] 0 -1 -1 -1 -1 -1
## anger anticipation disgust fear joy sadness surprise trust negative positive
## 1 0 0 0 0 0 0 0 1 0 1
## 2 1 1 1 1 0 1 1 0 1 0
## 3 1 1 1 1 0 1 1 0 1 0
## 4 1 1 1 1 0 1 1 0 1 0
## 5 1 1 1 1 0 1 1 0 1 0
## 6 1 1 1 1 0 1 1 0 1 0
## 7 2 2 0 2 0 0 1 0 2 1
## 8 0 3 0 1 0 0 0 1 1 1
## 9 3 1 1 3 0 1 1 1 2 1
## 10 1 0 0 1 0 1 0 0 1 0

