Extract the clinical trails performed on Hepatocellular Carcinoma

patients on the outcome events to perform word cloud and sentimental

analysis to predict the outcome of the results.

library(rvest)
## Warning: package 'rvest' was built under R version 3.5.1
## Loading required package: xml2
## Warning: package 'xml2' was built under R version 3.5.1
library(XML)
## Warning: package 'XML' was built under R version 3.5.1
## 
## Attaching package: 'XML'
## The following object is masked from 'package:rvest':
## 
##     xml
library(magrittr)
## Warning: package 'magrittr' was built under R version 3.5.1
library(tm)
## Warning: package 'tm' was built under R version 3.5.1
## Loading required package: NLP
## Warning: package 'NLP' was built under R version 3.5.1
library(wordcloud)
## Warning: package 'wordcloud' was built under R version 3.5.1
## Loading required package: RColorBrewer
library(wordcloud2)
library(syuzhet)
## Warning: package 'syuzhet' was built under R version 3.5.1
library(lubridate)
## Warning: package 'lubridate' was built under R version 3.5.1
## 
## Attaching package: 'lubridate'
## The following object is masked from 'package:base':
## 
##     date
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 3.5.1
## 
## Attaching package: 'ggplot2'
## The following object is masked from 'package:NLP':
## 
##     annotate
library(scales)
## Warning: package 'scales' was built under R version 3.5.1
## 
## Attaching package: 'scales'
## The following object is masked from 'package:syuzhet':
## 
##     rescale
library(reshape2)
library(dplyr)
## Warning: package 'dplyr' was built under R version 3.5.1
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:lubridate':
## 
##     intersect, setdiff, union
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(rclinicaltrials)
library(devtools)
## Warning: package 'devtools' was built under R version 3.5.1
## Warning: package 'usethis' was built under R version 3.5.1
# install.packages('devtools')
# devtools::install_github("lchiffon/wordcloud2")
# install_github("sachsmc/rclinicaltrials")


# ClinicalTrailReviews #############################

# HCC_Info <- clinicaltrials_download(query = c("cond=Hepatocellular Carcinoma", "phase=2","type=Intr", "rslt=With"),                                                count = 1e6, include_results = TRUE)
# summary(HCC_Info$study_information$interventions)
z <- clinicaltrials_download(query = 'Hepatocellular Carcinoma', count = 10, include_results = TRUE)
str(z)
## List of 2
##  $ study_information:List of 6
##   ..$ study_info   :'data.frame':    10 obs. of  43 variables:
##   .. ..$ org_study_id                        : chr [1:10] "URL" "HSL 2016-83" "SCheng" "2017-A01885-48" ...
##   .. ..$ nct_id                              : chr [1:10] "NCT03338166" "NCT03448757" "NCT02399033" "NCT03311152" ...
##   .. ..$ brief_title                         : chr [1:10] "Role of LDH as a Predictor of Treatment Outcomes in Hepatocellular Carcinoma" "Determination of Autonomic Responses to the Exposure of Low Energy Electromagnetic Fields With Frequency Modula"| __truncated__ "Xihuang Capsules Prevention of Recurrence in Patients With Hepatocellular Carcinoma After Hepatectomy" "Circulating Cell-free DNA-based Epigenetic Biomarker mSEPT9 for Hepatocellular Carcinoma Detection in Cirrhosis" ...
##   .. ..$ official_title                      : chr [1:10] "Role of LDH as a Predictor of Treatment Outcomes in Hepatocellular Carcinoma" "Determination of Autonomic Responses to the Exposure of Low Energy Electromagnetic Fields With Frequency Modula"| __truncated__ "Xihuang Capsules Prevention of Recurrence in Patients With Hepatocellular Carcinoma After Hepatectomy: A Multic"| __truncated__ "Diagnostic Accuracy of the Circulating Cell-free DNA-based Epigenetic Biomarker mSEPT9 for Hepatocellular Carci"| __truncated__ ...
##   .. ..$ overall_status                      : chr [1:10] "Not yet recruiting" "Recruiting" "Recruiting" "Recruiting" ...
##   .. ..$ start_date.text                     : chr [1:10] "January 2, 2018" "February 15, 2018" NA "February 12, 2018" ...
##   .. ..$ start_date..attrs                   : chr [1:10] "Anticipated" "Actual" NA "Actual" ...
##   .. ..$ completion_date.text                : chr [1:10] "December 2018" "February 16, 2020" "December 2019" "February 12, 2022" ...
##   .. ..$ completion_date..attrs              : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
##   .. ..$ completion_date_type                : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
##   .. ..$ lead_sponsor/agency                 : chr [1:10] "Assiut University" "Hospital Sirio-Libanes" "Shuqun Cheng" "Central Hospital, Nancy, France" ...
##   .. ..$ overall_official.last_name          : chr [1:10] "Aml R Ibrahim, Lecturer" NA "Shuqun Cheng, Ph.D" "Abderrahim OUSSALAH, MD, PhD" ...
##   .. ..$ overall_official.role               : chr [1:10] "Principal Investigator" NA "Principal Investigator" "Principal Investigator" ...
##   .. ..$ overall_official.affiliation        : chr [1:10] "Assiut University" NA "Eastern Hepatobiliary Surgical Hospital" "University Hospital of Nancy, INSERM U954, Faculty of Medicine of Nancy, University of Lorraine" ...
##   .. ..$ study_type                          : chr [1:10] "Observational" "Interventional" "Interventional" "Interventional" ...
##   .. ..$ enrollment.text                     : chr [1:10] "50" "60" "1000" "440" ...
##   .. ..$ enrollment..attrs                   : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
##   .. ..$ primary_condition                   : chr [1:10] "Hepatocellular Carcinoma" "Hepatocellular Carcinoma" "Hepatocellular Carcinoma" "Hepatocellular Carcinoma; Cirrhosis" ...
##   .. ..$ primary_outcome.measure             : chr [1:10] "serum LDH level as a predictor of response in hepatocellular carcinoma" "non-invasive hemodynamic parameter measurements during exposure AM RF EMF" "Hepatocellular carcinoma recurrence rate in the three years after hepatectomy" "Presence of hepatocellular carcinoma." ...
##   .. ..$ primary_outcome.time_frame          : chr [1:10] "2 months" "90 min on day 1 and day 2" "in the three years after hepatectomy" "The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging w"| __truncated__ ...
##   .. ..$ primary_outcome.description         : chr [1:10] "To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of "| __truncated__ "Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofr"| __truncated__ "Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professio"| __truncated__ "The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the S"| __truncated__ ...
##   .. ..$ eligibility.sampling_method         : chr [1:10] "Probability Sample" NA NA NA ...
##   .. ..$ eligibility.textblock.1             : chr [1:10] "\n        Inclusion Criteria:\n\n          -  patients with Hepatocellular carcinoma diagnosed by biopsy or ima"| __truncated__ NA NA NA ...
##   .. ..$ eligibility.gender                  : chr [1:10] "All" "All" "All" "All" ...
##   .. ..$ eligibility.minimum_age             : chr [1:10] "18 Years" "18 Years" "20 Years" "18 Years" ...
##   .. ..$ eligibility.maximum_age             : chr [1:10] "65 Years" "80 Years" "70 Years" "N/A" ...
##   .. ..$ eligibility.healthy_volunteers      : chr [1:10] "No" "Accepts Healthy Volunteers" "No" "No" ...
##   .. ..$ sponsors.lead_sponsor.agency        : chr [1:10] "Assiut University" "Hospital Sirio-Libanes" "Shuqun Cheng" "Central Hospital, Nancy, France" ...
##   .. ..$ sponsors.lead_sponsor.agency_class  : chr [1:10] "Other" "Other" "Other" "Other" ...
##   .. ..$ date_disclaimer                     : chr [1:10] "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" ...
##   .. ..$ phase                               : chr [1:10] NA "N/A" "Phase 4" "N/A" ...
##   .. ..$ start_date                          : chr [1:10] NA NA "June 2014" NA ...
##   .. ..$ sponsors.collaborator.agency        : chr [1:10] NA NA NA "Institut National de la Santé Et de la Recherche Médicale, France" ...
##   .. ..$ sponsors.collaborator.agency_class  : chr [1:10] NA NA NA "Other" ...
##   .. ..$ sponsors.collaborator.agency.1      : chr [1:10] NA NA NA "Groupement Interrégional de Recherche Clinique et d'Innovation" ...
##   .. ..$ sponsors.collaborator.agency_class.1: chr [1:10] NA NA NA "Other" ...
##   .. ..$ sponsors.collaborator.agency.2      : chr [1:10] NA NA NA "Epigenomics, Inc" ...
##   .. ..$ sponsors.collaborator.agency_class.2: chr [1:10] NA NA NA "Industry" ...
##   .. ..$ primary_outcome.measure.1           : chr [1:10] NA NA NA NA ...
##   .. ..$ primary_outcome.time_frame.1        : chr [1:10] NA NA NA NA ...
##   .. ..$ overall_official.last_name.1        : chr [1:10] NA NA NA NA ...
##   .. ..$ overall_official.role.1             : chr [1:10] NA NA NA NA ...
##   .. ..$ overall_official.affiliation.1      : chr [1:10] NA NA NA NA ...
##   ..$ locations    :'data.frame':    10 obs. of  20 variables:
##   .. ..$ name                    : chr [1:10] "Hospital Sírio-Libanês" "Eastern Hepatobiliary Surgical Hospital" "University Hospital of Nancy (CHRU de Nancy)" "Hospital Sírio Libanês" ...
##   .. ..$ address.city            : chr [1:10] "São Paulo" "Shanghai" "Vandoeuvre-lès-Nancy" "São Paulo" ...
##   .. ..$ address.country         : chr [1:10] "Brazil" "China" "France" "Brazil" ...
##   .. ..$ status                  : chr [1:10] "Recruiting" "Recruiting" "Recruiting" NA ...
##   .. ..$ contact.last_name       : chr [1:10] "Tatiana Zanesco" "Shuqun Cheng, Ph.D" "Abderrahim OUSSALAH, MD, PhD" NA ...
##   .. ..$ contact.phone           : chr [1:10] "5511983539222" "021-65564166" "+33 (0)3 83 15 36 29" NA ...
##   .. ..$ contact.email           : chr [1:10] "tzanesco@hotmail.com" NA "a.oussalah@chru-nancy.fr" NA ...
##   .. ..$ nct_id                  : chr [1:10] "NCT03448757" "NCT02399033" "NCT03311152" "NCT01641276" ...
##   .. ..$ address.state           : chr [1:10] NA "Shanghai" NA NA ...
##   .. ..$ address.zip             : chr [1:10] NA "200438" "54511" "01308-050" ...
##   .. ..$ investigator.last_name  : chr [1:10] NA NA "Abderrahim OUSSALAH, MD, PhD" NA ...
##   .. ..$ investigator.role       : chr [1:10] NA NA "Principal Investigator" NA ...
##   .. ..$ investigator.last_name.1: chr [1:10] NA NA "Jean-Louis GUÉANT, MD,DSc,AGAF" NA ...
##   .. ..$ investigator.role.1     : chr [1:10] NA NA "Sub-Investigator" NA ...
##   .. ..$ investigator.last_name.2: chr [1:10] NA NA "Jean-Pierre BRONOWICKI, MD, PhD" NA ...
##   .. ..$ investigator.role.2     : chr [1:10] NA NA "Sub-Investigator" NA ...
##   .. ..$ investigator.last_name.3: chr [1:10] NA NA "Valérie LAURENT, MD, PhD" NA ...
##   .. ..$ investigator.role.3     : chr [1:10] NA NA "Sub-Investigator" NA ...
##   .. ..$ investigator.last_name.4: chr [1:10] NA NA "Ahmet AYAV, MD, PhD" NA ...
##   .. ..$ investigator.role.4     : chr [1:10] NA NA "Sub-Investigator" NA ...
##   ..$ arms         :'data.frame':    21 obs. of  4 variables:
##   .. ..$ arm_group_label: chr [1:21] "Group A" "Group B" "Group C" "Group D" ...
##   .. ..$ description    : chr [1:21] "Patients with Hepatocellular carcinoma who treated with sorafenib and measure LDH serum level one month pre and post treatment" "Patients with Hepatocellular carcinoma who treated with trans catheter arterial chemo embolization (TACE) and m"| __truncated__ "Patients with Hepatocellular carcinoma who treated surgically and measure LDH serum level one month pre and post treatment" "Patients with Hepatocellular carcinoma who don't receive treatment and asses LDH serum level for 3months" ...
##   .. ..$ nct_id         : chr [1:21] "NCT03338166" "NCT03338166" "NCT03338166" "NCT03338166" ...
##   .. ..$ arm_group_type : chr [1:21] NA NA NA NA ...
##   ..$ interventions:'data.frame':    11 obs. of  10 variables:
##   .. ..$ intervention_type: chr [1:11] "Other" "Other" "Drug" "Diagnostic Test" ...
##   .. ..$ intervention_name: chr [1:11] "LDH serum level" "measuring hemodynamic parameters heart beat to heart beat during single-frequency exposure" "Xihuang Capsules" "\"Epi proColon 2.0 CE\" test from Epigenomics, Inc (Berlin, Germany)" ...
##   .. ..$ description      : chr [1:11] "Blood sample to measure LDH as a predictor of Hepatocellular carcinoma treatment outcome" "This study aims to create a method for non-invasive diagnosis of biofeedback effect exposure to LEEF modulated "| __truncated__ "In two weeks after hepatectomy, Xihuang Capsules group received Xihuang Capsules (2 g, bid), Continuously takin"| __truncated__ "The mSEPT9 assay consists of DNA extraction from plasma, bisulfite conversion of DNA, purification of bis-DNA, "| __truncated__ ...
##   .. ..$ arm_group_label  : chr [1:11] "Group A" "Autonomic response" "Xihuang Capsules group" "HCC-free cirrhotic patients" ...
##   .. ..$ arm_group_label.1: chr [1:11] "Group B" NA NA "HCC-positive cirrhotic patients" ...
##   .. ..$ arm_group_label.2: chr [1:11] "Group C" NA NA NA ...
##   .. ..$ arm_group_label.3: chr [1:11] "Group D" NA NA NA ...
##   .. ..$ nct_id           : chr [1:11] "NCT03338166" "NCT03448757" "NCT02399033" "NCT03311152" ...
##   .. ..$ other_name       : chr [1:11] NA NA "Wangbang Pharmaceutical Xihuang Capsules" "Plasma mSEPT9 test" ...
##   .. ..$ other_name.1     : chr [1:11] NA NA NA NA ...
##   ..$ outcomes     :'data.frame':    37 obs. of  5 variables:
##   .. ..$ measure    : chr [1:37] "serum LDH level as a predictor of response in hepatocellular carcinoma" "non-invasive hemodynamic parameter measurements during exposure AM RF EMF" "Hemodynamic alteration´s comparison among advanced cancer patients and healthy controls" "Searching for cancer-specific frequency modulation" ...
##   .. ..$ time_frame : chr [1:37] "2 months" "90 min on day 1 and day 2" "120 min (single procedure)" "120 min (single procedure)" ...
##   .. ..$ description: chr [1:37] "To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of "| __truncated__ "Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofr"| __truncated__ "Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded i"| __truncated__ "Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency"| __truncated__ ...
##   .. ..$ type       : chr [1:37] "primary_outcome" "primary_outcome" "secondary_outcome" "other_outcome" ...
##   .. ..$ nct_id     : chr [1:37] "NCT03338166" "NCT03448757" "NCT03448757" "NCT03448757" ...
##   ..$ textblocks   : NULL
##  $ study_results    :List of 3
##   ..$ participant_flow: NULL
##   ..$ baseline_data   : NULL
##   ..$ outcome_data    : NULL
zstudyinfo <- z$study_information$study_info
zoutcomes <- z$study_information$outcomes
zinterventions <- z$study_information$interventions
zoutcomes <- as.character(zoutcomes)
zinterventions <- as.character(zinterventions)
zhcc <- rbind(zoutcomes,zinterventions)


setwd("C:/Users/Thiru/Desktop/Assignments In Progress/Text Mining/ClinicalTrialAnalysis")
write.table(zhcc,"zhcc.txt",row.names = F)
write.table(zinterventions,"inv.txt",row.names = F)
write.table(zoutcomes,"out.txt",row.names = F)

hcc <- read.delim('out.txt')
str(hcc)
## 'data.frame':    5 obs. of  1 variable:
##  $ x: Factor w/ 5 levels "c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, "| __truncated__,..: 4 1 5 3 2
View(hcc)

# Build Corpus and DTM/TDM
library(tm)
corpus <- hcc[-1,]
head(corpus)
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            
## [2] c(\\To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (AM RF EMF) in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program.\\, \n\\Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professional Committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to Guangzhou standard in 2001. Once new or suspected place nature lesions within liver were found by B-ultrasonography examination,we should do CT, MRI or PET-CT review, in order to confirm the diagnosis. If imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but AFP values> 400µg/L or ongoing elevated AFP values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nNA, \\RFS is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, NA, \\OS is defined as from date of randomization until the date of documented death from any cause.\\, \\Using Karnofsky-Performance-Status score:\\nEvaluation Methods: Comparison of symptom scores before and after the treatment.\\nMarkedly: increasing by more than 20 points after treatment compared to before treatment; Effective: increasing by more than 10 points after treatment compared to before treatment; Stable: increasing by less than 10 points or no change after treatment compared to before treatment; Invalid: decrease after treatment than before treatment.\\, \n\\Evaluation index : according to clinical observations, TCM symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, Recording treatment according to symptoms.\\nEvaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) Markedly: symptom disappeared, or symptom integral reduce = 2/3; Effective: symptom alleviative, integral is reduced=1/3,=2/3; Invalid: symptom is not alleviated or reduced<1/3.\\  , \\Classification according to the Common Terminology Criteria Adverse Events Version 4.0(CTCAE v4.0).\\, \n\\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \n\\biofeedback response will be monitored\\, \\Representation of autonomous response during the exposure of specific frequencies of modulation\\, \\The primary endpoint of the study was the development of Hepatocellular carcinoma. We assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to NUC therapy.\\, \\survival in cirrhosis and chronic hepatitis B patients\\, \\Time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\Peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfDNA in particular recurrence-related genes is tested by cfDNA sequencing and calculated by feature counts.\\, NA, \\Any adverse effect of the test is to be recorded.\\, NA, NA, NA, \\Difference would be found out by estimating cfDNA in terms of ng/mL of the blood specimen\\, NA, NA, NA, NA, NA, NA, \\According to standard imaging surveillance protocol, and confirmatory CT/MRI/biopsy\\, \\Positive family history of liver cancer, BMI, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\Composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\According to Fibrotest/Fibrosure and transient elastography\\, \\to determine the clinical utility of Annexin A2 serum level as a novel diagnostic marker of hepatocellular carcinoma (HCC) and to correlate its level with alpha fetoprotein the current marker of (HCC).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [4] c(\\NCT03338166\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT03311152\\, \\NCT03311152\\, \\NCT01641276\\, \\NCT01641276\\, \\NCT02025842\\, \\NCT02025842\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT01831037\\, \\NCT01831037\\, \n\\NCT01831037\\, \\NCT01831037\\, \\NCT02541149\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## 5 Levels: c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\) ...
class(corpus)
## [1] "factor"
corpus <- Corpus(VectorSource(corpus))
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            
## [2] c(\\To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (AM RF EMF) in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program.\\, \n\\Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professional Committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to Guangzhou standard in 2001. Once new or suspected place nature lesions within liver were found by B-ultrasonography examination,we should do CT, MRI or PET-CT review, in order to confirm the diagnosis. If imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but AFP values> 400µg/L or ongoing elevated AFP values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nNA, \\RFS is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, NA, \\OS is defined as from date of randomization until the date of documented death from any cause.\\, \\Using Karnofsky-Performance-Status score:\\nEvaluation Methods: Comparison of symptom scores before and after the treatment.\\nMarkedly: increasing by more than 20 points after treatment compared to before treatment; Effective: increasing by more than 10 points after treatment compared to before treatment; Stable: increasing by less than 10 points or no change after treatment compared to before treatment; Invalid: decrease after treatment than before treatment.\\, \n\\Evaluation index : according to clinical observations, TCM symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, Recording treatment according to symptoms.\\nEvaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) Markedly: symptom disappeared, or symptom integral reduce = 2/3; Effective: symptom alleviative, integral is reduced=1/3,=2/3; Invalid: symptom is not alleviated or reduced<1/3.\\  , \\Classification according to the Common Terminology Criteria Adverse Events Version 4.0(CTCAE v4.0).\\, \n\\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \n\\biofeedback response will be monitored\\, \\Representation of autonomous response during the exposure of specific frequencies of modulation\\, \\The primary endpoint of the study was the development of Hepatocellular carcinoma. We assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to NUC therapy.\\, \\survival in cirrhosis and chronic hepatitis B patients\\, \\Time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\Peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfDNA in particular recurrence-related genes is tested by cfDNA sequencing and calculated by feature counts.\\, NA, \\Any adverse effect of the test is to be recorded.\\, NA, NA, NA, \\Difference would be found out by estimating cfDNA in terms of ng/mL of the blood specimen\\, NA, NA, NA, NA, NA, NA, \\According to standard imaging surveillance protocol, and confirmatory CT/MRI/biopsy\\, \\Positive family history of liver cancer, BMI, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\Composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\According to Fibrotest/Fibrosure and transient elastography\\, \\to determine the clinical utility of Annexin A2 serum level as a novel diagnostic marker of hepatocellular carcinoma (HCC) and to correlate its level with alpha fetoprotein the current marker of (HCC).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [4] c(\\NCT03338166\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT03311152\\, \\NCT03311152\\, \\NCT01641276\\, \\NCT01641276\\, \\NCT02025842\\, \\NCT02025842\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT01831037\\, \\NCT01831037\\, \n\\NCT01831037\\, \\NCT01831037\\, \\NCT02541149\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [5] <NA>
# Clean the text 
corpus <- tm_map(corpus,tolower)
## Warning in tm_map.SimpleCorpus(corpus, tolower): transformation drops
## documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\the diagnosis of hcc will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\the diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\3 years\\, \\change from baseline to 3 years\\, \\change from baseline to 3 years\\, \\change from baseline to 3 years\\, \\1 month\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            
## [2] c(\\to evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (am rf emf) in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program.\\, \n\\diagnostic criteria for hepatocellular carcinoma recurrence: refer to chinese anti-cancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in 2001. once new or suspected place nature lesions within liver were found by b-ultrasonography examination,we should do ct, mri or pet-ct review, in order to confirm the diagnosis. if imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but afp values> 400µg/l or ongoing elevated afp values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nna, \\rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, na, \\os is defined as from date of randomization until the date of documented death from any cause.\\, \\using karnofsky-performance-status score:\\nevaluation methods: comparison of symptom scores before and after the treatment.\\nmarkedly: increasing by more than 20 points after treatment compared to before treatment; effective: increasing by more than 10 points after treatment compared to before treatment; stable: increasing by less than 10 points or no change after treatment compared to before treatment; invalid: decrease after treatment than before treatment.\\, \n\\evaluation index : according to clinical observations, tcm symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, recording treatment according to symptoms.\\nevaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) markedly: symptom disappeared, or symptom integral reduce = 2/3; effective: symptom alleviative, integral is reduced=1/3,=2/3; invalid: symptom is not alleviated or reduced<1/3.\\  , \\classification according to the common terminology criteria adverse events version 4.0(ctcae v4.0).\\, \n\\the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases (aasld) (hepatology. 2011;53:1020-2). the adjudicating physicians will be blinded to patient results associated with the msept9 test.\\, \\the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases (aasld) (hepatology. 2011;53:1020-2). the adjudicating physicians will be blinded to patient results associated with the msept9 test.\\, \n\\biofeedback response will be monitored\\, \\representation of autonomous response during the exposure of specific frequencies of modulation\\, \\the primary endpoint of the study was the development of hepatocellular carcinoma. we assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to nuc therapy.\\, \\survival in cirrhosis and chronic hepatitis b patients\\, \\time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfdna in particular recurrence-related genes is tested by cfdna sequencing and calculated by feature counts.\\, na, \\any adverse effect of the test is to be recorded.\\, na, na, na, \\difference would be found out by estimating cfdna in terms of ng/ml of the blood specimen\\, na, na, na, na, na, na, \\according to standard imaging surveillance protocol, and confirmatory ct/mri/biopsy\\, \\positive family history of liver cancer, bmi, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\according to fibrotest/fibrosure and transient elastography\\, \\to determine the clinical utility of annexin a2 serum level as a novel diagnostic marker of hepatocellular carcinoma (hcc) and to correlate its level with alpha fetoprotein the current marker of (hcc).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [4] c(\\nct03338166\\, \\nct03448757\\, \\nct03448757\\, \\nct03448757\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct03311152\\, \\nct03311152\\, \\nct01641276\\, \\nct01641276\\, \\nct02025842\\, \\nct02025842\\, \\nct03493763\\, \\nct03493763\\, \\nct03493763\\, \\nct03493763\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct01831037\\, \\nct01831037\\, \n\\nct01831037\\, \\nct01831037\\, \\nct02541149\\)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [5] <NA>
corpus <- tm_map(corpus,removePunctuation)
## Warning in tm_map.SimpleCorpus(corpus, removePunctuation): transformation
## drops documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c2 months 90 min on day 1 and day 2 120 min single procedure 120 min single procedure in the three years after hepatectomy in a year after hepatectomy up to 5 years in a year or three years after hepatectomy up to 5 years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of 3 months up to 5 years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within 10 min of exposure within 10 minutes of exposure followup of 625 months range 18 to 112 months followup of 625 months range 18 to 112 months 2 years 2 years or until tumor recurrence 2 years or until tumor recurrence 2 years \nday 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 3 years change from baseline to 3 years change from baseline to 3 years change from baseline to 3 years 1 month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                        
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in 2001 once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values 400µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than 20 points after treatment compared to before treatment effective increasing by more than 10 points after treatment compared to before treatment stable increasing by less than 10 points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index  according to clinical observations tcm symptoms are divided into 4 levels 0 no symptoms 1 mild 2 moderate 3severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment  after treatment markedly symptom disappeared or symptom integral reduce  23 effective symptom alleviative integral is reduced1323 invalid symptom is not alleviated or reduced13   classification according to the common terminology criteria adverse events version 40ctcae v40 \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology 20115310202 the adjudicating physicians will be blinded to patient results associated with the msept9 test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology 20115310202 the adjudicating physicians will be blinded to patient results associated with the msept9 test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every 3 months after liver resection 5hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to 15  year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a2 serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                             
## [4] cnct03338166 nct03448757 nct03448757 nct03448757 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct03311152 nct03311152 nct01641276 nct01641276 nct02025842 nct02025842 nct03493763 nct03493763 nct03493763 nct03493763 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct01831037 nct01831037 \nnct01831037 nct01831037 nct02541149                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                        
## [5] <NA>
corpus <- tm_map(corpus,removeNumbers)
## Warning in tm_map.SimpleCorpus(corpus, removeNumbers): transformation drops
## documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months  min on day  and day   min single procedure  min single procedure in the three years after hepatectomy in a year after hepatectomy up to  years in a year or three years after hepatectomy up to  years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of  months up to  years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within  min of exposure within  minutes of exposure followup of  months range  to  months followup of  months range  to  months  years  years or until tumor recurrence  years or until tumor recurrence  years \nday  day  day  day  day  day  day  day  day  day   years change from baseline to  years change from baseline to  years change from baseline to  years  month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in  once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than  points after treatment compared to before treatment effective increasing by more than  points after treatment compared to before treatment stable increasing by less than  points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index  according to clinical observations tcm symptoms are divided into  levels  no symptoms  mild  moderate severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment  after treatment markedly symptom disappeared or symptom integral reduce   effective symptom alleviative integral is reduced invalid symptom is not alleviated or reduced   classification according to the common terminology criteria adverse events version ctcae v \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology  the adjudicating physicians will be blinded to patient results associated with the msept test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology  the adjudicating physicians will be blinded to patient results associated with the msept test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every  months after liver resection hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to   year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                  
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                     
## [5] <NA>
corpus_clean<-tm_map(corpus,stripWhitespace)
## Warning in tm_map.SimpleCorpus(corpus, stripWhitespace): transformation
## drops documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months  min on day  and day   min single procedure  min single procedure in the three years after hepatectomy in a year after hepatectomy up to  years in a year or three years after hepatectomy up to  years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of  months up to  years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within  min of exposure within  minutes of exposure followup of  months range  to  months followup of  months range  to  months  years  years or until tumor recurrence  years or until tumor recurrence  years \nday  day  day  day  day  day  day  day  day  day   years change from baseline to  years change from baseline to  years change from baseline to  years  month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in  once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than  points after treatment compared to before treatment effective increasing by more than  points after treatment compared to before treatment stable increasing by less than  points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index  according to clinical observations tcm symptoms are divided into  levels  no symptoms  mild  moderate severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment  after treatment markedly symptom disappeared or symptom integral reduce   effective symptom alleviative integral is reduced invalid symptom is not alleviated or reduced   classification according to the common terminology criteria adverse events version ctcae v \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology  the adjudicating physicians will be blinded to patient results associated with the msept test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology  the adjudicating physicians will be blinded to patient results associated with the msept test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every  months after liver resection hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to   year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                  
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                     
## [5] <NA>
cleanset<-tm_map(corpus,removeWords, stopwords('english'))
## Warning in tm_map.SimpleCorpus(corpus, removeWords, stopwords("english")):
## transformation drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months  min  day   day   min single procedure  min single procedure   three years  hepatectomy   year  hepatectomy    years   year  three years  hepatectomy    years   year  three years  hepatectomy participants will  followed   duration  study  expected average   months    years  diagnosis  hcc will  based  overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation \n diagnosis will  based   overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation within  min  exposure within  minutes  exposure followup   months range    months followup   months range    months  years  years   tumor recurrence  years   tumor recurrence  years \nday  day  day  day  day  day  day  day  day  day   years change  baseline   years change  baseline   years change  baseline   years  month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [2] cto evaluate  serum ldh level can  used   predictor  response  patients receiving different lines  treatment  hepatocellular carcinoma identification  hemodymanic alterations induced   exposure  low levels  amplitude modulation radiofrequency electromagnetic fields  rf emf  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program  analyze  recorded data set collected   highprecision  noninvasive hemodynamic monitor \ncomparison  hemodynamic alteration  exposure   group  hepatocellularspecific  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence algorithms  compare  recorded data set collected   highprecision  noninvasive hemodynamic monitor identification  specifc hemodynamic alteration recorded   exposure   series  specific frequency modulations  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria  hepatocellular carcinoma recurrence refer  chinese anticancer association professional committee  hepatocellular carcinoma developed diagnostic criteria  primary hepatocellular carcinoma belong  guangzhou standard    new  suspected place nature lesions within liver  found  bultrasonography examinationwe   ct mri  petct review  order  confirm  diagnosis  imaging  positive diagnosing hepatocellular carcinomadominant recurrence  treatment  imaging  negative  afp values µgl  ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence  treatment \nna rfs  defined   date  randomization   date  first documented tumor recurrence  date  death   cause whichever came first na os  defined   date  randomization   date  documented death   cause using karnofskyperformancestatus scorenevaluation methods comparison  symptom scores     treatmentnmarkedly increasing     points  treatment compared   treatment effective increasing     points  treatment compared   treatment stable increasing  less   points   change  treatment compared   treatment invalid decrease  treatment   treatment \nevaluation index  according  clinical observations tcm symptoms  divided   levels   symptoms  mild  moderate severe recording treatment according  symptomsnevaluation methods comparison  symptom total integral     treatment  treatment   treatment markedly symptom disappeared  symptom integral reduce   effective symptom alleviative integral  reduced invalid symptom   alleviated  reduced   classification according   common terminology criteria adverse events version ctcae v \n diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test  diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test \nbiofeedback response will  monitored representation  autonomous response   exposure  specific frequencies  modulation  primary endpoint   study   development  hepatocellular carcinoma  assessed  risk  development  hepatocellular carcinoma according  liver status viral response  treatment   presence  previous resistance  nuc therapy survival  cirrhosis  chronic hepatitis b patients time   day  liver resection   day  clinical diagnosis  recurrence \nperipheral blood  drawn every  months  liver resection hmc level  cfdna  particular recurrencerelated genes  tested  cfdna sequencing  calculated  feature counts na  adverse effect   test    recorded na na na difference   found   estimating cfdna  terms  ngml   blood specimen na na na na na na according  standard imaging surveillance protocol  confirmatory ctmribiopsy positive family history  liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption  diet diabetes mellitus use  drugs  chronic medical conditions \ncomposite  regression  fibrosis plus  specific conditions decreasing incidence  hepatocellular carcinoma    year according  fibrotestfibrosure  transient elastography  determine  clinical utility  annexin  serum level   novel diagnostic marker  hepatocellular carcinoma hcc   correlate  level  alpha fetoprotein  current marker  hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [5] <NA>
# write.table(cleanset,"cleanset.txt",row.names = F)



removeURL <- function(x) gsub('http[[:alnum:]]*','',x)
cleanset <- tm_map(cleanset, content_transformer(removeURL))
## Warning in tm_map.SimpleCorpus(cleanset, content_transformer(removeURL)):
## transformation drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months  min  day   day   min single procedure  min single procedure   three years  hepatectomy   year  hepatectomy    years   year  three years  hepatectomy    years   year  three years  hepatectomy participants will  followed   duration  study  expected average   months    years  diagnosis  hcc will  based  overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation \n diagnosis will  based   overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation within  min  exposure within  minutes  exposure followup   months range    months followup   months range    months  years  years   tumor recurrence  years   tumor recurrence  years \nday  day  day  day  day  day  day  day  day  day   years change  baseline   years change  baseline   years change  baseline   years  month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [2] cto evaluate  serum ldh level can  used   predictor  response  patients receiving different lines  treatment  hepatocellular carcinoma identification  hemodymanic alterations induced   exposure  low levels  amplitude modulation radiofrequency electromagnetic fields  rf emf  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program  analyze  recorded data set collected   highprecision  noninvasive hemodynamic monitor \ncomparison  hemodynamic alteration  exposure   group  hepatocellularspecific  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence algorithms  compare  recorded data set collected   highprecision  noninvasive hemodynamic monitor identification  specifc hemodynamic alteration recorded   exposure   series  specific frequency modulations  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria  hepatocellular carcinoma recurrence refer  chinese anticancer association professional committee  hepatocellular carcinoma developed diagnostic criteria  primary hepatocellular carcinoma belong  guangzhou standard    new  suspected place nature lesions within liver  found  bultrasonography examinationwe   ct mri  petct review  order  confirm  diagnosis  imaging  positive diagnosing hepatocellular carcinomadominant recurrence  treatment  imaging  negative  afp values µgl  ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence  treatment \nna rfs  defined   date  randomization   date  first documented tumor recurrence  date  death   cause whichever came first na os  defined   date  randomization   date  documented death   cause using karnofskyperformancestatus scorenevaluation methods comparison  symptom scores     treatmentnmarkedly increasing     points  treatment compared   treatment effective increasing     points  treatment compared   treatment stable increasing  less   points   change  treatment compared   treatment invalid decrease  treatment   treatment \nevaluation index  according  clinical observations tcm symptoms  divided   levels   symptoms  mild  moderate severe recording treatment according  symptomsnevaluation methods comparison  symptom total integral     treatment  treatment   treatment markedly symptom disappeared  symptom integral reduce   effective symptom alleviative integral  reduced invalid symptom   alleviated  reduced   classification according   common terminology criteria adverse events version ctcae v \n diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test  diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test \nbiofeedback response will  monitored representation  autonomous response   exposure  specific frequencies  modulation  primary endpoint   study   development  hepatocellular carcinoma  assessed  risk  development  hepatocellular carcinoma according  liver status viral response  treatment   presence  previous resistance  nuc therapy survival  cirrhosis  chronic hepatitis b patients time   day  liver resection   day  clinical diagnosis  recurrence \nperipheral blood  drawn every  months  liver resection hmc level  cfdna  particular recurrencerelated genes  tested  cfdna sequencing  calculated  feature counts na  adverse effect   test    recorded na na na difference   found   estimating cfdna  terms  ngml   blood specimen na na na na na na according  standard imaging surveillance protocol  confirmatory ctmribiopsy positive family history  liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption  diet diabetes mellitus use  drugs  chronic medical conditions \ncomposite  regression  fibrosis plus  specific conditions decreasing incidence  hepatocellular carcinoma    year according  fibrotestfibrosure  transient elastography  determine  clinical utility  annexin  serum level   novel diagnostic marker  hepatocellular carcinoma hcc   correlate  level  alpha fetoprotein  current marker  hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      
## [5] <NA>
cleanset<-tm_map(cleanset,removeWords, c('nct','cnct'))
## Warning in tm_map.SimpleCorpus(cleanset, removeWords, c("nct", "cnct")):
## transformation drops documents
# Since the nct and cnct  were used, this can be removed as we 
# dont need those registry numbers for this exercise.


# cleanset <- tm_map(cleanset, gsub,pattern = 'Compared', replacement = 'Comparison')
# the barplot pulls both Compare and Comparison as separate words. this should be 
# counted as one as both holds the same synonym.

inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months  min  day   day   min single procedure  min single procedure   three years  hepatectomy   year  hepatectomy    years   year  three years  hepatectomy    years   year  three years  hepatectomy participants will  followed   duration  study  expected average   months    years  diagnosis  hcc will  based  overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation \n diagnosis will  based   overall patients evaluation including clinical biological  imaging workup  will  carried    consultation andor  three months preceding  following  inclusion consultation within  min  exposure within  minutes  exposure followup   months range    months followup   months range    months  years  years   tumor recurrence  years   tumor recurrence  years \nday  day  day  day  day  day  day  day  day  day   years change  baseline   years change  baseline   years change  baseline   years  month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [2] cto evaluate  serum ldh level can  used   predictor  response  patients receiving different lines  treatment  hepatocellular carcinoma identification  hemodymanic alterations induced   exposure  low levels  amplitude modulation radiofrequency electromagnetic fields  rf emf  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program  analyze  recorded data set collected   highprecision  noninvasive hemodynamic monitor \ncomparison  hemodynamic alteration  exposure   group  hepatocellularspecific  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence algorithms  compare  recorded data set collected   highprecision  noninvasive hemodynamic monitor identification  specifc hemodynamic alteration recorded   exposure   series  specific frequency modulations  rf emf recorded  healthy individuals  patients  advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria  hepatocellular carcinoma recurrence refer  chinese anticancer association professional committee  hepatocellular carcinoma developed diagnostic criteria  primary hepatocellular carcinoma belong  guangzhou standard    new  suspected place nature lesions within liver  found  bultrasonography examinationwe   ct mri  petct review  order  confirm  diagnosis  imaging  positive diagnosing hepatocellular carcinomadominant recurrence  treatment  imaging  negative  afp values µgl  ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence  treatment \nna rfs  defined   date  randomization   date  first documented tumor recurrence  date  death   cause whichever came first na os  defined   date  randomization   date  documented death   cause using karnofskyperformancestatus scorenevaluation methods comparison  symptom scores     treatmentnmarkedly increasing     points  treatment compared   treatment effective increasing     points  treatment compared   treatment stable increasing  less   points   change  treatment compared   treatment invalid decrease  treatment   treatment \nevaluation index  according  clinical observations tcm symptoms  divided   levels   symptoms  mild  moderate severe recording treatment according  symptomsnevaluation methods comparison  symptom total integral     treatment  treatment   treatment markedly symptom disappeared  symptom integral reduce   effective symptom alleviative integral  reduced invalid symptom   alleviated  reduced   classification according   common terminology criteria adverse events version ctcae v \n diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test  diagnosis  hepatocellular carcinoma will  based   guidelines   american association   study  liver diseases aasld hepatology   adjudicating physicians will  blinded  patient results associated   msept test \nbiofeedback response will  monitored representation  autonomous response   exposure  specific frequencies  modulation  primary endpoint   study   development  hepatocellular carcinoma  assessed  risk  development  hepatocellular carcinoma according  liver status viral response  treatment   presence  previous resistance  nuc therapy survival  cirrhosis  chronic hepatitis b patients time   day  liver resection   day  clinical diagnosis  recurrence \nperipheral blood  drawn every  months  liver resection hmc level  cfdna  particular recurrencerelated genes  tested  cfdna sequencing  calculated  feature counts na  adverse effect   test    recorded na na na difference   found   estimating cfdna  terms  ngml   blood specimen na na na na na na according  standard imaging surveillance protocol  confirmatory ctmribiopsy positive family history  liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption  diet diabetes mellitus use  drugs  chronic medical conditions \ncomposite  regression  fibrosis plus  specific conditions decreasing incidence  hepatocellular carcinoma    year according  fibrotestfibrosure  transient elastography  determine  clinical utility  annexin  serum level   novel diagnostic marker  hepatocellular carcinoma hcc   correlate  level  alpha fetoprotein  current marker  hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
## [4]                                   \n                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                        
## [5] <NA>
cleanset <- tm_map(cleanset,stripWhitespace)
## Warning in tm_map.SimpleCorpus(cleanset, stripWhitespace): transformation
## drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata:  corpus specific: 1, document level (indexed): 0
## Content:  documents: 5
## 
## [1] c months min day day min single procedure min single procedure three years hepatectomy year hepatectomy years year three years hepatectomy years year three years hepatectomy participants will followed duration study expected average months years diagnosis hcc will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation diagnosis will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation within min exposure within minutes exposure followup months range months followup months range months years years tumor recurrence years tumor recurrence years day day day day day day day day day day years change baseline years change baseline years change baseline years month                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                         
## [2] cto evaluate serum ldh level can used predictor response patients receiving different lines treatment hepatocellular carcinoma identification hemodymanic alterations induced exposure low levels amplitude modulation radiofrequency electromagnetic fields rf emf healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program analyze recorded data set collected highprecision noninvasive hemodynamic monitor comparison hemodynamic alteration exposure group hepatocellularspecific rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence algorithms compare recorded data set collected highprecision noninvasive hemodynamic monitor identification specifc hemodynamic alteration recorded exposure series specific frequency modulations rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program diagnostic criteria hepatocellular carcinoma recurrence refer chinese anticancer association professional committee hepatocellular carcinoma developed diagnostic criteria primary hepatocellular carcinoma belong guangzhou standard new suspected place nature lesions within liver found bultrasonography examinationwe ct mri petct review order confirm diagnosis imaging positive diagnosing hepatocellular carcinomadominant recurrence treatment imaging negative afp values µgl ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence treatment na rfs defined date randomization date first documented tumor recurrence date death cause whichever came first na os defined date randomization date documented death cause using karnofskyperformancestatus scorenevaluation methods comparison symptom scores treatmentnmarkedly increasing points treatment compared treatment effective increasing points treatment compared treatment stable increasing less points change treatment compared treatment invalid decrease treatment treatment evaluation index according clinical observations tcm symptoms divided levels symptoms mild moderate severe recording treatment according symptomsnevaluation methods comparison symptom total integral treatment treatment treatment markedly symptom disappeared symptom integral reduce effective symptom alleviative integral reduced invalid symptom alleviated reduced classification according common terminology criteria adverse events version ctcae v diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test biofeedback response will monitored representation autonomous response exposure specific frequencies modulation primary endpoint study development hepatocellular carcinoma assessed risk development hepatocellular carcinoma according liver status viral response treatment presence previous resistance nuc therapy survival cirrhosis chronic hepatitis b patients time day liver resection day clinical diagnosis recurrence peripheral blood drawn every months liver resection hmc level cfdna particular recurrencerelated genes tested cfdna sequencing calculated feature counts na adverse effect test recorded na na na difference found estimating cfdna terms ngml blood specimen na na na na na na according standard imaging surveillance protocol confirmatory ctmribiopsy positive family history liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption diet diabetes mellitus use drugs chronic medical conditions composite regression fibrosis plus specific conditions decreasing incidence hepatocellular carcinoma year according fibrotestfibrosure transient elastography determine clinical utility annexin serum level novel diagnostic marker hepatocellular carcinoma hcc correlate level alpha fetoprotein current marker hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                             
## [4]                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                     
## [5] <NA>
#Term Document Matrix :
# Convert the unstructured data to structured data :
tdm <- TermDocumentMatrix(cleanset)
tdm
## <<TermDocumentMatrix (terms: 280, documents: 4)>>
## Non-/sparse entries: 297/823
## Sparsity           : 73%
## Maximal term length: 26
## Weighting          : term frequency (tf)
# the terms indicate that there are 280 words and 4 documents(# of tweets) in this TDM
# Sparsity is 73% which indicates that there are zero values
tdm <- as.matrix(tdm)
tdm[1:10,1:4]
##               Docs
## Terms           1 2 3 4
##   andor         2 0 0 0
##   average       1 0 0 0
##   based         2 2 0 0
##   baseline      3 0 0 0
##   biological    2 0 0 0
##   carried       2 0 0 0
##   change        3 1 0 0
##   clinical      2 3 0 0
##   consultation  4 0 0 0
##   day          12 2 0 0
# Bar Plot 

w <- rowSums(tdm)  # provides the no of times a particular word has been used.
w <- subset(w, w>= 3) # Pull words that were used more than 2 times.
barplot(w, las = 2, col = rainbow(50))

# the word Aquaman,Like and James as the highest frequency. This implies
# that Movie Aquaman has got more reviews about the James and 
# most of them liked the movie.

# Word Cloud :
w <- sort(rowSums(tdm), decreasing = TRUE) # Sort words in decreasing order.
set.seed(123)
wordcloud(words = names(w), freq = w, 
          max.words = 250,random.order = F,
          min.freq =  3, 
          colors = brewer.pal(8, 'Dark2'),
          scale = c(5,0.3),
          rot.per = 0.6)
## Warning in wordcloud(words = names(w), freq = w, max.words = 250,
## random.order = F, : secondaryoutcome could not be fit on page. It will not
## be plotted.

w <- data.frame(names(w),w)
colnames(w) <- c('word','freq')
wordcloud2(w,size = 0.5, shape = 'triangle', rotateRatio = 0.5, 
           minSize = 1)
# lettercloud 

letterCloud(w,word = 'HCC',frequency(2), size=1)
# Sentiment Analysis for tweets:


# Read File 
HCC_Outcome <- read.delim('cleanset.TXT')
trail_out <- as.character(HCC_Outcome[-1,])
class(trail_out)
## [1] "character"
# Obtain Sentiment scores 
s <- get_nrc_sentiment(trail_out)
## Warning: package 'bindrcpp' was built under R version 3.5.1
head(s)
##   anger anticipation disgust fear joy sadness surprise trust negative
## 1     4            8       4   14   3       7        2    11       15
## 2     0            0       0    0   0       0        0     0        0
## 3     0            0       0    0   0       0        0     0        0
##   positive
## 1       19
## 2        0
## 3        0
get_nrc_sentiment('diagnosis')
##   anger anticipation disgust fear joy sadness surprise trust negative
## 1     0            1       0    1   0       0        0     1        1
##   positive
## 1        0
# diagnosis has 1 anticipation, 1 fear, 1 trust and 1 negative value
get_nrc_sentiment('death') 
##   anger anticipation disgust fear joy sadness surprise trust negative
## 1     1            1       1    1   0       1        1     0        1
##   positive
## 1        0
# death has one anger, one anticpation, 1 disgust, 1 fear, 1 sadness, 
# 1 surprise, and 1 Negative



# barplot 

barplot(colSums(s), las = 2.5, col = rainbow(10),
        ylab = 'Count',main= 'Sentiment scores for HCC Clinical Trail')

# Overall, it looks like the outcome had lots of Anticipation on the 
# results, encountered lots of fear , anger. Most of their work had a 
# lot of negative thoughts with sadness. However the outcome also showed
# great signs of trust which show cased a lot of positive outcomes.