library(rvest)
## Warning: package 'rvest' was built under R version 3.5.1
## Loading required package: xml2
## Warning: package 'xml2' was built under R version 3.5.1
library(XML)
## Warning: package 'XML' was built under R version 3.5.1
##
## Attaching package: 'XML'
## The following object is masked from 'package:rvest':
##
## xml
library(magrittr)
## Warning: package 'magrittr' was built under R version 3.5.1
library(tm)
## Warning: package 'tm' was built under R version 3.5.1
## Loading required package: NLP
## Warning: package 'NLP' was built under R version 3.5.1
library(wordcloud)
## Warning: package 'wordcloud' was built under R version 3.5.1
## Loading required package: RColorBrewer
library(wordcloud2)
library(syuzhet)
## Warning: package 'syuzhet' was built under R version 3.5.1
library(lubridate)
## Warning: package 'lubridate' was built under R version 3.5.1
##
## Attaching package: 'lubridate'
## The following object is masked from 'package:base':
##
## date
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 3.5.1
##
## Attaching package: 'ggplot2'
## The following object is masked from 'package:NLP':
##
## annotate
library(scales)
## Warning: package 'scales' was built under R version 3.5.1
##
## Attaching package: 'scales'
## The following object is masked from 'package:syuzhet':
##
## rescale
library(reshape2)
library(dplyr)
## Warning: package 'dplyr' was built under R version 3.5.1
##
## Attaching package: 'dplyr'
## The following objects are masked from 'package:lubridate':
##
## intersect, setdiff, union
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(rclinicaltrials)
library(devtools)
## Warning: package 'devtools' was built under R version 3.5.1
## Warning: package 'usethis' was built under R version 3.5.1
# install.packages('devtools')
# devtools::install_github("lchiffon/wordcloud2")
# install_github("sachsmc/rclinicaltrials")
# ClinicalTrailReviews #############################
# HCC_Info <- clinicaltrials_download(query = c("cond=Hepatocellular Carcinoma", "phase=2","type=Intr", "rslt=With"), count = 1e6, include_results = TRUE)
# summary(HCC_Info$study_information$interventions)
z <- clinicaltrials_download(query = 'Hepatocellular Carcinoma', count = 10, include_results = TRUE)
str(z)
## List of 2
## $ study_information:List of 6
## ..$ study_info :'data.frame': 10 obs. of 43 variables:
## .. ..$ org_study_id : chr [1:10] "URL" "HSL 2016-83" "SCheng" "2017-A01885-48" ...
## .. ..$ nct_id : chr [1:10] "NCT03338166" "NCT03448757" "NCT02399033" "NCT03311152" ...
## .. ..$ brief_title : chr [1:10] "Role of LDH as a Predictor of Treatment Outcomes in Hepatocellular Carcinoma" "Determination of Autonomic Responses to the Exposure of Low Energy Electromagnetic Fields With Frequency Modula"| __truncated__ "Xihuang Capsules Prevention of Recurrence in Patients With Hepatocellular Carcinoma After Hepatectomy" "Circulating Cell-free DNA-based Epigenetic Biomarker mSEPT9 for Hepatocellular Carcinoma Detection in Cirrhosis" ...
## .. ..$ official_title : chr [1:10] "Role of LDH as a Predictor of Treatment Outcomes in Hepatocellular Carcinoma" "Determination of Autonomic Responses to the Exposure of Low Energy Electromagnetic Fields With Frequency Modula"| __truncated__ "Xihuang Capsules Prevention of Recurrence in Patients With Hepatocellular Carcinoma After Hepatectomy: A Multic"| __truncated__ "Diagnostic Accuracy of the Circulating Cell-free DNA-based Epigenetic Biomarker mSEPT9 for Hepatocellular Carci"| __truncated__ ...
## .. ..$ overall_status : chr [1:10] "Not yet recruiting" "Recruiting" "Recruiting" "Recruiting" ...
## .. ..$ start_date.text : chr [1:10] "January 2, 2018" "February 15, 2018" NA "February 12, 2018" ...
## .. ..$ start_date..attrs : chr [1:10] "Anticipated" "Actual" NA "Actual" ...
## .. ..$ completion_date.text : chr [1:10] "December 2018" "February 16, 2020" "December 2019" "February 12, 2022" ...
## .. ..$ completion_date..attrs : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
## .. ..$ completion_date_type : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
## .. ..$ lead_sponsor/agency : chr [1:10] "Assiut University" "Hospital Sirio-Libanes" "Shuqun Cheng" "Central Hospital, Nancy, France" ...
## .. ..$ overall_official.last_name : chr [1:10] "Aml R Ibrahim, Lecturer" NA "Shuqun Cheng, Ph.D" "Abderrahim OUSSALAH, MD, PhD" ...
## .. ..$ overall_official.role : chr [1:10] "Principal Investigator" NA "Principal Investigator" "Principal Investigator" ...
## .. ..$ overall_official.affiliation : chr [1:10] "Assiut University" NA "Eastern Hepatobiliary Surgical Hospital" "University Hospital of Nancy, INSERM U954, Faculty of Medicine of Nancy, University of Lorraine" ...
## .. ..$ study_type : chr [1:10] "Observational" "Interventional" "Interventional" "Interventional" ...
## .. ..$ enrollment.text : chr [1:10] "50" "60" "1000" "440" ...
## .. ..$ enrollment..attrs : chr [1:10] "Anticipated" "Anticipated" "Anticipated" "Anticipated" ...
## .. ..$ primary_condition : chr [1:10] "Hepatocellular Carcinoma" "Hepatocellular Carcinoma" "Hepatocellular Carcinoma" "Hepatocellular Carcinoma; Cirrhosis" ...
## .. ..$ primary_outcome.measure : chr [1:10] "serum LDH level as a predictor of response in hepatocellular carcinoma" "non-invasive hemodynamic parameter measurements during exposure AM RF EMF" "Hepatocellular carcinoma recurrence rate in the three years after hepatectomy" "Presence of hepatocellular carcinoma." ...
## .. ..$ primary_outcome.time_frame : chr [1:10] "2 months" "90 min on day 1 and day 2" "in the three years after hepatectomy" "The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging w"| __truncated__ ...
## .. ..$ primary_outcome.description : chr [1:10] "To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of "| __truncated__ "Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofr"| __truncated__ "Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professio"| __truncated__ "The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the S"| __truncated__ ...
## .. ..$ eligibility.sampling_method : chr [1:10] "Probability Sample" NA NA NA ...
## .. ..$ eligibility.textblock.1 : chr [1:10] "\n Inclusion Criteria:\n\n - patients with Hepatocellular carcinoma diagnosed by biopsy or ima"| __truncated__ NA NA NA ...
## .. ..$ eligibility.gender : chr [1:10] "All" "All" "All" "All" ...
## .. ..$ eligibility.minimum_age : chr [1:10] "18 Years" "18 Years" "20 Years" "18 Years" ...
## .. ..$ eligibility.maximum_age : chr [1:10] "65 Years" "80 Years" "70 Years" "N/A" ...
## .. ..$ eligibility.healthy_volunteers : chr [1:10] "No" "Accepts Healthy Volunteers" "No" "No" ...
## .. ..$ sponsors.lead_sponsor.agency : chr [1:10] "Assiut University" "Hospital Sirio-Libanes" "Shuqun Cheng" "Central Hospital, Nancy, France" ...
## .. ..$ sponsors.lead_sponsor.agency_class : chr [1:10] "Other" "Other" "Other" "Other" ...
## .. ..$ date_disclaimer : chr [1:10] "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" "ClinicalTrials.gov processed this data on December 21, 2018" ...
## .. ..$ phase : chr [1:10] NA "N/A" "Phase 4" "N/A" ...
## .. ..$ start_date : chr [1:10] NA NA "June 2014" NA ...
## .. ..$ sponsors.collaborator.agency : chr [1:10] NA NA NA "Institut National de la Santé Et de la Recherche Médicale, France" ...
## .. ..$ sponsors.collaborator.agency_class : chr [1:10] NA NA NA "Other" ...
## .. ..$ sponsors.collaborator.agency.1 : chr [1:10] NA NA NA "Groupement Interrégional de Recherche Clinique et d'Innovation" ...
## .. ..$ sponsors.collaborator.agency_class.1: chr [1:10] NA NA NA "Other" ...
## .. ..$ sponsors.collaborator.agency.2 : chr [1:10] NA NA NA "Epigenomics, Inc" ...
## .. ..$ sponsors.collaborator.agency_class.2: chr [1:10] NA NA NA "Industry" ...
## .. ..$ primary_outcome.measure.1 : chr [1:10] NA NA NA NA ...
## .. ..$ primary_outcome.time_frame.1 : chr [1:10] NA NA NA NA ...
## .. ..$ overall_official.last_name.1 : chr [1:10] NA NA NA NA ...
## .. ..$ overall_official.role.1 : chr [1:10] NA NA NA NA ...
## .. ..$ overall_official.affiliation.1 : chr [1:10] NA NA NA NA ...
## ..$ locations :'data.frame': 10 obs. of 20 variables:
## .. ..$ name : chr [1:10] "Hospital SÃrio-Libanês" "Eastern Hepatobiliary Surgical Hospital" "University Hospital of Nancy (CHRU de Nancy)" "Hospital SÃrio Libanês" ...
## .. ..$ address.city : chr [1:10] "São Paulo" "Shanghai" "Vandoeuvre-lès-Nancy" "São Paulo" ...
## .. ..$ address.country : chr [1:10] "Brazil" "China" "France" "Brazil" ...
## .. ..$ status : chr [1:10] "Recruiting" "Recruiting" "Recruiting" NA ...
## .. ..$ contact.last_name : chr [1:10] "Tatiana Zanesco" "Shuqun Cheng, Ph.D" "Abderrahim OUSSALAH, MD, PhD" NA ...
## .. ..$ contact.phone : chr [1:10] "5511983539222" "021-65564166" "+33 (0)3 83 15 36 29" NA ...
## .. ..$ contact.email : chr [1:10] "tzanesco@hotmail.com" NA "a.oussalah@chru-nancy.fr" NA ...
## .. ..$ nct_id : chr [1:10] "NCT03448757" "NCT02399033" "NCT03311152" "NCT01641276" ...
## .. ..$ address.state : chr [1:10] NA "Shanghai" NA NA ...
## .. ..$ address.zip : chr [1:10] NA "200438" "54511" "01308-050" ...
## .. ..$ investigator.last_name : chr [1:10] NA NA "Abderrahim OUSSALAH, MD, PhD" NA ...
## .. ..$ investigator.role : chr [1:10] NA NA "Principal Investigator" NA ...
## .. ..$ investigator.last_name.1: chr [1:10] NA NA "Jean-Louis GUÉANT, MD,DSc,AGAF" NA ...
## .. ..$ investigator.role.1 : chr [1:10] NA NA "Sub-Investigator" NA ...
## .. ..$ investigator.last_name.2: chr [1:10] NA NA "Jean-Pierre BRONOWICKI, MD, PhD" NA ...
## .. ..$ investigator.role.2 : chr [1:10] NA NA "Sub-Investigator" NA ...
## .. ..$ investigator.last_name.3: chr [1:10] NA NA "Valérie LAURENT, MD, PhD" NA ...
## .. ..$ investigator.role.3 : chr [1:10] NA NA "Sub-Investigator" NA ...
## .. ..$ investigator.last_name.4: chr [1:10] NA NA "Ahmet AYAV, MD, PhD" NA ...
## .. ..$ investigator.role.4 : chr [1:10] NA NA "Sub-Investigator" NA ...
## ..$ arms :'data.frame': 21 obs. of 4 variables:
## .. ..$ arm_group_label: chr [1:21] "Group A" "Group B" "Group C" "Group D" ...
## .. ..$ description : chr [1:21] "Patients with Hepatocellular carcinoma who treated with sorafenib and measure LDH serum level one month pre and post treatment" "Patients with Hepatocellular carcinoma who treated with trans catheter arterial chemo embolization (TACE) and m"| __truncated__ "Patients with Hepatocellular carcinoma who treated surgically and measure LDH serum level one month pre and post treatment" "Patients with Hepatocellular carcinoma who don't receive treatment and asses LDH serum level for 3months" ...
## .. ..$ nct_id : chr [1:21] "NCT03338166" "NCT03338166" "NCT03338166" "NCT03338166" ...
## .. ..$ arm_group_type : chr [1:21] NA NA NA NA ...
## ..$ interventions:'data.frame': 11 obs. of 10 variables:
## .. ..$ intervention_type: chr [1:11] "Other" "Other" "Drug" "Diagnostic Test" ...
## .. ..$ intervention_name: chr [1:11] "LDH serum level" "measuring hemodynamic parameters heart beat to heart beat during single-frequency exposure" "Xihuang Capsules" "\"Epi proColon 2.0 CE\" test from Epigenomics, Inc (Berlin, Germany)" ...
## .. ..$ description : chr [1:11] "Blood sample to measure LDH as a predictor of Hepatocellular carcinoma treatment outcome" "This study aims to create a method for non-invasive diagnosis of biofeedback effect exposure to LEEF modulated "| __truncated__ "In two weeks after hepatectomy, Xihuang Capsules group received Xihuang Capsules (2 g, bid), Continuously takin"| __truncated__ "The mSEPT9 assay consists of DNA extraction from plasma, bisulfite conversion of DNA, purification of bis-DNA, "| __truncated__ ...
## .. ..$ arm_group_label : chr [1:11] "Group A" "Autonomic response" "Xihuang Capsules group" "HCC-free cirrhotic patients" ...
## .. ..$ arm_group_label.1: chr [1:11] "Group B" NA NA "HCC-positive cirrhotic patients" ...
## .. ..$ arm_group_label.2: chr [1:11] "Group C" NA NA NA ...
## .. ..$ arm_group_label.3: chr [1:11] "Group D" NA NA NA ...
## .. ..$ nct_id : chr [1:11] "NCT03338166" "NCT03448757" "NCT02399033" "NCT03311152" ...
## .. ..$ other_name : chr [1:11] NA NA "Wangbang Pharmaceutical Xihuang Capsules" "Plasma mSEPT9 test" ...
## .. ..$ other_name.1 : chr [1:11] NA NA NA NA ...
## ..$ outcomes :'data.frame': 37 obs. of 5 variables:
## .. ..$ measure : chr [1:37] "serum LDH level as a predictor of response in hepatocellular carcinoma" "non-invasive hemodynamic parameter measurements during exposure AM RF EMF" "Hemodynamic alteration´s comparison among advanced cancer patients and healthy controls" "Searching for cancer-specific frequency modulation" ...
## .. ..$ time_frame : chr [1:37] "2 months" "90 min on day 1 and day 2" "120 min (single procedure)" "120 min (single procedure)" ...
## .. ..$ description: chr [1:37] "To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of "| __truncated__ "Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofr"| __truncated__ "Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded i"| __truncated__ "Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency"| __truncated__ ...
## .. ..$ type : chr [1:37] "primary_outcome" "primary_outcome" "secondary_outcome" "other_outcome" ...
## .. ..$ nct_id : chr [1:37] "NCT03338166" "NCT03448757" "NCT03448757" "NCT03448757" ...
## ..$ textblocks : NULL
## $ study_results :List of 3
## ..$ participant_flow: NULL
## ..$ baseline_data : NULL
## ..$ outcome_data : NULL
zstudyinfo <- z$study_information$study_info
zoutcomes <- z$study_information$outcomes
zinterventions <- z$study_information$interventions
zoutcomes <- as.character(zoutcomes)
zinterventions <- as.character(zinterventions)
zhcc <- rbind(zoutcomes,zinterventions)
setwd("C:/Users/Thiru/Desktop/Assignments In Progress/Text Mining/ClinicalTrialAnalysis")
write.table(zhcc,"zhcc.txt",row.names = F)
write.table(zinterventions,"inv.txt",row.names = F)
write.table(zoutcomes,"out.txt",row.names = F)
hcc <- read.delim('out.txt')
str(hcc)
## 'data.frame': 5 obs. of 1 variable:
## $ x: Factor w/ 5 levels "c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, "| __truncated__,..: 4 1 5 3 2
View(hcc)
# Build Corpus and DTM/TDM
library(tm)
corpus <- hcc[-1,]
head(corpus)
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\)
## [2] c(\\To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (AM RF EMF) in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program.\\, \n\\Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professional Committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to Guangzhou standard in 2001. Once new or suspected place nature lesions within liver were found by B-ultrasonography examination,we should do CT, MRI or PET-CT review, in order to confirm the diagnosis. If imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but AFP values> 400µg/L or ongoing elevated AFP values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nNA, \\RFS is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, NA, \\OS is defined as from date of randomization until the date of documented death from any cause.\\, \\Using Karnofsky-Performance-Status score:\\nEvaluation Methods: Comparison of symptom scores before and after the treatment.\\nMarkedly: increasing by more than 20 points after treatment compared to before treatment; Effective: increasing by more than 10 points after treatment compared to before treatment; Stable: increasing by less than 10 points or no change after treatment compared to before treatment; Invalid: decrease after treatment than before treatment.\\, \n\\Evaluation index : according to clinical observations, TCM symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, Recording treatment according to symptoms.\\nEvaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) Markedly: symptom disappeared, or symptom integral reduce = 2/3; Effective: symptom alleviative, integral is reduced=1/3,=2/3; Invalid: symptom is not alleviated or reduced<1/3.\\ , \\Classification according to the Common Terminology Criteria Adverse Events Version 4.0(CTCAE v4.0).\\, \n\\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \n\\biofeedback response will be monitored\\, \\Representation of autonomous response during the exposure of specific frequencies of modulation\\, \\The primary endpoint of the study was the development of Hepatocellular carcinoma. We assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to NUC therapy.\\, \\survival in cirrhosis and chronic hepatitis B patients\\, \\Time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\Peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfDNA in particular recurrence-related genes is tested by cfDNA sequencing and calculated by feature counts.\\, NA, \\Any adverse effect of the test is to be recorded.\\, NA, NA, NA, \\Difference would be found out by estimating cfDNA in terms of ng/mL of the blood specimen\\, NA, NA, NA, NA, NA, NA, \\According to standard imaging surveillance protocol, and confirmatory CT/MRI/biopsy\\, \\Positive family history of liver cancer, BMI, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\Composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\According to Fibrotest/Fibrosure and transient elastography\\, \\to determine the clinical utility of Annexin A2 serum level as a novel diagnostic marker of hepatocellular carcinoma (HCC) and to correlate its level with alpha fetoprotein the current marker of (HCC).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)
## [4] c(\\NCT03338166\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT03311152\\, \\NCT03311152\\, \\NCT01641276\\, \\NCT01641276\\, \\NCT02025842\\, \\NCT02025842\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT01831037\\, \\NCT01831037\\, \n\\NCT01831037\\, \\NCT01831037\\, \\NCT02541149\\)
## 5 Levels: c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\) ...
class(corpus)
## [1] "factor"
corpus <- Corpus(VectorSource(corpus))
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\The diagnosis of HCC will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\The diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\Day 0\\, \\3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\Change from baseline to 3 years\\, \\1 month\\)
## [2] c(\\To evaluate if serum LDH level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\Identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (AM RF EMF) in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\Comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\Identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations AM RF EMF recorded in healthy individuals and patients with advanced hepatocellular carcinoma using Artificial Intelligence program.\\, \n\\Diagnostic criteria for hepatocellular carcinoma recurrence: refer to Chinese Anti-Cancer Association Professional Committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to Guangzhou standard in 2001. Once new or suspected place nature lesions within liver were found by B-ultrasonography examination,we should do CT, MRI or PET-CT review, in order to confirm the diagnosis. If imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but AFP values> 400µg/L or ongoing elevated AFP values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nNA, \\RFS is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, NA, \\OS is defined as from date of randomization until the date of documented death from any cause.\\, \\Using Karnofsky-Performance-Status score:\\nEvaluation Methods: Comparison of symptom scores before and after the treatment.\\nMarkedly: increasing by more than 20 points after treatment compared to before treatment; Effective: increasing by more than 10 points after treatment compared to before treatment; Stable: increasing by less than 10 points or no change after treatment compared to before treatment; Invalid: decrease after treatment than before treatment.\\, \n\\Evaluation index : according to clinical observations, TCM symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, Recording treatment according to symptoms.\\nEvaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) Markedly: symptom disappeared, or symptom integral reduce = 2/3; Effective: symptom alleviative, integral is reduced=1/3,=2/3; Invalid: symptom is not alleviated or reduced<1/3.\\ , \\Classification according to the Common Terminology Criteria Adverse Events Version 4.0(CTCAE v4.0).\\, \n\\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \\The diagnosis of hepatocellular carcinoma will be based on the guidelines of the American Association for the Study of Liver Diseases (AASLD) (Hepatology. 2011;53:1020-2). The adjudicating physicians will be blinded to patient results associated with the mSEPT9 test.\\, \n\\biofeedback response will be monitored\\, \\Representation of autonomous response during the exposure of specific frequencies of modulation\\, \\The primary endpoint of the study was the development of Hepatocellular carcinoma. We assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to NUC therapy.\\, \\survival in cirrhosis and chronic hepatitis B patients\\, \\Time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\Peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfDNA in particular recurrence-related genes is tested by cfDNA sequencing and calculated by feature counts.\\, NA, \\Any adverse effect of the test is to be recorded.\\, NA, NA, NA, \\Difference would be found out by estimating cfDNA in terms of ng/mL of the blood specimen\\, NA, NA, NA, NA, NA, NA, \\According to standard imaging surveillance protocol, and confirmatory CT/MRI/biopsy\\, \\Positive family history of liver cancer, BMI, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\Composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\According to Fibrotest/Fibrosure and transient elastography\\, \\to determine the clinical utility of Annexin A2 serum level as a novel diagnostic marker of hepatocellular carcinoma (HCC) and to correlate its level with alpha fetoprotein the current marker of (HCC).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)
## [4] c(\\NCT03338166\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT03448757\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT02399033\\, \\NCT03311152\\, \\NCT03311152\\, \\NCT01641276\\, \\NCT01641276\\, \\NCT02025842\\, \\NCT02025842\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03493763\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT03162198\\, \\NCT01831037\\, \\NCT01831037\\, \n\\NCT01831037\\, \\NCT01831037\\, \\NCT02541149\\)
## [5] <NA>
# Clean the text
corpus <- tm_map(corpus,tolower)
## Warning in tm_map.SimpleCorpus(corpus, tolower): transformation drops
## documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c(\\2 months\\, \\90 min on day 1 and day 2\\, \\120 min (single procedure)\\, \\120 min (single procedure)\\, \\in the three years after hepatectomy\\, \\in a year after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\up to 5 years\\, \\in a year or three years after hepatectomy\\, \\participants will be followed for the duration of study, an expected average of 3 months.\\, \\up to 5 years\\, \\the diagnosis of hcc will be based on overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \n\\the diagnosis will be based on an overall patient's evaluation including clinical, biological and imaging workup which will be carried out during the consultation and/or the three months preceding or following the inclusion consultation.\\, \\within 10 min of exposure\\, \\within 10 minutes of exposure\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\follow-up of 62.5 months (range, 18 to 112 months),\\, \\2 years\\, \\2 years or until tumor recurrence\\, \\2 years or until tumor recurrence\\, \\2 years\\, \n\\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\day 0\\, \\3 years\\, \\change from baseline to 3 years\\, \\change from baseline to 3 years\\, \\change from baseline to 3 years\\, \\1 month\\)
## [2] c(\\to evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma\\, \\identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields (am rf emf) in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \n\\comparison of hemodynamic alteration during exposure to a group of hepatocellular-specific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a high-precision and non-invasive hemodynamic monitor.\\, \\identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program.\\, \n\\diagnostic criteria for hepatocellular carcinoma recurrence: refer to chinese anti-cancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in 2001. once new or suspected place nature lesions within liver were found by b-ultrasonography examination,we should do ct, mri or pet-ct review, in order to confirm the diagnosis. if imaging is positive, diagnosing hepatocellular carcinoma(dominant) recurrence after treatment; if imaging is negative, but afp values> 400µg/l or ongoing elevated afp values, diagnosing hepatocellular carcinoma occult recurrence after treatment.\\, \nna, \\rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause, whichever came first.\\, na, \\os is defined as from date of randomization until the date of documented death from any cause.\\, \\using karnofsky-performance-status score:\\nevaluation methods: comparison of symptom scores before and after the treatment.\\nmarkedly: increasing by more than 20 points after treatment compared to before treatment; effective: increasing by more than 10 points after treatment compared to before treatment; stable: increasing by less than 10 points or no change after treatment compared to before treatment; invalid: decrease after treatment than before treatment.\\, \n\\evaluation index : according to clinical observations, tcm symptoms are divided into 4 levels: (0) no symptoms, (1) mild, (2) moderate, (3)severe, recording treatment according to symptoms.\\nevaluation methods: comparison of symptom total integral before and after the treatment (before treatment / after treatment) markedly: symptom disappeared, or symptom integral reduce = 2/3; effective: symptom alleviative, integral is reduced=1/3,=2/3; invalid: symptom is not alleviated or reduced<1/3.\\ , \\classification according to the common terminology criteria adverse events version 4.0(ctcae v4.0).\\, \n\\the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases (aasld) (hepatology. 2011;53:1020-2). the adjudicating physicians will be blinded to patient results associated with the msept9 test.\\, \\the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases (aasld) (hepatology. 2011;53:1020-2). the adjudicating physicians will be blinded to patient results associated with the msept9 test.\\, \n\\biofeedback response will be monitored\\, \\representation of autonomous response during the exposure of specific frequencies of modulation\\, \\the primary endpoint of the study was the development of hepatocellular carcinoma. we assessed the risk of development of hepatocellular carcinoma according to liver status, viral response to treatment, and the presence of previous resistance to nuc therapy.\\, \\survival in cirrhosis and chronic hepatitis b patients\\, \\time from the day of liver resection to the day of clinical diagnosis of recurrence\\, \n\\peripheral blood is drawn every 3 months after liver resection. 5hmc level in cfdna in particular recurrence-related genes is tested by cfdna sequencing and calculated by feature counts.\\, na, \\any adverse effect of the test is to be recorded.\\, na, na, na, \\difference would be found out by estimating cfdna in terms of ng/ml of the blood specimen\\, na, na, na, na, na, na, \\according to standard imaging surveillance protocol, and confirmatory ct/mri/biopsy\\, \\positive family history of liver cancer, bmi, active/previous smoking, active/previous alcohol consumption, caffeine consumption in diet, diabetes mellitus, use of drugs for chronic medical conditions\\, \n\\composite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to <1.5% / year\\, \\according to fibrotest/fibrosure and transient elastography\\, \\to determine the clinical utility of annexin a2 serum level as a novel diagnostic marker of hepatocellular carcinoma (hcc) and to correlate its level with alpha fetoprotein the current marker of (hcc).\\)
## [3] c(\\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \n\\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\primary_outcome\\, \\secondary_outcome\\, \\secondary_outcome\\, \\other_outcome\\, \\primary_outcome\\)
## [4] c(\\nct03338166\\, \\nct03448757\\, \\nct03448757\\, \\nct03448757\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct02399033\\, \\nct03311152\\, \\nct03311152\\, \\nct01641276\\, \\nct01641276\\, \\nct02025842\\, \\nct02025842\\, \\nct03493763\\, \\nct03493763\\, \\nct03493763\\, \\nct03493763\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct03162198\\, \\nct01831037\\, \\nct01831037\\, \n\\nct01831037\\, \\nct01831037\\, \\nct02541149\\)
## [5] <NA>
corpus <- tm_map(corpus,removePunctuation)
## Warning in tm_map.SimpleCorpus(corpus, removePunctuation): transformation
## drops documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c2 months 90 min on day 1 and day 2 120 min single procedure 120 min single procedure in the three years after hepatectomy in a year after hepatectomy up to 5 years in a year or three years after hepatectomy up to 5 years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of 3 months up to 5 years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within 10 min of exposure within 10 minutes of exposure followup of 625 months range 18 to 112 months followup of 625 months range 18 to 112 months 2 years 2 years or until tumor recurrence 2 years or until tumor recurrence 2 years \nday 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 day 0 3 years change from baseline to 3 years change from baseline to 3 years change from baseline to 3 years 1 month
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in 2001 once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values 400µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than 20 points after treatment compared to before treatment effective increasing by more than 10 points after treatment compared to before treatment stable increasing by less than 10 points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index according to clinical observations tcm symptoms are divided into 4 levels 0 no symptoms 1 mild 2 moderate 3severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment after treatment markedly symptom disappeared or symptom integral reduce 23 effective symptom alleviative integral is reduced1323 invalid symptom is not alleviated or reduced13 classification according to the common terminology criteria adverse events version 40ctcae v40 \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology 20115310202 the adjudicating physicians will be blinded to patient results associated with the msept9 test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology 20115310202 the adjudicating physicians will be blinded to patient results associated with the msept9 test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every 3 months after liver resection 5hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to 15 year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a2 serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] cnct03338166 nct03448757 nct03448757 nct03448757 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct02399033 nct03311152 nct03311152 nct01641276 nct01641276 nct02025842 nct02025842 nct03493763 nct03493763 nct03493763 nct03493763 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct03162198 nct01831037 nct01831037 \nnct01831037 nct01831037 nct02541149
## [5] <NA>
corpus <- tm_map(corpus,removeNumbers)
## Warning in tm_map.SimpleCorpus(corpus, removeNumbers): transformation drops
## documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min on day and day min single procedure min single procedure in the three years after hepatectomy in a year after hepatectomy up to years in a year or three years after hepatectomy up to years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of months up to years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within min of exposure within minutes of exposure followup of months range to months followup of months range to months years years or until tumor recurrence years or until tumor recurrence years \nday day day day day day day day day day years change from baseline to years change from baseline to years change from baseline to years month
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than points after treatment compared to before treatment effective increasing by more than points after treatment compared to before treatment stable increasing by less than points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index according to clinical observations tcm symptoms are divided into levels no symptoms mild moderate severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment after treatment markedly symptom disappeared or symptom integral reduce effective symptom alleviative integral is reduced invalid symptom is not alleviated or reduced classification according to the common terminology criteria adverse events version ctcae v \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology the adjudicating physicians will be blinded to patient results associated with the msept test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology the adjudicating physicians will be blinded to patient results associated with the msept test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every months after liver resection hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct
## [5] <NA>
corpus_clean<-tm_map(corpus,stripWhitespace)
## Warning in tm_map.SimpleCorpus(corpus, stripWhitespace): transformation
## drops documents
inspect(corpus[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min on day and day min single procedure min single procedure in the three years after hepatectomy in a year after hepatectomy up to years in a year or three years after hepatectomy up to years in a year or three years after hepatectomy participants will be followed for the duration of study an expected average of months up to years the diagnosis of hcc will be based on overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation \nthe diagnosis will be based on an overall patients evaluation including clinical biological and imaging workup which will be carried out during the consultation andor the three months preceding or following the inclusion consultation within min of exposure within minutes of exposure followup of months range to months followup of months range to months years years or until tumor recurrence years or until tumor recurrence years \nday day day day day day day day day day years change from baseline to years change from baseline to years change from baseline to years month
## [2] cto evaluate if serum ldh level can be used as a predictor of response in patients receiving different lines of treatment for hepatocellular carcinoma identification of hemodymanic alterations induced by the exposure to low levels of amplitude modulation radiofrequency electromagnetic fields am rf emf in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program to analyze the recorded data set collected by a highprecision and noninvasive hemodynamic monitor \ncomparison of hemodynamic alteration during exposure to a group of hepatocellularspecific am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence algorithms to compare the recorded data set collected by a highprecision and noninvasive hemodynamic monitor identification of specifc hemodynamic alteration recorded during the exposure to a series of specific frequency modulations am rf emf recorded in healthy individuals and patients with advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria for hepatocellular carcinoma recurrence refer to chinese anticancer association professional committee of hepatocellular carcinoma developed diagnostic criteria for primary hepatocellular carcinoma belong to guangzhou standard in once new or suspected place nature lesions within liver were found by bultrasonography examinationwe should do ct mri or petct review in order to confirm the diagnosis if imaging is positive diagnosing hepatocellular carcinomadominant recurrence after treatment if imaging is negative but afp values µgl or ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence after treatment \nna rfs is defined as from date of randomization until the date of first documented tumor recurrence or date of death from any cause whichever came first na os is defined as from date of randomization until the date of documented death from any cause using karnofskyperformancestatus scorenevaluation methods comparison of symptom scores before and after the treatmentnmarkedly increasing by more than points after treatment compared to before treatment effective increasing by more than points after treatment compared to before treatment stable increasing by less than points or no change after treatment compared to before treatment invalid decrease after treatment than before treatment \nevaluation index according to clinical observations tcm symptoms are divided into levels no symptoms mild moderate severe recording treatment according to symptomsnevaluation methods comparison of symptom total integral before and after the treatment before treatment after treatment markedly symptom disappeared or symptom integral reduce effective symptom alleviative integral is reduced invalid symptom is not alleviated or reduced classification according to the common terminology criteria adverse events version ctcae v \nthe diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology the adjudicating physicians will be blinded to patient results associated with the msept test the diagnosis of hepatocellular carcinoma will be based on the guidelines of the american association for the study of liver diseases aasld hepatology the adjudicating physicians will be blinded to patient results associated with the msept test \nbiofeedback response will be monitored representation of autonomous response during the exposure of specific frequencies of modulation the primary endpoint of the study was the development of hepatocellular carcinoma we assessed the risk of development of hepatocellular carcinoma according to liver status viral response to treatment and the presence of previous resistance to nuc therapy survival in cirrhosis and chronic hepatitis b patients time from the day of liver resection to the day of clinical diagnosis of recurrence \nperipheral blood is drawn every months after liver resection hmc level in cfdna in particular recurrencerelated genes is tested by cfdna sequencing and calculated by feature counts na any adverse effect of the test is to be recorded na na na difference would be found out by estimating cfdna in terms of ngml of the blood specimen na na na na na na according to standard imaging surveillance protocol and confirmatory ctmribiopsy positive family history of liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption in diet diabetes mellitus use of drugs for chronic medical conditions \ncomposite of regression of fibrosis plus other specific conditions decreasing incidence of hepatocellular carcinoma to year according to fibrotestfibrosure and transient elastography to determine the clinical utility of annexin a serum level as a novel diagnostic marker of hepatocellular carcinoma hcc and to correlate its level with alpha fetoprotein the current marker of hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct
## [5] <NA>
cleanset<-tm_map(corpus,removeWords, stopwords('english'))
## Warning in tm_map.SimpleCorpus(corpus, removeWords, stopwords("english")):
## transformation drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min day day min single procedure min single procedure three years hepatectomy year hepatectomy years year three years hepatectomy years year three years hepatectomy participants will followed duration study expected average months years diagnosis hcc will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation \n diagnosis will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation within min exposure within minutes exposure followup months range months followup months range months years years tumor recurrence years tumor recurrence years \nday day day day day day day day day day years change baseline years change baseline years change baseline years month
## [2] cto evaluate serum ldh level can used predictor response patients receiving different lines treatment hepatocellular carcinoma identification hemodymanic alterations induced exposure low levels amplitude modulation radiofrequency electromagnetic fields rf emf healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program analyze recorded data set collected highprecision noninvasive hemodynamic monitor \ncomparison hemodynamic alteration exposure group hepatocellularspecific rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence algorithms compare recorded data set collected highprecision noninvasive hemodynamic monitor identification specifc hemodynamic alteration recorded exposure series specific frequency modulations rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria hepatocellular carcinoma recurrence refer chinese anticancer association professional committee hepatocellular carcinoma developed diagnostic criteria primary hepatocellular carcinoma belong guangzhou standard new suspected place nature lesions within liver found bultrasonography examinationwe ct mri petct review order confirm diagnosis imaging positive diagnosing hepatocellular carcinomadominant recurrence treatment imaging negative afp values µgl ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence treatment \nna rfs defined date randomization date first documented tumor recurrence date death cause whichever came first na os defined date randomization date documented death cause using karnofskyperformancestatus scorenevaluation methods comparison symptom scores treatmentnmarkedly increasing points treatment compared treatment effective increasing points treatment compared treatment stable increasing less points change treatment compared treatment invalid decrease treatment treatment \nevaluation index according clinical observations tcm symptoms divided levels symptoms mild moderate severe recording treatment according symptomsnevaluation methods comparison symptom total integral treatment treatment treatment markedly symptom disappeared symptom integral reduce effective symptom alleviative integral reduced invalid symptom alleviated reduced classification according common terminology criteria adverse events version ctcae v \n diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test \nbiofeedback response will monitored representation autonomous response exposure specific frequencies modulation primary endpoint study development hepatocellular carcinoma assessed risk development hepatocellular carcinoma according liver status viral response treatment presence previous resistance nuc therapy survival cirrhosis chronic hepatitis b patients time day liver resection day clinical diagnosis recurrence \nperipheral blood drawn every months liver resection hmc level cfdna particular recurrencerelated genes tested cfdna sequencing calculated feature counts na adverse effect test recorded na na na difference found estimating cfdna terms ngml blood specimen na na na na na na according standard imaging surveillance protocol confirmatory ctmribiopsy positive family history liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption diet diabetes mellitus use drugs chronic medical conditions \ncomposite regression fibrosis plus specific conditions decreasing incidence hepatocellular carcinoma year according fibrotestfibrosure transient elastography determine clinical utility annexin serum level novel diagnostic marker hepatocellular carcinoma hcc correlate level alpha fetoprotein current marker hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct
## [5] <NA>
# write.table(cleanset,"cleanset.txt",row.names = F)
removeURL <- function(x) gsub('http[[:alnum:]]*','',x)
cleanset <- tm_map(cleanset, content_transformer(removeURL))
## Warning in tm_map.SimpleCorpus(cleanset, content_transformer(removeURL)):
## transformation drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min day day min single procedure min single procedure three years hepatectomy year hepatectomy years year three years hepatectomy years year three years hepatectomy participants will followed duration study expected average months years diagnosis hcc will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation \n diagnosis will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation within min exposure within minutes exposure followup months range months followup months range months years years tumor recurrence years tumor recurrence years \nday day day day day day day day day day years change baseline years change baseline years change baseline years month
## [2] cto evaluate serum ldh level can used predictor response patients receiving different lines treatment hepatocellular carcinoma identification hemodymanic alterations induced exposure low levels amplitude modulation radiofrequency electromagnetic fields rf emf healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program analyze recorded data set collected highprecision noninvasive hemodynamic monitor \ncomparison hemodynamic alteration exposure group hepatocellularspecific rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence algorithms compare recorded data set collected highprecision noninvasive hemodynamic monitor identification specifc hemodynamic alteration recorded exposure series specific frequency modulations rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria hepatocellular carcinoma recurrence refer chinese anticancer association professional committee hepatocellular carcinoma developed diagnostic criteria primary hepatocellular carcinoma belong guangzhou standard new suspected place nature lesions within liver found bultrasonography examinationwe ct mri petct review order confirm diagnosis imaging positive diagnosing hepatocellular carcinomadominant recurrence treatment imaging negative afp values µgl ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence treatment \nna rfs defined date randomization date first documented tumor recurrence date death cause whichever came first na os defined date randomization date documented death cause using karnofskyperformancestatus scorenevaluation methods comparison symptom scores treatmentnmarkedly increasing points treatment compared treatment effective increasing points treatment compared treatment stable increasing less points change treatment compared treatment invalid decrease treatment treatment \nevaluation index according clinical observations tcm symptoms divided levels symptoms mild moderate severe recording treatment according symptomsnevaluation methods comparison symptom total integral treatment treatment treatment markedly symptom disappeared symptom integral reduce effective symptom alleviative integral reduced invalid symptom alleviated reduced classification according common terminology criteria adverse events version ctcae v \n diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test \nbiofeedback response will monitored representation autonomous response exposure specific frequencies modulation primary endpoint study development hepatocellular carcinoma assessed risk development hepatocellular carcinoma according liver status viral response treatment presence previous resistance nuc therapy survival cirrhosis chronic hepatitis b patients time day liver resection day clinical diagnosis recurrence \nperipheral blood drawn every months liver resection hmc level cfdna particular recurrencerelated genes tested cfdna sequencing calculated feature counts na adverse effect test recorded na na na difference found estimating cfdna terms ngml blood specimen na na na na na na according standard imaging surveillance protocol confirmatory ctmribiopsy positive family history liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption diet diabetes mellitus use drugs chronic medical conditions \ncomposite regression fibrosis plus specific conditions decreasing incidence hepatocellular carcinoma year according fibrotestfibrosure transient elastography determine clinical utility annexin serum level novel diagnostic marker hepatocellular carcinoma hcc correlate level alpha fetoprotein current marker hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] cnct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct nct \nnct nct nct
## [5] <NA>
cleanset<-tm_map(cleanset,removeWords, c('nct','cnct'))
## Warning in tm_map.SimpleCorpus(cleanset, removeWords, c("nct", "cnct")):
## transformation drops documents
# Since the nct and cnct were used, this can be removed as we
# dont need those registry numbers for this exercise.
# cleanset <- tm_map(cleanset, gsub,pattern = 'Compared', replacement = 'Comparison')
# the barplot pulls both Compare and Comparison as separate words. this should be
# counted as one as both holds the same synonym.
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min day day min single procedure min single procedure three years hepatectomy year hepatectomy years year three years hepatectomy years year three years hepatectomy participants will followed duration study expected average months years diagnosis hcc will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation \n diagnosis will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation within min exposure within minutes exposure followup months range months followup months range months years years tumor recurrence years tumor recurrence years \nday day day day day day day day day day years change baseline years change baseline years change baseline years month
## [2] cto evaluate serum ldh level can used predictor response patients receiving different lines treatment hepatocellular carcinoma identification hemodymanic alterations induced exposure low levels amplitude modulation radiofrequency electromagnetic fields rf emf healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program analyze recorded data set collected highprecision noninvasive hemodynamic monitor \ncomparison hemodynamic alteration exposure group hepatocellularspecific rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence algorithms compare recorded data set collected highprecision noninvasive hemodynamic monitor identification specifc hemodynamic alteration recorded exposure series specific frequency modulations rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program \ndiagnostic criteria hepatocellular carcinoma recurrence refer chinese anticancer association professional committee hepatocellular carcinoma developed diagnostic criteria primary hepatocellular carcinoma belong guangzhou standard new suspected place nature lesions within liver found bultrasonography examinationwe ct mri petct review order confirm diagnosis imaging positive diagnosing hepatocellular carcinomadominant recurrence treatment imaging negative afp values µgl ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence treatment \nna rfs defined date randomization date first documented tumor recurrence date death cause whichever came first na os defined date randomization date documented death cause using karnofskyperformancestatus scorenevaluation methods comparison symptom scores treatmentnmarkedly increasing points treatment compared treatment effective increasing points treatment compared treatment stable increasing less points change treatment compared treatment invalid decrease treatment treatment \nevaluation index according clinical observations tcm symptoms divided levels symptoms mild moderate severe recording treatment according symptomsnevaluation methods comparison symptom total integral treatment treatment treatment markedly symptom disappeared symptom integral reduce effective symptom alleviative integral reduced invalid symptom alleviated reduced classification according common terminology criteria adverse events version ctcae v \n diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test \nbiofeedback response will monitored representation autonomous response exposure specific frequencies modulation primary endpoint study development hepatocellular carcinoma assessed risk development hepatocellular carcinoma according liver status viral response treatment presence previous resistance nuc therapy survival cirrhosis chronic hepatitis b patients time day liver resection day clinical diagnosis recurrence \nperipheral blood drawn every months liver resection hmc level cfdna particular recurrencerelated genes tested cfdna sequencing calculated feature counts na adverse effect test recorded na na na difference found estimating cfdna terms ngml blood specimen na na na na na na according standard imaging surveillance protocol confirmatory ctmribiopsy positive family history liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption diet diabetes mellitus use drugs chronic medical conditions \ncomposite regression fibrosis plus specific conditions decreasing incidence hepatocellular carcinoma year according fibrotestfibrosure transient elastography determine clinical utility annexin serum level novel diagnostic marker hepatocellular carcinoma hcc correlate level alpha fetoprotein current marker hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome \nsecondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4] \n
## [5] <NA>
cleanset <- tm_map(cleanset,stripWhitespace)
## Warning in tm_map.SimpleCorpus(cleanset, stripWhitespace): transformation
## drops documents
inspect(cleanset[1:5])
## <<SimpleCorpus>>
## Metadata: corpus specific: 1, document level (indexed): 0
## Content: documents: 5
##
## [1] c months min day day min single procedure min single procedure three years hepatectomy year hepatectomy years year three years hepatectomy years year three years hepatectomy participants will followed duration study expected average months years diagnosis hcc will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation diagnosis will based overall patients evaluation including clinical biological imaging workup will carried consultation andor three months preceding following inclusion consultation within min exposure within minutes exposure followup months range months followup months range months years years tumor recurrence years tumor recurrence years day day day day day day day day day day years change baseline years change baseline years change baseline years month
## [2] cto evaluate serum ldh level can used predictor response patients receiving different lines treatment hepatocellular carcinoma identification hemodymanic alterations induced exposure low levels amplitude modulation radiofrequency electromagnetic fields rf emf healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program analyze recorded data set collected highprecision noninvasive hemodynamic monitor comparison hemodynamic alteration exposure group hepatocellularspecific rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence algorithms compare recorded data set collected highprecision noninvasive hemodynamic monitor identification specifc hemodynamic alteration recorded exposure series specific frequency modulations rf emf recorded healthy individuals patients advanced hepatocellular carcinoma using artificial intelligence program diagnostic criteria hepatocellular carcinoma recurrence refer chinese anticancer association professional committee hepatocellular carcinoma developed diagnostic criteria primary hepatocellular carcinoma belong guangzhou standard new suspected place nature lesions within liver found bultrasonography examinationwe ct mri petct review order confirm diagnosis imaging positive diagnosing hepatocellular carcinomadominant recurrence treatment imaging negative afp values µgl ongoing elevated afp values diagnosing hepatocellular carcinoma occult recurrence treatment na rfs defined date randomization date first documented tumor recurrence date death cause whichever came first na os defined date randomization date documented death cause using karnofskyperformancestatus scorenevaluation methods comparison symptom scores treatmentnmarkedly increasing points treatment compared treatment effective increasing points treatment compared treatment stable increasing less points change treatment compared treatment invalid decrease treatment treatment evaluation index according clinical observations tcm symptoms divided levels symptoms mild moderate severe recording treatment according symptomsnevaluation methods comparison symptom total integral treatment treatment treatment markedly symptom disappeared symptom integral reduce effective symptom alleviative integral reduced invalid symptom alleviated reduced classification according common terminology criteria adverse events version ctcae v diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test diagnosis hepatocellular carcinoma will based guidelines american association study liver diseases aasld hepatology adjudicating physicians will blinded patient results associated msept test biofeedback response will monitored representation autonomous response exposure specific frequencies modulation primary endpoint study development hepatocellular carcinoma assessed risk development hepatocellular carcinoma according liver status viral response treatment presence previous resistance nuc therapy survival cirrhosis chronic hepatitis b patients time day liver resection day clinical diagnosis recurrence peripheral blood drawn every months liver resection hmc level cfdna particular recurrencerelated genes tested cfdna sequencing calculated feature counts na adverse effect test recorded na na na difference found estimating cfdna terms ngml blood specimen na na na na na na according standard imaging surveillance protocol confirmatory ctmribiopsy positive family history liver cancer bmi activeprevious smoking activeprevious alcohol consumption caffeine consumption diet diabetes mellitus use drugs chronic medical conditions composite regression fibrosis plus specific conditions decreasing incidence hepatocellular carcinoma year according fibrotestfibrosure transient elastography determine clinical utility annexin serum level novel diagnostic marker hepatocellular carcinoma hcc correlate level alpha fetoprotein current marker hcc
## [3] cprimaryoutcome primaryoutcome secondaryoutcome otheroutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome primaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome secondaryoutcome primaryoutcome secondaryoutcome secondaryoutcome otheroutcome primaryoutcome
## [4]
## [5] <NA>
#Term Document Matrix :
# Convert the unstructured data to structured data :
tdm <- TermDocumentMatrix(cleanset)
tdm
## <<TermDocumentMatrix (terms: 280, documents: 4)>>
## Non-/sparse entries: 297/823
## Sparsity : 73%
## Maximal term length: 26
## Weighting : term frequency (tf)
# the terms indicate that there are 280 words and 4 documents(# of tweets) in this TDM
# Sparsity is 73% which indicates that there are zero values
tdm <- as.matrix(tdm)
tdm[1:10,1:4]
## Docs
## Terms 1 2 3 4
## andor 2 0 0 0
## average 1 0 0 0
## based 2 2 0 0
## baseline 3 0 0 0
## biological 2 0 0 0
## carried 2 0 0 0
## change 3 1 0 0
## clinical 2 3 0 0
## consultation 4 0 0 0
## day 12 2 0 0
# Bar Plot
w <- rowSums(tdm) # provides the no of times a particular word has been used.
w <- subset(w, w>= 3) # Pull words that were used more than 2 times.
barplot(w, las = 2, col = rainbow(50))
# the word Aquaman,Like and James as the highest frequency. This implies
# that Movie Aquaman has got more reviews about the James and
# most of them liked the movie.
# Word Cloud :
w <- sort(rowSums(tdm), decreasing = TRUE) # Sort words in decreasing order.
set.seed(123)
wordcloud(words = names(w), freq = w,
max.words = 250,random.order = F,
min.freq = 3,
colors = brewer.pal(8, 'Dark2'),
scale = c(5,0.3),
rot.per = 0.6)
## Warning in wordcloud(words = names(w), freq = w, max.words = 250,
## random.order = F, : secondaryoutcome could not be fit on page. It will not
## be plotted.
w <- data.frame(names(w),w)
colnames(w) <- c('word','freq')
wordcloud2(w,size = 0.5, shape = 'triangle', rotateRatio = 0.5,
minSize = 1)
# lettercloud
letterCloud(w,word = 'HCC',frequency(2), size=1)
# Sentiment Analysis for tweets:
# Read File
HCC_Outcome <- read.delim('cleanset.TXT')
trail_out <- as.character(HCC_Outcome[-1,])
class(trail_out)
## [1] "character"
# Obtain Sentiment scores
s <- get_nrc_sentiment(trail_out)
## Warning: package 'bindrcpp' was built under R version 3.5.1
head(s)
## anger anticipation disgust fear joy sadness surprise trust negative
## 1 4 8 4 14 3 7 2 11 15
## 2 0 0 0 0 0 0 0 0 0
## 3 0 0 0 0 0 0 0 0 0
## positive
## 1 19
## 2 0
## 3 0
get_nrc_sentiment('diagnosis')
## anger anticipation disgust fear joy sadness surprise trust negative
## 1 0 1 0 1 0 0 0 1 1
## positive
## 1 0
# diagnosis has 1 anticipation, 1 fear, 1 trust and 1 negative value
get_nrc_sentiment('death')
## anger anticipation disgust fear joy sadness surprise trust negative
## 1 1 1 1 1 0 1 1 0 1
## positive
## 1 0
# death has one anger, one anticpation, 1 disgust, 1 fear, 1 sadness,
# 1 surprise, and 1 Negative
# barplot
barplot(colSums(s), las = 2.5, col = rainbow(10),
ylab = 'Count',main= 'Sentiment scores for HCC Clinical Trail')
# Overall, it looks like the outcome had lots of Anticipation on the
# results, encountered lots of fear , anger. Most of their work had a
# lot of negative thoughts with sadness. However the outcome also showed
# great signs of trust which show cased a lot of positive outcomes.