Trong R có các cách sau để tải dữ liệu từ nguồn internet về dùng:
1. Dùng download.file()
# Fetch the AirPassengers CSV from GitHub into a throwaway temporary file.
temporaryFile <- tempfile()
download.file(
  url = "https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/datasets/AirPassengers.csv",
  destfile = temporaryFile
)
trying URL 'https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/datasets/AirPassengers.csv'
Content type 'text/plain; charset=utf-8' length 3326 bytes
downloaded 3326 bytes
# Load the downloaded CSV into a data frame and preview its first rows.
myData <- read.csv(temporaryFile)
head(myData)
# Report the class of each column. sapply() visits the data frame column by
# column; apply() would first coerce it to a matrix and report every column
# as "numeric", hiding the integer columns.
sapply(myData, class)
X time AirPassengers
"integer" "numeric" "integer"
2. Dùng package RCurl
library(RCurl)
# Download the CSV as a single string. Certificate verification stays enabled:
# turning ssl.verifypeer off would let a tampered response go unnoticed.
# NOTE(review): if verification fails because no CA bundle is found, supply
# one via the cainfo option instead of disabling the check.
myCsv <- getURL("https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/datasets/Titanic.csv", ssl.verifypeer = TRUE)
# Parse the in-memory text directly; read.csv(text = ...) manages its own
# connection, so nothing is left open as with a bare textConnection().
myData <- read.csv(text = myCsv)
dim(myData)
[1] 1313 7
# Summarise every column of the data frame.
# NOTE(review): apply() converts the data frame to a matrix before calling
# summary(); the result recorded below lists every column as Class/Mode
# "character", so no numeric statistics are produced. summary(myData) would
# summarise each column according to its own type.
apply(myData, 2, summary)
X Name PClass Age Sex Survived SexCode
Length "1313" "1313" "1313" "1313" "1313" "1313" "1313"
Class "character" "character" "character" "character" "character" "character" "character"
Mode "character" "character" "character" "character" "character" "character" "character"
3. Chỉ dùng hàm cơ bản read.csv trong R
# read.csv() is given the URL directly, so no separate download step is used.
# header is spelled TRUE rather than T, because T is an ordinary variable
# that can be reassigned.
myData <- read.csv("https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/datasets/Titanic.csv", header = TRUE)
head(myData)
LS0tDQp0aXRsZTogIlThuqNpIGThu68gbGnhu4d1IHThu6sgaW50ZXJuZXQgdHJvbmcgUiINCmF1dGhvcjogIkN1b25nIFNhaSINCmRhdGU6ICcwMi8zLzIwMTgnDQpvdXRwdXQ6DQogIGh0bWxfbm90ZWJvb2s6IGRlZmF1bHQNCiAgd29yZF9kb2N1bWVudDogZGVmYXVsdA0KLS0tDQoNCiMjIFRyb25nIFIgY8OzIGPDoWMgY8OhY2ggc2F1IMSR4buDIHThuqNpIGThu68gbGnhu4d1IHThu6sgbmd14buTbiBpbnRlcm5ldCB24buBIGTDuW5nOg0KDQojIyAxLiBEw7luZyBkb3dubG9hZC5maWxlKCkNCg0KYGBge3IsIHdhcm5pbmc9RkFMU0UsIG1lc3NhZ2U9RkFMU0V9DQp0ZW1wb3JhcnlGaWxlIDwtIHRlbXBmaWxlKCkNCmRvd25sb2FkLmZpbGUoImh0dHBzOi8vcmF3LmdpdGh1YnVzZXJjb250ZW50LmNvbS92aW5jZW50YXJlbGJ1bmRvY2svUmRhdGFzZXRzL21hc3Rlci9jc3YvZGF0YXNldHMvQWlyUGFzc2VuZ2Vycy5jc3YiLCBkZXN0ZmlsZT10ZW1wb3JhcnlGaWxlKQ0KbXlEYXRhIDwtIHJlYWQuY3N2KHRlbXBvcmFyeUZpbGUpDQpoZWFkKG15RGF0YSkNCmFwcGx5KG15RGF0YSwgMiwgY2xhc3MpDQpgYGANCg0KIyMgMi4gRMO5bmcgcGFja2FnZSBSQ3VybA0KDQpgYGB7cn0NCmxpYnJhcnkoUkN1cmwpDQpteUNzdiA8LSBnZXRVUkwoImh0dHBzOi8vcmF3LmdpdGh1YnVzZXJjb250ZW50LmNvbS92aW5jZW50YXJlbGJ1bmRvY2svUmRhdGFzZXRzL21hc3Rlci9jc3YvZGF0YXNldHMvVGl0YW5pYy5jc3YiLCBzc2wudmVyaWZ5cGVlciA9IEZBTFNFKQ0KbXlEYXRhIDwtIHJlYWQuY3N2KHRleHRDb25uZWN0aW9uKG15Q3N2KSkNCmRpbShteURhdGEpDQphcHBseShteURhdGEsIDIsIHN1bW1hcnkpDQpgYGANCg0KIyMgMy4gQ2jhu4kgZMO5bmcgaMOgbSBjxqEgYuG6o24gcmVhZC5jc3YgdHJvbmcgUg0KDQpgYGB7cn0NCm15RGF0YSA8LSByZWFkLmNzdigiaHR0cHM6Ly9yYXcuZ2l0aHVidXNlcmNvbnRlbnQuY29tL3ZpbmNlbnRhcmVsYnVuZG9jay9SZGF0YXNldHMvbWFzdGVyL2Nzdi9kYXRhc2V0cy9UaXRhbmljLmNzdiIsIGhlYWRlcj1UKQ0KaGVhZChteURhdGEpDQpgYGANCg0KDQoNCg==