# Take an initial look at the raw tournament file before doing anything else.
# readLines() reads the text line by line and returns one string per line.
# Note: readLines() has no `skip` argument (a `skip=` value would be partially
# matched to `skipNul`), so every line is read, including the first dashed
# separator shown as element [1] below.
chess_reader <- readLines("https://raw.githubusercontent.com/Sangeetha-007/R-Practice/master/607/Projects/Project%201/tournamentinfo.txt")
## Warning in readLines("https://raw.githubusercontent.com/Sangeetha-007/R-
## Practice/master/607/Projects/Project%201/tournamentinfo.txt", : incomplete
## final line found on 'https://raw.githubusercontent.com/Sangeetha-007/R-Practice/
## master/607/Projects/Project%201/tournamentinfo.txt'
head(chess_reader)
## [1] "-----------------------------------------------------------------------------------------"
## [2] " Pair | Player Name |Total|Round|Round|Round|Round|Round|Round|Round| "
## [3] " Num | USCF ID / Rtg (Pre->Post) | Pts | 1 | 2 | 3 | 4 | 5 | 6 | 7 | "
## [4] "-----------------------------------------------------------------------------------------"
## [5] " 1 | GARY HUA |6.0 |W 39|W 21|W 18|W 14|W 7|D 12|D 4|"
## [6] " ON | 15445895 / R: 1794 ->1817 |N:2 |W |B |W |B |W |B |W |"
# readLines() produced a plain character vector.
class(chess_reader)
## [1] "character"
# Read the same file again, this time as a data frame. With header = TRUE the
# first line of the file becomes the column name; with header = FALSE it would
# be read in as the first row of data instead.
chess_data <- read.delim(
  header = TRUE,
  file = "https://raw.githubusercontent.com/Sangeetha-007/R-Practice/master/607/Projects/Project%201/tournamentinfo.txt"
)
class(chess_data)
## [1] "data.frame"
head(chess_data)
## X.........................................................................................
## 1 Pair | Player Name |Total|Round|Round|Round|Round|Round|Round|Round|
## 2 Num | USCF ID / Rtg (Pre->Post) | Pts | 1 | 2 | 3 | 4 | 5 | 6 | 7 |
## 3 -----------------------------------------------------------------------------------------
## 4 1 | GARY HUA |6.0 |W 39|W 21|W 18|W 14|W 7|D 12|D 4|
## 5 ON | 15445895 / R: 1794 ->1817 |N:2 |W |B |W |B |W |B |W |
## 6 -----------------------------------------------------------------------------------------
#getState <- str_extract_all(chess_data, "([A-Z][A-Z])\\s\\|")
# Probe how [row, column] indexing behaves on the one-column data frame.
# Column index 0 selects no columns, so only the row dimension survives.
chess_data[1, 0]
## data frame with 0 columns and 1 row
# Row 1 of column 1: the first line of column titles.
chess_data[1, 1]
## [1] " Pair | Player Name |Total|Round|Round|Round|Round|Round|Round|Round| "
# Row index 0 selects no rows.
chess_data[0, 1]
## character(0)
chess_data[2, 1]
## [1] " Num | USCF ID / Rtg (Pre->Post) | Pts | 1 | 2 | 3 | 4 | 5 | 6 | 7 | "
# There is no second column.
chess_data[1, 2]
## NULL
# Leaving the column index empty returns the whole row; with a single column
# the result is just that row's text.
chess_data[1, ]
## [1] " Pair | Player Name |Total|Round|Round|Round|Round|Round|Round|Round| "
chess_data[2, ]
## [1] " Num | USCF ID / Rtg (Pre->Post) | Pts | 1 | 2 | 3 | 4 | 5 | 6 | 7 | "
chess_data[3, ]
## [1] "-----------------------------------------------------------------------------------------"
# Rows 4 and 5 together describe the first player.
chess_data[4, ]
## [1] " 1 | GARY HUA |6.0 |W 39|W 21|W 18|W 14|W 7|D 12|D 4|"
chess_data[5, ]
## [1] " ON | 15445895 / R: 1794 ->1817 |N:2 |W |B |W |B |W |B |W |"
class(chess_data[5, ])
## [1] "character"
# Removing the header
# Drop rows 1 and 2 (the two column-title lines). chess_data has a single
# column, so the subset collapses to a character vector.
newChessData <- chess_data[-(1:2), ]
class(newChessData)
## [1] "character"
head(newChessData, n = 100)
## [1] "-----------------------------------------------------------------------------------------"
## [2] " 1 | GARY HUA |6.0 |W 39|W 21|W 18|W 14|W 7|D 12|D 4|"
## [3] " ON | 15445895 / R: 1794 ->1817 |N:2 |W |B |W |B |W |B |W |"
## [4] "-----------------------------------------------------------------------------------------"
## [5] " 2 | DAKSHESH DARURI |6.0 |W 63|W 58|L 4|W 17|W 16|W 20|W 7|"
## [6] " MI | 14598900 / R: 1553 ->1663 |N:2 |B |W |B |W |B |W |B |"
## [7] "-----------------------------------------------------------------------------------------"
## [8] " 3 | ADITYA BAJAJ |6.0 |L 8|W 61|W 25|W 21|W 11|W 13|W 12|"
## [9] " MI | 14959604 / R: 1384 ->1640 |N:2 |W |B |W |B |W |B |W |"
## [10] "-----------------------------------------------------------------------------------------"
## [11] " 4 | PATRICK H SCHILLING |5.5 |W 23|D 28|W 2|W 26|D 5|W 19|D 1|"
## [12] " MI | 12616049 / R: 1716 ->1744 |N:2 |W |B |W |B |W |B |B |"
## [13] "-----------------------------------------------------------------------------------------"
## [14] " 5 | HANSHI ZUO |5.5 |W 45|W 37|D 12|D 13|D 4|W 14|W 17|"
## [15] " MI | 14601533 / R: 1655 ->1690 |N:2 |B |W |B |W |B |W |B |"
## [16] "-----------------------------------------------------------------------------------------"
## [17] " 6 | HANSEN SONG |5.0 |W 34|D 29|L 11|W 35|D 10|W 27|W 21|"
## [18] " OH | 15055204 / R: 1686 ->1687 |N:3 |W |B |W |B |B |W |B |"
## [19] "-----------------------------------------------------------------------------------------"
## [20] " 7 | GARY DEE SWATHELL |5.0 |W 57|W 46|W 13|W 11|L 1|W 9|L 2|"
## [21] " MI | 11146376 / R: 1649 ->1673 |N:3 |W |B |W |B |B |W |W |"
## [22] "-----------------------------------------------------------------------------------------"
## [23] " 8 | EZEKIEL HOUGHTON |5.0 |W 3|W 32|L 14|L 9|W 47|W 28|W 19|"
## [24] " MI | 15142253 / R: 1641P17->1657P24 |N:3 |B |W |B |W |B |W |W |"
## [25] "-----------------------------------------------------------------------------------------"
## [26] " 9 | STEFANO LEE |5.0 |W 25|L 18|W 59|W 8|W 26|L 7|W 20|"
## [27] " ON | 14954524 / R: 1411 ->1564 |N:2 |W |B |W |B |W |B |B |"
## [28] "-----------------------------------------------------------------------------------------"
## [29] " 10 | ANVIT RAO |5.0 |D 16|L 19|W 55|W 31|D 6|W 25|W 18|"
## [30] " MI | 14150362 / R: 1365 ->1544 |N:3 |W |W |B |B |W |B |W |"
## [31] "-----------------------------------------------------------------------------------------"
## [32] " 11 | CAMERON WILLIAM MC LEMAN |4.5 |D 38|W 56|W 6|L 7|L 3|W 34|W 26|"
## [33] " MI | 12581589 / R: 1712 ->1696 |N:3 |B |W |B |W |B |W |B |"
## [34] "-----------------------------------------------------------------------------------------"
## [35] " 12 | KENNETH J TACK |4.5 |W 42|W 33|D 5|W 38|H |D 1|L 3|"
## [36] " MI | 12681257 / R: 1663 ->1670 |N:3 |W |B |W |B | |W |B |"
## [37] "-----------------------------------------------------------------------------------------"
## [38] " 13 | TORRANCE HENRY JR |4.5 |W 36|W 27|L 7|D 5|W 33|L 3|W 32|"
## [39] " MI | 15082995 / R: 1666 ->1662 |N:3 |B |W |B |B |W |W |B |"
## [40] "-----------------------------------------------------------------------------------------"
## [41] " 14 | BRADLEY SHAW |4.5 |W 54|W 44|W 8|L 1|D 27|L 5|W 31|"
## [42] " MI | 10131499 / R: 1610 ->1618 |N:3 |W |B |W |W |B |B |W |"
## [43] "-----------------------------------------------------------------------------------------"
## [44] " 15 | ZACHARY JAMES HOUGHTON |4.5 |D 19|L 16|W 30|L 22|W 54|W 33|W 38|"
## [45] " MI | 15619130 / R: 1220P13->1416P20 |N:3 |B |B |W |W |B |B |W |"
## [46] "-----------------------------------------------------------------------------------------"
## [47] " 16 | MIKE NIKITIN |4.0 |D 10|W 15|H |W 39|L 2|W 36|U |"
## [48] " MI | 10295068 / R: 1604 ->1613 |N:3 |B |W | |B |W |B | |"
## [49] "-----------------------------------------------------------------------------------------"
## [50] " 17 | RONALD GRZEGORCZYK |4.0 |W 48|W 41|L 26|L 2|W 23|W 22|L 5|"
## [51] " MI | 10297702 / R: 1629 ->1610 |N:3 |W |B |W |B |W |B |W |"
## [52] "-----------------------------------------------------------------------------------------"
## [53] " 18 | DAVID SUNDEEN |4.0 |W 47|W 9|L 1|W 32|L 19|W 38|L 10|"
## [54] " MI | 11342094 / R: 1600 ->1600 |N:3 |B |W |B |W |B |W |B |"
## [55] "-----------------------------------------------------------------------------------------"
## [56] " 19 | DIPANKAR ROY |4.0 |D 15|W 10|W 52|D 28|W 18|L 4|L 8|"
## [57] " MI | 14862333 / R: 1564 ->1570 |N:3 |W |B |W |B |W |W |B |"
## [58] "-----------------------------------------------------------------------------------------"
## [59] " 20 | JASON ZHENG |4.0 |L 40|W 49|W 23|W 41|W 28|L 2|L 9|"
## [60] " MI | 14529060 / R: 1595 ->1569 |N:4 |W |B |W |B |W |B |W |"
## [61] "-----------------------------------------------------------------------------------------"
## [62] " 21 | DINH DANG BUI |4.0 |W 43|L 1|W 47|L 3|W 40|W 39|L 6|"
## [63] " ON | 15495066 / R: 1563P22->1562 |N:3 |B |W |B |W |W |B |W |"
## [64] "-----------------------------------------------------------------------------------------"
## [65] " 22 | EUGENE L MCCLURE |4.0 |W 64|D 52|L 28|W 15|H |L 17|W 40|"
## [66] " MI | 12405534 / R: 1555 ->1529 |N:4 |W |B |W |B | |W |B |"
## [67] "-----------------------------------------------------------------------------------------"
## [68] " 23 | ALAN BUI |4.0 |L 4|W 43|L 20|W 58|L 17|W 37|W 46|"
## [69] " ON | 15030142 / R: 1363 ->1371 | |B |W |B |W |B |W |B |"
## [70] "-----------------------------------------------------------------------------------------"
## [71] " 24 | MICHAEL R ALDRICH |4.0 |L 28|L 47|W 43|L 25|W 60|W 44|W 39|"
## [72] " MI | 13469010 / R: 1229 ->1300 |N:4 |B |W |B |B |W |W |B |"
## [73] "-----------------------------------------------------------------------------------------"
## [74] " 25 | LOREN SCHWIEBERT |3.5 |L 9|W 53|L 3|W 24|D 34|L 10|W 47|"
## [75] " MI | 12486656 / R: 1745 ->1681 |N:4 |B |W |B |W |B |W |B |"
## [76] "-----------------------------------------------------------------------------------------"
## [77] " 26 | MAX ZHU |3.5 |W 49|W 40|W 17|L 4|L 9|D 32|L 11|"
## [78] " ON | 15131520 / R: 1579 ->1564 |N:4 |B |W |B |W |B |W |W |"
## [79] "-----------------------------------------------------------------------------------------"
## [80] " 27 | GAURAV GIDWANI |3.5 |W 51|L 13|W 46|W 37|D 14|L 6|U |"
## [81] " MI | 14476567 / R: 1552 ->1539 |N:4 |W |B |W |B |W |B | |"
## [82] "-----------------------------------------------------------------------------------------"
## [83] " 28 | SOFIA ADINA STANESCU-BELLU |3.5 |W 24|D 4|W 22|D 19|L 20|L 8|D 36|"
## [84] " MI | 14882954 / R: 1507 ->1513 |N:3 |W |W |B |W |B |B |W |"
## [85] "-----------------------------------------------------------------------------------------"
## [86] " 29 | CHIEDOZIE OKORIE |3.5 |W 50|D 6|L 38|L 34|W 52|W 48|U |"
## [87] " MI | 15323285 / R: 1602P6 ->1508P12 |N:4 |B |W |B |W |W |B | |"
## [88] "-----------------------------------------------------------------------------------------"
## [89] " 30 | GEORGE AVERY JONES |3.5 |L 52|D 64|L 15|W 55|L 31|W 61|W 50|"
## [90] " ON | 12577178 / R: 1522 ->1444 | |W |B |B |W |W |B |B |"
## [91] "-----------------------------------------------------------------------------------------"
## [92] " 31 | RISHI SHETTY |3.5 |L 58|D 55|W 64|L 10|W 30|W 50|L 14|"
## [93] " MI | 15131618 / R: 1494 ->1444 | |B |W |B |W |B |W |B |"
## [94] "-----------------------------------------------------------------------------------------"
## [95] " 32 | JOSHUA PHILIP MATHEWS |3.5 |W 61|L 8|W 44|L 18|W 51|D 26|L 13|"
## [96] " ON | 14073750 / R: 1441 ->1433 |N:4 |W |B |W |B |W |B |W |"
## [97] "-----------------------------------------------------------------------------------------"
## [98] " 33 | JADE GE |3.5 |W 60|L 12|W 50|D 36|L 13|L 15|W 51|"
## [99] " MI | 14691842 / R: 1449 ->1421 | |B |W |B |W |B |W |B |"
## [100] "-----------------------------------------------------------------------------------------"
# Earlier attempts, kept for reference:
#([A-Z])\w+
#players <- str_extract_all(chess_data, "([A-Z])\\w+", simplify=TRUE)
#players <- unlist(players)
#print(players)
#playersNew <-str_extract_all(players, "([A-Z][A-Z])\\s\\|")
#print(playersNew)
# Extract every run of upper-case words, each word preceded by a space or a
# hyphen.
# NOTE(review): chess_data is a data frame rather than a character vector, so
# stringr coerces it before matching (see the warning below).
# The pattern is not specific to the name column: as the output below shows, it
# also captures header fragments (" P", " N", " USCF ID"), the two-letter state
# codes and the " R" of every rating entry.
playersName <- str_extract_all(chess_data, "(\\s[A-Z]+\\s[A-Z]+)?((\\s|-)[A-Z]+)?(\\s|-)[A-Z]+", simplify=TRUE)
## Warning in stri_extract_all_regex(string, pattern, simplify = simplify, :
## argument is not an atomic vector; coercing
# Discard any row of the match matrix whose entries are all empty strings.
playersName <- playersName[!apply(playersName == "", 1, all), ]
playersName
## [1] " P" " P"
## [3] " N" " N"
## [5] " USCF ID" " R"
## [7] " P" " GARY HUA"
## [9] " ON" " R"
## [11] " DAKSHESH DARURI" " MI"
## [13] " R" " ADITYA BAJAJ"
## [15] " MI" " R"
## [17] " PATRICK H SCHILLING" " MI"
## [19] " R" " HANSHI ZUO"
## [21] " MI" " R"
## [23] " HANSEN SONG" " OH"
## [25] " R" " GARY DEE SWATHELL"
## [27] " MI" " R"
## [29] " EZEKIEL HOUGHTON" " MI"
## [31] " R" " STEFANO LEE"
## [33] " ON" " R"
## [35] " ANVIT RAO" " MI"
## [37] " R" " CAMERON WILLIAM MC LEMAN"
## [39] " MI" " R"
## [41] " KENNETH J TACK" " MI"
## [43] " R" " TORRANCE HENRY JR"
## [45] " MI" " R"
## [47] " BRADLEY SHAW" " MI"
## [49] " R" " ZACHARY JAMES HOUGHTON"
## [51] " MI" " R"
## [53] " MIKE NIKITIN" " MI"
## [55] " R" " RONALD GRZEGORCZYK"
## [57] " MI" " R"
## [59] " DAVID SUNDEEN" " MI"
## [61] " R" " DIPANKAR ROY"
## [63] " MI" " R"
## [65] " JASON ZHENG" " MI"
## [67] " R" " DINH DANG BUI"
## [69] " ON" " R"
## [71] " EUGENE L MCCLURE" " MI"
## [73] " R" " ALAN BUI"
## [75] " ON" " R"
## [77] " MICHAEL R ALDRICH" " MI"
## [79] " R" " LOREN SCHWIEBERT"
## [81] " MI" " R"
## [83] " MAX ZHU" " ON"
## [85] " R" " GAURAV GIDWANI"
## [87] " MI" " R"
## [89] " SOFIA ADINA STANESCU-BELLU" " MI"
## [91] " R" " CHIEDOZIE OKORIE"
## [93] " MI" " R"
## [95] " GEORGE AVERY JONES" " ON"
## [97] " R" " RISHI SHETTY"
## [99] " MI" " R"
## [101] " JOSHUA PHILIP MATHEWS" " ON"
## [103] " R" " JADE GE"
## [105] " MI" " R"
## [107] " MICHAEL JEFFERY THOMAS" " MI"
## [109] " R" " JOSHUA DAVID LEE"
## [111] " MI" " R"
## [113] " SIDDHARTH JHA" " MI"
## [115] " R" " AMIYATOSH PWNANANDAM"
## [117] " MI" " R"
## [119] " BRIAN LIU" " MI"
## [121] " R" " JOEL R HENDON"
## [123] " MI" " R"
## [125] " FOREST ZHANG" " MI"
## [127] " R" " KYLE WILLIAM MURPHY"
## [129] " MI" " R"
## [131] " JARED GE" " MI"
## [133] " R" " ROBERT GLEN VASEY"
## [135] " MI" " R"
## [137] " JUSTIN D SCHILLING" " MI"
## [139] " R" " DEREK YAN"
## [141] " MI" " R"
## [143] " JACOB ALEXANDER LAVALLEY" " MI"
## [145] " R" " ERIC WRIGHT"
## [147] " MI" " R"
## [149] " DANIEL KHAIN" " MI"
## [151] " R" " MICHAEL J MARTIN"
## [153] " MI" " R"
## [155] " SHIVAM JHA" " MI"
## [157] " R" " TEJAS AYYAGARI"
## [159] " MI" " R"
## [161] " ETHAN GUO" " MI"
## [163] " R" " JOSE C YBARRA"
## [165] " MI" " R"
## [167] " LARRY HODGE" " MI"
## [169] " R" " ALEX KONG"
## [171] " MI" " R"
## [173] " MARISA RICCI" " MI"
## [175] " R" " MICHAEL LU"
## [177] " MI" " R"
## [179] " VIRAJ MOHILE" " MI"
## [181] " R" " SEAN M MC CORMICK"
## [183] " MI" " R"
## [185] " JULIA SHEN" " MI"
## [187] " R" " JEZZEL FARKAS"
## [189] " ON" " R"
## [191] " ASHWIN BALAJI" " MI"
## [193] " R" " THOMAS JOSEPH HOSMER"
## [195] " MI" " R"
## [197] " BEN LI" " MI"
## [199] " R"
# Two-letter state/province code at the start of each player's second row
# (e.g. " ON | 15445895 / R: ...").
# Search the text column itself (chess_data[[1]]) instead of the whole data
# frame, so stringr does not have to coerce its input, and use a look-ahead for
# the " |" delimiter so that only the code itself is kept.
playersState <- unlist(str_extract_all(chess_data[[1]], "[A-Z][A-Z](?=\\s\\|)"))
playersState
## [1] "ON" "MI" "MI" "MI" "MI" "OH" "MI" "MI" "ON" "MI" "MI" "MI" "MI" "MI" "MI"
## [16] "MI" "MI" "MI" "MI" "MI" "ON" "MI" "ON" "MI" "MI" "ON" "MI" "MI" "MI" "ON"
## [31] "MI" "ON" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI"
## [46] "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI" "MI"
## [61] "ON" "MI" "MI" "MI"
# Total points per player: the "digit.digit" field (e.g. "6.0") on each
# player's first row.
# Match against the text column (chess_data[[1]]) rather than the data frame so
# that stringr receives a character vector and does not need to coerce it;
# unlist() flattens the per-line matches into one vector and drops lines
# without a match.
gamePoints <- unlist(str_extract_all(chess_data[[1]], "\\d\\.\\d"))
gamePoints
## [1] "6.0" "6.0" "6.0" "5.5" "5.5" "5.0" "5.0" "5.0" "5.0" "5.0" "4.5" "4.5"
## [13] "4.5" "4.5" "4.5" "4.0" "4.0" "4.0" "4.0" "4.0" "4.0" "4.0" "4.0" "4.0"
## [25] "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5" "3.5"
## [37] "3.5" "3.0" "3.0" "3.0" "3.0" "3.0" "3.0" "3.0" "3.0" "3.0" "2.5" "2.5"
## [49] "2.5" "2.5" "2.5" "2.5" "2.0" "2.0" "2.0" "2.0" "2.0" "2.0" "2.0" "1.5"
## [61] "1.5" "1.0" "1.0" "1.0"
class(playersName)
## [1] "character"
# The upper-case regex pass above mixes real names with header words, state
# codes and "R" markers. Removing those as substrings (str_remove(x, "R"),
# str_remove(x, "N"), ...) also deletes the same letters from inside real
# names ("GARY HUA" becomes "GAY HUA"), so the names are read straight from
# the raw rows instead:
#   * a player's first row starts with the pair number followed by "|";
#   * the name is the second "|"-delimited field of that row.
chess_lines <- chess_data[[1]]
is_name_row <- grepl("^\\s*\\d+\\s*\\|", chess_lines)
name_fields <- strsplit(chess_lines[is_name_row], "|", fixed = TRUE)
# vapply() guarantees exactly one string per player; trimws() removes the
# padding around each name.
playersName <- trimws(
  vapply(name_fields, function(fields) fields[2], character(1))
)
playersName
## [1] "GARY HUA" "DAKSHESH DARURI"
## [3] "ADITYA BAJAJ" "PATRICK H SCHILLING"
## [5] "HANSHI ZUO" "HANSEN SONG"
## [7] "GARY DEE SWATHELL" "EZEKIEL HOUGHTON"
## [9] "STEFANO LEE" "ANVIT RAO"
## [11] "CAMERON WILLIAM MC LEMAN" "KENNETH J TACK"
## [13] "TORRANCE HENRY JR" "BRADLEY SHAW"
## [15] "ZACHARY JAMES HOUGHTON" "MIKE NIKITIN"
## [17] "RONALD GRZEGORCZYK" "DAVID SUNDEEN"
## [19] "DIPANKAR ROY" "JASON ZHENG"
## [21] "DINH DANG BUI" "EUGENE L MCCLURE"
## [23] "ALAN BUI" "MICHAEL R ALDRICH"
## [25] "LOREN SCHWIEBERT" "MAX ZHU"
## [27] "GAURAV GIDWANI" "SOFIA ADINA STANESCU-BELLU"
## [29] "CHIEDOZIE OKORIE" "GEORGE AVERY JONES"
## [31] "RISHI SHETTY" "JOSHUA PHILIP MATHEWS"
## [33] "JADE GE" "MICHAEL JEFFERY THOMAS"
## [35] "JOSHUA DAVID LEE" "SIDDHARTH JHA"
## [37] "AMIYATOSH PWNANANDAM" "BRIAN LIU"
## [39] "JOEL R HENDON" "FOREST ZHANG"
## [41] "KYLE WILLIAM MURPHY" "JARED GE"
## [43] "ROBERT GLEN VASEY" "JUSTIN D SCHILLING"
## [45] "DEREK YAN" "JACOB ALEXANDER LAVALLEY"
## [47] "ERIC WRIGHT" "DANIEL KHAIN"
## [49] "MICHAEL J MARTIN" "SHIVAM JHA"
## [51] "TEJAS AYYAGARI" "ETHAN GUO"
## [53] "JOSE C YBARRA" "LARRY HODGE"
## [55] "ALEX KONG" "MARISA RICCI"
## [57] "MICHAEL LU" "VIRAJ MOHILE"
## [59] "SEAN M MC CORMICK" "JULIA SHEN"
## [61] "JEZZEL FARKAS" "ASHWIN BALAJI"
## [63] "THOMAS JOSEPH HOSMER" "BEN LI"
# Sanity check: the three vectors must have the same length (one entry per
# player, 64 here) so that they line up row by row when they are combined into
# a data frame.
length(playersName)
## [1] 64
length(playersState)
## [1] 64
length(gamePoints)
## [1] 64
# Capture "R", any one character, whitespace and the first run of digits, i.e.
# the pre-tournament rating that precedes "->". A provisional suffix such as
# the "P17" in "1641P17" is not part of the match (see element [8] below).
# NOTE(review): chess_data is a data frame, so stringr coerces it before
# matching (see the warning below); all 64 matches end up in row 1 of the
# resulting matrix.
PlayerPreRating <- str_extract_all(chess_data, "R.\\s+\\d+", simplify=TRUE)
## Warning in stri_extract_all_regex(string, pattern, simplify = simplify, :
## argument is not an atomic vector; coercing
print(PlayerPreRating[1,])
## [1] "R: 1794" "R: 1553" "R: 1384" "R: 1716" "R: 1655" "R: 1686" "R: 1649"
## [8] "R: 1641" "R: 1411" "R: 1365" "R: 1712" "R: 1663" "R: 1666" "R: 1610"
## [15] "R: 1220" "R: 1604" "R: 1629" "R: 1600" "R: 1564" "R: 1595" "R: 1563"
## [22] "R: 1555" "R: 1363" "R: 1229" "R: 1745" "R: 1579" "R: 1552" "R: 1507"
## [29] "R: 1602" "R: 1522" "R: 1494" "R: 1441" "R: 1449" "R: 1399" "R: 1438"
## [36] "R: 1355" "R: 980" "R: 1423" "R: 1436" "R: 1348" "R: 1403" "R: 1332"
## [43] "R: 1283" "R: 1199" "R: 1242" "R: 377" "R: 1362" "R: 1382" "R: 1291"
## [50] "R: 1056" "R: 1011" "R: 935" "R: 1393" "R: 1270" "R: 1186" "R: 1153"
## [57] "R: 1092" "R: 917" "R: 853" "R: 967" "R: 955" "R: 1530" "R: 1175"
## [64] "R: 1163"
class(PlayerPreRating)
## [1] "matrix" "array"
# Abandoned attempt: the matrix still holds text such as "R: 1794" at this
# point, not numbers.
#rowMeans: Form Row Sums and Means
#meanOfRow <- rowMeans(PlayerPreRating, na.rm = TRUE , dims=1 )
# na. rm = TRUE to exclude missing values
#meanOfRow
# Convert the 1 x 64 matrix into a data frame with one row and 64 columns
# (V1 ... V64, as printed by head() below).
PlayerPreRating <- as.data.frame(PlayerPreRating)
class(PlayerPreRating)
## [1] "data.frame"
head(PlayerPreRating)
## V1 V2 V3 V4 V5 V6 V7 V8 V9
## 1 R: 1794 R: 1553 R: 1384 R: 1716 R: 1655 R: 1686 R: 1649 R: 1641 R: 1411
## V10 V11 V12 V13 V14 V15 V16 V17 V18
## 1 R: 1365 R: 1712 R: 1663 R: 1666 R: 1610 R: 1220 R: 1604 R: 1629 R: 1600
## V19 V20 V21 V22 V23 V24 V25 V26 V27
## 1 R: 1564 R: 1595 R: 1563 R: 1555 R: 1363 R: 1229 R: 1745 R: 1579 R: 1552
## V28 V29 V30 V31 V32 V33 V34 V35 V36
## 1 R: 1507 R: 1602 R: 1522 R: 1494 R: 1441 R: 1449 R: 1399 R: 1438 R: 1355
## V37 V38 V39 V40 V41 V42 V43 V44 V45
## 1 R: 980 R: 1423 R: 1436 R: 1348 R: 1403 R: 1332 R: 1283 R: 1199 R: 1242
## V46 V47 V48 V49 V50 V51 V52 V53 V54
## 1 R: 377 R: 1362 R: 1382 R: 1291 R: 1056 R: 1011 R: 935 R: 1393 R: 1270
## V55 V56 V57 V58 V59 V60 V61 V62 V63
## 1 R: 1186 R: 1153 R: 1092 R: 917 R: 853 R: 967 R: 955 R: 1530 R: 1175
## V64
## 1 R: 1163
#meanOfRow <- rowMeans(PlayerPreRating)
# Cut the numeric part out of each "R: 1794"-style string by fixed character
# positions 3 to 7.
# NOTE(review): PlayerPreRating is a one-row data frame here, not a character
# vector; per the output below, substring() returns one string per column.
subs<-substring(PlayerPreRating,3,7)
print(subs)
## [1] " 1794" " 1553" " 1384" " 1716" " 1655" " 1686" " 1649" " 1641" " 1411"
## [10] " 1365" " 1712" " 1663" " 1666" " 1610" " 1220" " 1604" " 1629" " 1600"
## [19] " 1564" " 1595" " 1563" " 1555" " 1363" " 1229" " 1745" " 1579" " 1552"
## [28] " 1507" " 1602" " 1522" " 1494" " 1441" " 1449" " 1399" " 1438" " 1355"
## [37] " 980" " 1423" " 1436" " 1348" " 1403" " 1332" " 1283" " 1199" " 1242"
## [46] " 377" " 1362" " 1382" " 1291" " 1056" " 1011" " 935" " 1393" " 1270"
## [55] " 1186" " 1153" " 1092" " 917" " 853" " 967" " 955" " 1530" " 1175"
## [64] " 1163"
# The first two characters of each match (always "R:"). Printed as a check
# only; no later statement shown here uses `beg`.
beg <-substring(PlayerPreRating,0, 2)
print(beg)
## [1] "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:"
## [16] "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:"
## [31] "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:"
## [46] "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:" "R:"
## [61] "R:" "R:" "R:" "R:"
# Convert the rating strings to integers; the leading blank is ignored, as the
# output below shows.
newSubs<-as.integer(subs)
print(newSubs)
## [1] 1794 1553 1384 1716 1655 1686 1649 1641 1411 1365 1712 1663 1666 1610 1220
## [16] 1604 1629 1600 1564 1595 1563 1555 1363 1229 1745 1579 1552 1507 1602 1522
## [31] 1494 1441 1449 1399 1438 1355 980 1423 1436 1348 1403 1332 1283 1199 1242
## [46] 377 1362 1382 1291 1056 1011 935 1393 1270 1186 1153 1092 917 853 967
## [61] 955 1530 1175 1163
class(newSubs)
## [1] "integer"
# Wrap the integer vector in a data frame with a single column so that
# rowMeans() accepts it.
newSubs<- as.data.frame(newSubs)
class(newSubs)
## [1] "data.frame"
# NOTE(review): with only one column, the mean of each row is that row's own
# value, so the result printed below is identical to newSubs. PreChessRating
# therefore holds each player's own pre-tournament rating, not an average over
# opponents.
PreChessRating <- rowMeans(newSubs, na.rm = TRUE , dims=1 )
print(PreChessRating)
## [1] 1794 1553 1384 1716 1655 1686 1649 1641 1411 1365 1712 1663 1666 1610 1220
## [16] 1604 1629 1600 1564 1595 1563 1555 1363 1229 1745 1579 1552 1507 1602 1522
## [31] 1494 1441 1449 1399 1438 1355 980 1423 1436 1348 1403 1332 1283 1199 1242
## [46] 377 1362 1382 1291 1056 1011 935 1393 1270 1186 1153 1092 917 853 967
## [61] 955 1530 1175 1163
#meanOfRow <- rowMeans(PlayerPreRating)
# Author's note: I am a bit confused about the approach for the average
# pre-tournament chess rating. I tried different things, but I am out of time
# as well.
# Combine the per-player vectors into one table, one row per player.
chessInfo <- data.frame(playersName, playersState, gamePoints, PreChessRating)
head(chessInfo)
## playersName playersState gamePoints PreChessRating
## 1 GAY HUA ON | 6.0 1794
## 2 DAKSHESH DAURI MI | 6.0 1553
## 3 ADITYA BAJAJ MI | 6.0 1384
## 4 ATICK H SCHILLIG MI | 5.5 1716
## 5 HASHI ZUO MI | 5.5 1655
## 6 HASEN SG OH | 5.0 1686
# Write the table to the current user's Downloads folder. The path is built
# from the home directory instead of a hard-coded "/Users/<name>/..." string,
# so the script also runs on machines other than the author's.
write.csv(
  chessInfo,
  file = file.path(path.expand("~"), "Downloads", "ChessGameNumbers.csv")
)