data set

Here are the two files: https://dl.dropboxusercontent.com/u/7710864/data/reviews-apr29.csv and https://dl.dropboxusercontent.com/u/7710864/data/solutions-apr29.csv

# Read both CSV files (paths are relative to the current working directory)
# and preview the first two rows of the reviews table.
reviews <- read.csv(file = "reviews-apr29.csv")
solutions <- read.csv(file = "solutions-apr29.csv")
head(reviews, n = 2)

##   id solution_id reviewer_id      start       stop time_left accept
## 1  1           3          27 1304095698 1304095758      1754      1
## 2  2           4          22 1304095188 1304095206      2306      1

# Preview the first two rows of the solutions table.
head(solutions, n = 2)

##   id problem_id subject_id      start       stop time_left answer
## 1  1        156         29 1304095119 1304095169      2343      B
## 2  2        269         25 1304095119 1304095183      2329      C

# List the column names of the reviews data frame.
colnames(reviews)

## [1] "id"          "solution_id" "reviewer_id" "start"       "stop"       
## [6] "time_left"   "accept"

Let's merge the two data sets, matching `solution_id` in the reviews to `id` in the solutions:

# Join reviews to solutions: reviews$solution_id is matched against
# solutions$id. all = TRUE keeps rows from either table that have no match
# (a full outer join), filling the missing side with NA.
mergeData <- merge(
  x = reviews,
  y = solutions,
  by.x = "solution_id",
  by.y = "id",
  all = TRUE
)

To find out which column names the two data sets have in common:

# Column names that appear in both data frames.
intersect(x = names(solutions), y = names(reviews))

## [1] "id"        "start"     "stop"      "time_left"

merge data sets

Abdul Baqi

Monday, November 24, 2014

data set