benchmark different formats

sparsity (zero-value rate)

dt[, unique(sparsity), by = list(nCells, beta_value)]
##     nCells             beta_value        V1
##  1:   1000 alpha = 0.1 beta = 0.8 0.9225260
##  2:   4000 alpha = 0.1 beta = 0.8 0.9243426
##  3:   7000 alpha = 0.1 beta = 0.8 0.9227970
##  4:  20000 alpha = 0.1 beta = 0.8 0.9229823
##  5:  50000 alpha = 0.1 beta = 0.8 0.9224632
##  6:   1000 alpha = 0.2 beta = 0.9 0.8730451
##  7:   4000 alpha = 0.2 beta = 0.9 0.8713663
##  8:   7000 alpha = 0.2 beta = 0.9 0.8717319
##  9:  20000 alpha = 0.2 beta = 0.9 0.8719348
## 10:  50000 alpha = 0.2 beta = 0.9 0.8712112
## 11:   1000 alpha = 0.3 beta = 0.7 0.7897353
## 12:   4000 alpha = 0.3 beta = 0.7 0.7927173
## 13:   7000 alpha = 0.3 beta = 0.7 0.7883399
## 14:  20000 alpha = 0.3 beta = 0.7 0.7883345
## 15:  50000 alpha = 0.3 beta = 0.7 0.7901626
## 16:   1000 alpha = 0.4 beta = 0.6 0.7195631
## 17:   4000 alpha = 0.4 beta = 0.6 0.7213056
## 18:   7000 alpha = 0.4 beta = 0.6 0.7199958
## 19:  20000 alpha = 0.4 beta = 0.6 0.7184199
## 20:  50000 alpha = 0.4 beta = 0.6 0.7190410

plot the result

ggplot(dt, aes(y = time, x = nCells, color = format)) + geom_line() + geom_point() + facet_grid(slicing~beta_value, scales ="free") + ylab("time (ms)") + scale_x_continuous(breaks = nCellsVec) + ggtitle("time") + scale_y_log10()

ggplot(dt[format != "H5(chunked.read)"], aes(x = nCells, y = size, color = format)) + geom_line() + geom_point() + facet_wrap(~beta_value) + ylab("size (GB)") + scale_x_continuous(breaks = nCellsVec) + ggtitle("space")