diff --git a/.Rbuildignore b/.Rbuildignore index c05278e2..5c5d5b95 100644 --- a/.Rbuildignore +++ b/.Rbuildignore @@ -64,4 +64,5 @@ vignettes.asis.template vignettes.Rnw.template ^codecov\.yml$ new-nse-dev.r -test-poorman.R \ No newline at end of file +test-poorman.R +*.parquet \ No newline at end of file diff --git a/CRAN-RELEASE b/CRAN-RELEASE index f72236de..48d603de 100644 --- a/CRAN-RELEASE +++ b/CRAN-RELEASE @@ -1,2 +1,2 @@ -This package was submitted to CRAN on 2021-02-13. -Once it is accepted, delete this file and tag the release (commit f7dd3db). +This package was submitted to CRAN on 2021-03-12. +Once it is accepted, delete this file and tag the release (commit 34bafaa). diff --git a/DESCRIPTION b/DESCRIPTION index a9207fc2..0f848ee8 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,8 +1,8 @@ Type: Package Package: disk.frame Title: Larger-than-RAM Disk-Based Data Manipulation Framework -Version: 0.4.0 -Date: 2021-02-11 +Version: 0.5.0 +Date: 2021-05-09 Authors@R: c( person("Dai", "ZJ", email = "zhuojia.dai@gmail.com", role = c("aut", "cre")), person("Jacky", "Poon", role = c("ctb")) diff --git a/NAMESPACE b/NAMESPACE index 51fa7439..da78d075 100644 --- a/NAMESPACE +++ b/NAMESPACE @@ -67,7 +67,6 @@ S3method(transmute,disk.frame) export(IQR_df.chunk_agg.disk.frame) export(IQR_df.collected_agg.disk.frame) export(add_chunk) -export(add_count.disk.frame) export(add_tally.disk.frame) export(all_df.chunk_agg.disk.frame) export(all_df.collected_agg.disk.frame) @@ -176,7 +175,6 @@ importFrom(data.table,setDT) importFrom(data.table,setkey) importFrom(data.table,setkeyv) importFrom(data.table,timetaken) -importFrom(dplyr,add_count) importFrom(dplyr,add_tally) importFrom(dplyr,anti_join) importFrom(dplyr,arrange) diff --git a/NEWS.md b/NEWS.md index f06cc6e6..088222ce 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,3 +1,9 @@ +# disk.frame 0.5 +* removed `add_count` method + +# disk.frame 0.4.1 +* removed use of `sysctl` which was violating CRAN policy + # disk.frame 0.4.0 
* Removed `count` and `tally` * Fixed package compatibility diff --git a/R/dplyr_verbs.r b/R/dplyr_verbs.r index e92e678d..75be5774 100644 --- a/R/dplyr_verbs.r +++ b/R/dplyr_verbs.r @@ -70,10 +70,10 @@ chunk_arrange <- create_chunk_mapper(dplyr::arrange) # TODO alot of these .disk.frame functions are not generic -#' @export -#' @importFrom dplyr add_count -#' @rdname dplyr_verbs -add_count.disk.frame <- create_chunk_mapper(dplyr::add_count) +#' #' @export +#' #' @importFrom dplyr add_count +#' #' @rdname dplyr_verbs +#' add_count.disk.frame <- create_chunk_mapper(dplyr::add_count) #' @export diff --git a/R/recommend_nchunks.r b/R/recommend_nchunks.r index 8d77e1f5..e5be6ac0 100644 --- a/R/recommend_nchunks.r +++ b/R/recommend_nchunks.r @@ -91,16 +91,18 @@ df_ram_size <- function() { } } } else { - os = R.version$os - if (length(grep("^darwin", os))) { - a = substring(system("sysctl hw.memsize", intern = TRUE), 13) - } #else { + #os = R.version$os + #if (length(grep("^darwin", os))) { + #a = substring(system("sysctl hw.memsize", intern = TRUE), 13) + # the above is not allowed by CRAN + #} #else { # This would work but is not allowed by CRAN #a = system('grep MemTotal /proc/meminfo', intern = TRUE) #} - l = strsplit(a, " ")[[1]] - l = as.numeric(l[length(l)-1]) - ram_size = l/1024^2 + #l = strsplit(a, " ")[[1]] + #l = as.numeric(l[length(l)-1]) + #ram_size = l/1024^2 + ram_size = 16 # to be conservative } if(is.null(ram_size)) { diff --git a/README.Rmd b/README.Rmd index 06bd5fa8..e5d8beaf 100644 --- a/README.Rmd +++ b/README.Rmd @@ -250,7 +250,7 @@ ncol(flights.df) ## Hex logo -![disk.frame logo](inst/figures/logo.png?raw=true) +![disk.frame logo](inst/figures/logo.png) ## Contributors @@ -283,6 +283,7 @@ The work priorities at this stage are | [深入对比数据科学工具箱:Python3 和 R 之争(2020版)](https://segmentfault.com/a/1190000021653567) | Chinese | Harry Zhu | 2020-02-16 | Mentions disk.frame | + ### Interested in learning `{disk.frame}` in a structured course? 
Please register your interest at: diff --git a/README.md b/README.md index 751b0a66..8b8b1af9 100644 --- a/README.md +++ b/README.md @@ -211,15 +211,12 @@ flights.df %>% filter(year == 2013) %>% mutate(origin_dest = paste0(origin, dest)) %>% head(2) -#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay -#> 1 2013 1 1 517 515 2 830 819 11 -#> 2 2013 1 1 533 529 4 850 830 20 -#> carrier flight tailnum origin dest air_time distance hour minute time_hour -#> 1 UA 1545 N14228 EWR IAH 227 1400 5 15 2013-01-01 05:00:00 -#> 2 UA 1714 N24211 LGA IAH 227 1416 5 29 2013-01-01 05:00:00 -#> origin_dest -#> 1 EWRIAH -#> 2 LGAIAH +#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay carrier +#> 1 2013 1 1 517 515 2 830 819 11 UA +#> 2 2013 1 1 533 529 4 850 830 20 UA +#> flight tailnum origin dest air_time distance hour minute time_hour origin_dest +#> 1 1545 N14228 EWR IAH 227 1400 5 15 2013-01-01 05:00:00 EWRIAH +#> 2 1714 N24211 LGA IAH 227 1416 5 29 2013-01-01 05:00:00 LGAIAH ``` ### Group-by @@ -276,15 +273,6 @@ obtained using estimated methods. ``` r library(data.table) -#> data.table 1.13.6 using 6 threads (see ?getDTthreads). 
Latest news: r-datatable.com -#> -#> Attaching package: 'data.table' -#> The following object is masked from 'package:purrr': -#> -#> transpose -#> The following objects are masked from 'package:dplyr': -#> -#> between, first, last suppressWarnings( grp_by_stage1 <- @@ -325,7 +313,7 @@ To find out where the disk.frame is stored on disk: ``` r # where is the disk.frame stored attr(flights.df, "path") -#> [1] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmpk3aGAr\\file3adc78655410.df" +#> [1] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpIlXNzn\\file568813b835a7.df" ``` A number of data.frame functions are implemented for disk.frame @@ -333,19 +321,19 @@ A number of data.frame functions are implemented for disk.frame ``` r # get first few rows head(flights.df, 1) -#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay -#> 1: 2013 1 1 517 515 2 830 819 11 -#> carrier flight tailnum origin dest air_time distance hour minute time_hour -#> 1: UA 1545 N14228 EWR IAH 227 1400 5 15 2013-01-01 05:00:00 +#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay carrier +#> 1: 2013 1 1 517 515 2 830 819 11 UA +#> flight tailnum origin dest air_time distance hour minute time_hour +#> 1: 1545 N14228 EWR IAH 227 1400 5 15 2013-01-01 05:00:00 ``` ``` r # get last few rows tail(flights.df, 1) -#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay -#> 1: 2013 9 30 NA 840 NA NA 1020 NA -#> carrier flight tailnum origin dest air_time distance hour minute time_hour -#> 1: MQ 3531 N839MQ LGA RDU NA 431 8 40 2013-09-30 08:00:00 +#> year month day dep_time sched_dep_time dep_delay arr_time sched_arr_time arr_delay carrier +#> 1: 2013 9 30 NA 840 NA NA 1020 NA MQ +#> flight tailnum origin dest air_time distance hour minute time_hour +#> 1: 3531 N839MQ LGA RDU NA 431 8 40 2013-09-30 08:00:00 ``` ``` r @@ -362,7 +350,7 @@ ncol(flights.df) ## Hex logo -![disk.frame logo](inst/figures/logo.png?raw=true) 
+![disk.frame logo](inst/figures/logo.png) ## Contributors @@ -456,11 +444,3 @@ ways? Here are some ways you can contribute [![](https://cranlogs.r-pkg.org/badges/disk.frame)](https://cran.r-project.org/package=disk.frame) [![](http://cranlogs.r-pkg.org/badges/grand-total/disk.frame)](https://cran.r-project.org/package=disk.frame) -[![Travis build -status](https://travis-ci.org/xiaodaigh/disk.frame.svg?branch=master)](https://travis-ci.org/xiaodaigh/disk.frame) -[![AppVeyor build -status](https://ci.appveyor.com/api/projects/status/github/xiaodaigh/disk.frame?branch=master&svg=true)](https://ci.appveyor.com/project/xiaodaigh/disk.frame) - -## Live Stream of `{disk.frame}` development - -- diff --git a/book/01-intro.Rmd b/book/01-intro.Rmd index d0df5a20..0ffc5a2e 100644 --- a/book/01-intro.Rmd +++ b/book/01-intro.Rmd @@ -3,7 +3,7 @@ title: "Preface - The birth of `disk.frame`" author: "ZJ" output: rmarkdown::html_vignette vignette: > - %\VignetteIndexEntry{preface} + %\VignetteIndexEntry{Preface - The birth of `disk.frame`} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- diff --git a/book/06-vs-dask-juliadb.Rmd b/book/06-vs-dask-juliadb.Rmd index 830081f9..c018af59 100644 --- a/book/06-vs-dask-juliadb.Rmd +++ b/book/06-vs-dask-juliadb.Rmd @@ -3,7 +3,7 @@ title: "Benchmarks 1: disk.frame beats Dask! disk.frame beats JuliaDB! Anyone el author: "ZJ" output: rmarkdown::html_vignette vignette: > - %\VignetteIndexEntry{benchmark-1} + %\VignetteIndexEntry{Benchmarks 1: disk.frame beats Dask! disk.frame beats JuliaDB! 
Anyone else wanna challenge?} %\VignetteEngine{knitr::rmarkdown} %\VignetteEncoding{UTF-8} --- diff --git a/book/10-group-by.Rmd b/book/10-group-by.Rmd index f0f6ec34..1f47eb55 100644 --- a/book/10-group-by.Rmd +++ b/book/10-group-by.Rmd @@ -58,22 +58,23 @@ It is important to note that not all functions that can run in `dplyr::summarize If a function you need/like is missing, please make a feature request [here](https://github.com/xiaodaigh/disk.frame/issues). It is a limitation that function that depend on the order a column can only obtained using estimated methods. -| Function | Exact/Estimate | Notes | -| -- | -- | -- | -| `min` | Exact | | -| `max` | Exact | | -| `mean` | Exact | | -| `sum` | Exact | | -| `length` | Exact | | -| `n` | Exact | | -| `n_distinct` | Exact | | -| `sd` | Exact | | -| `var` | Exact | `var(x)` only `cor, cov` support *planned* | -| `any` | Exact | | -| `all` | Exact | | -| `median` | Estimate | | -| `quantile` | Estimate | One quantile only | -| `IQR` | Estimate | | +| Function | Exact/Estimate | Notes | +|--------------|----------------|--------------------------------------------| +| `min` | Exact | | +| `max` | Exact | | +| `mean` | Exact | | +| `sum` | Exact | | +| `length` | Exact | | +| `n` | Exact | | +| `n_distinct` | Exact | | +| `sd` | Exact | | +| `var` | Exact | `var(x)` only `cor, cov` support *planned* | +| `any` | Exact | | +| `all` | Exact | | +| `median` | Estimate | | +| `quantile` | Estimate | One quantile only | +| `IQR` | Estimate | | + ### Notes on One-Stage group-by diff --git a/book/88-trouble-shooting.Rmd b/book/88-trouble-shooting.Rmd new file mode 100644 index 00000000..f9cbca51 --- /dev/null +++ b/book/88-trouble-shooting.Rmd @@ -0,0 +1,53 @@ +--- +title: "Trouble shooting" +author: "ZJ" +output: pdf_document +--- + +```{r include=FALSE} +knitr::opts_chunk$set( + collapse = TRUE, + comment = "#>", + eval=TRUE, + include=TRUE +) +``` + +### Steps to trouble shoot + +1. 
I suggest updating {future} and your R version if you have not already done so. + +2. Are you able to share the data? + +3. Do a good MWE +``` +library(disk.frame) +setup_disk.frame() + +df<-as.disk.frame(a) + + +df1 = mutate(df, date = as.Date(as.character(datadate), format="%Y%m%d")) + +head(df1) +``` + + +4. Check if your virus scanner is blocking interprocess communication + +5. Try to apply the function to just one chunk, perhaps there is a syntax error or column error? If one chunk works then you can rule out coding error + +``` +get_chunk(df, 1) %>% + mutate(date = as.Date(as.character(datadate), format="%Y%m%d")) +``` + +6. Set the number of workers to 1, so there is no more inter-process communication. Does it work now? If it does, then it's the inter process communication. You might need to contact your admin for help + +``` +setup_disk.frame(workers=1) +mutate(df, date = as.Date(as.character(datadate), format="%Y%m%d")) +As an MWE this works for me. + +a = data.frame(datadate = rep("20201007", 3e6)) +``` diff --git a/cran-comments.md b/cran-comments.md index 3784d366..b661d1a8 100644 --- a/cran-comments.md +++ b/cran-comments.md @@ -1,11 +1,11 @@ -## Submission for v0.4.0 -* Fixed recently reported warnings +## Submission for v0.5.0 +* Fixed issue in CRAN check but needed to update version to follow semver conventions ## Test environments -* local Windows 10 Pro install, R 4.0.3 -* local Windows 10 Pro install, R devel (as of 2021-02-11) -* local Linux/Ubuntu install, R 4.0.3 -* local Linux/Ubuntu install, R devel (as of 2021-02-11) +* local Windows 10 Pro install, R 4.0.5 +* local Windows 10 Pro install, R devel (as of 2021-05-09) +* local Linux/Ubuntu install, R 4.0.5 +* local Linux/Ubuntu install, R devel (as of 2021-05-09) ## R CMD check results There were no ERRORs nor WARNINGs nor NOTE when run locally. 
diff --git a/docs/404.html b/docs/404.html index 8c5ef8b1..78100fa4 100644 --- a/docs/404.html +++ b/docs/404.html @@ -1,66 +1,27 @@ - - - - + + + + - Page not found (404) • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + - - - - -
-
- + +
+ + + - - -
+
+
-
- +
+ + - - diff --git a/docs/LICENSE-text.html b/docs/LICENSE-text.html index f2435efd..abba5cc8 100644 --- a/docs/LICENSE-text.html +++ b/docs/LICENSE-text.html @@ -1,66 +1,12 @@ - - - - - - - -License • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -License • disk.frame - - - - + + -
-
- -
- -
+
+
-
- +
- - + + diff --git a/docs/articles/01-intro.html b/docs/articles/01-intro.html index 93f57ca8..584809c3 100644 --- a/docs/articles/01-intro.html +++ b/docs/articles/01-intro.html @@ -19,6 +19,8 @@ + +
- - -
- +
- - + + diff --git a/docs/authors.html b/docs/authors.html index fd9e2f46..342af2fa 100644 --- a/docs/authors.html +++ b/docs/authors.html @@ -1,66 +1,12 @@ - - - - - - - -Authors • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Authors and Citation • disk.frame - + + - - - - -
-
-
- -
+
- @@ -172,22 +126,20 @@

Authors

-
- +
- - + + diff --git a/docs/index.html b/docs/index.html index 41066c9b..89c4a22e 100644 --- a/docs/index.html +++ b/docs/index.html @@ -23,6 +23,8 @@ + +
-
- -
- +
- - + + diff --git a/docs/reference/compute.disk.frame.html b/docs/reference/compute.disk.frame.html index 8204b014..8feaf6eb 100644 --- a/docs/reference/compute.disk.frame.html +++ b/docs/reference/compute.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Compute without writing — compute.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Compute without writing — compute.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,75 +95,64 @@

Compute without writing

Perform the computation; same as calling cmap without .f and lazy = FALSE

-
# S3 method for disk.frame
-compute(
-  x,
-  name,
-  outdir = tempfile("tmp_df_", fileext = ".df"),
-  overwrite = TRUE,
-  ...
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - -
x

a disk.frame

name

Not used. Kept for compatibility with dplyr

outdir

the output directory

overwrite

whether to overwrite or not

...

Not used. Kept for dplyr compatibility

- - -

Examples

-
cars.df = as.disk.frame(cars) -cars.df2 = cars.df %>% cmap(~.x) -# the computation is performed and the data is now stored elsewhere -cars.df3 = compute(cars.df2) - -# clean up -delete(cars.df) -delete(cars.df3)
+
+
# S3 method for disk.frame
+compute(
+  x,
+  name,
+  outdir = tempfile("tmp_df_", fileext = ".df"),
+  overwrite = TRUE,
+  ...
+)
+
+ +
+

Arguments

+
x
+

a disk.frame

+
name
+

Not used. Kept for compatibility with dplyr

+
outdir
+

the output directory

+
overwrite
+

whether to overwrite or not

+
...
+

Not used. Kept for dplyr compatibility

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+cars.df2 = cars.df %>% cmap(~.x)
+# the computation is performed and the data is now stored elsewhere
+cars.df3 = compute(cars.df2)
+
+# clean up
+delete(cars.df)
+delete(cars.df3)
+
+
+
-
- +
- - + + diff --git a/docs/reference/create_chunk_mapper.html b/docs/reference/create_chunk_mapper.html index 9fc66aac..7c28d311 100644 --- a/docs/reference/create_chunk_mapper.html +++ b/docs/reference/create_chunk_mapper.html @@ -1,67 +1,12 @@ - - - - - - - -Create function that applies to each chunk if disk.frame — create_chunk_mapper • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Create function that applies to each chunk if disk.frame — create_chunk_mapper • disk.frame - - - - + + -
-
- -
- -
+
@@ -162,104 +95,102 @@

Create function that applies to each chunk if disk.frame

A function to make it easier to create functions like filter

-
create_chunk_mapper(chunk_fn, warning_msg = NULL, as.data.frame = TRUE)
- -

Arguments

- - - - - - - - - - - - - - -
chunk_fn

The dplyr function to create a mapper for

warning_msg

The warning message to display when invoking the mapper

as.data.frame

force the input chunk of a data.frame; needed for dtplyr

- - -

Examples

-
-filter = create_chunk_mapper(dplyr::filter) - -#' example: creating a function that keeps only the first and last n row -first_and_last <- function(chunk, n, ...) { - nr = nrow(chunk) - print(nr-n+1:nr) - chunk[c(1:n, (nr-n+1):nr), ] -} - -#' create the function for use with disk.frame -first_and_last_df = create_chunk_mapper(first_and_last) - -mtcars.df = as.disk.frame(mtcars) - -#' the operation is lazy -lazy_mtcars.df = mtcars.df %>% - first_and_last_df(2) +
+
create_chunk_mapper(chunk_fn, warning_msg = NULL, as.data.frame = TRUE)
+
-#' bring into R -collect(lazy_mtcars.df)
#> [1] 5 6 7 8 9 10 -#> [1] 5 6 7 8 9 10 -#> [1] 5 6 7 8 9 10 -#> [1] 5 6 7 8 9 10 -#> [1] 5 6 7 8 9 10 -#> [1] 1 2
#> mpg cyl disp hp drat wt qsec vs am gear carb -#> ...1 21.0 6 160.0 110 3.90 2.620 16.46 0 1 4 4 -#> ...2 21.0 6 160.0 110 3.90 2.875 17.02 0 1 4 4 -#> ...3 18.7 8 360.0 175 3.15 3.440 17.02 0 0 3 2 -#> ...4 18.1 6 225.0 105 2.76 3.460 20.22 1 0 3 1 -#> ...5 14.3 8 360.0 245 3.21 3.570 15.84 0 0 3 4 -#> ...6 24.4 4 146.7 62 3.69 3.190 20.00 1 0 4 2 -#> ...7 17.8 6 167.6 123 3.92 3.440 18.90 1 0 4 4 -#> ...8 16.4 8 275.8 180 3.07 4.070 17.40 0 0 3 3 -#> ...9 17.3 8 275.8 180 3.07 3.730 17.60 0 0 3 3 -#> ...10 15.2 8 275.8 180 3.07 3.780 18.00 0 0 3 3 -#> ...11 14.7 8 440.0 230 3.23 5.345 17.42 0 0 3 4 -#> ...12 32.4 4 78.7 66 4.08 2.200 19.47 1 1 4 1 -#> ...13 30.4 4 75.7 52 4.93 1.615 18.52 1 1 4 2 -#> ...14 33.9 4 71.1 65 4.22 1.835 19.90 1 1 4 1 -#> ...15 15.2 8 304.0 150 3.15 3.435 17.30 0 0 3 2 -#> ...16 13.3 8 350.0 245 3.73 3.840 15.41 0 0 3 4 -#> ...17 19.2 8 400.0 175 3.08 3.845 17.05 0 0 3 2 -#> ...18 27.3 4 79.0 66 4.08 1.935 18.90 1 1 4 1 -#> ...19 15.8 8 351.0 264 4.22 3.170 14.50 0 1 5 4 -#> ...20 19.7 6 145.0 175 3.62 2.770 15.50 0 1 5 6 -#> 1 15.0 8 301.0 335 3.54 3.570 14.60 0 1 5 8 -#> 2 21.4 4 121.0 109 4.11 2.780 18.60 1 1 4 2 -#> 1.1 15.0 8 301.0 335 3.54 3.570 14.60 0 1 5 8 -#> 2.1 21.4 4 121.0 109 4.11 2.780 18.60 1 1 4 2
-#' clean up -delete(mtcars.df)
+
+

Arguments

+
chunk_fn
+

The dplyr function to create a mapper for

+
warning_msg
+

The warning message to display when invoking the mapper

+
as.data.frame
+

force the input chunk of a data.frame; needed for dtplyr

+
+ +
+

Examples

+

+filter = create_chunk_mapper(dplyr::filter)
+
+#' example: creating a function that keeps only the first and last n row
+first_and_last <- function(chunk, n, ...) {
+  nr = nrow(chunk)
+  print(nr-n+1:nr)
+  chunk[c(1:n, (nr-n+1):nr), ]
+}
+
+#' create the function for use with disk.frame
+first_and_last_df = create_chunk_mapper(first_and_last)
+
+mtcars.df = as.disk.frame(mtcars)
+
+#' the operation is lazy
+lazy_mtcars.df = mtcars.df %>%
+  first_and_last_df(2)
+
+#' bring into R
+collect(lazy_mtcars.df)
+#> [1]  5  6  7  8  9 10
+#> [1]  5  6  7  8  9 10
+#> [1]  5  6  7  8  9 10
+#> [1]  5  6  7  8  9 10
+#> [1]  5  6  7  8  9 10
+#> [1] 1 2
+#>      mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+#>  1: 21.0   6 160.0 110 3.90 2.620 16.46  0  1    4    4
+#>  2: 21.0   6 160.0 110 3.90 2.875 17.02  0  1    4    4
+#>  3: 18.7   8 360.0 175 3.15 3.440 17.02  0  0    3    2
+#>  4: 18.1   6 225.0 105 2.76 3.460 20.22  1  0    3    1
+#>  5: 14.3   8 360.0 245 3.21 3.570 15.84  0  0    3    4
+#>  6: 24.4   4 146.7  62 3.69 3.190 20.00  1  0    4    2
+#>  7: 17.8   6 167.6 123 3.92 3.440 18.90  1  0    4    4
+#>  8: 16.4   8 275.8 180 3.07 4.070 17.40  0  0    3    3
+#>  9: 17.3   8 275.8 180 3.07 3.730 17.60  0  0    3    3
+#> 10: 15.2   8 275.8 180 3.07 3.780 18.00  0  0    3    3
+#> 11: 14.7   8 440.0 230 3.23 5.345 17.42  0  0    3    4
+#> 12: 32.4   4  78.7  66 4.08 2.200 19.47  1  1    4    1
+#> 13: 30.4   4  75.7  52 4.93 1.615 18.52  1  1    4    2
+#> 14: 33.9   4  71.1  65 4.22 1.835 19.90  1  1    4    1
+#> 15: 15.2   8 304.0 150 3.15 3.435 17.30  0  0    3    2
+#> 16: 13.3   8 350.0 245 3.73 3.840 15.41  0  0    3    4
+#> 17: 19.2   8 400.0 175 3.08 3.845 17.05  0  0    3    2
+#> 18: 27.3   4  79.0  66 4.08 1.935 18.90  1  1    4    1
+#> 19: 15.8   8 351.0 264 4.22 3.170 14.50  0  1    5    4
+#> 20: 19.7   6 145.0 175 3.62 2.770 15.50  0  1    5    6
+#> 21: 15.0   8 301.0 335 3.54 3.570 14.60  0  1    5    8
+#> 22: 21.4   4 121.0 109 4.11 2.780 18.60  1  1    4    2
+#> 23: 15.0   8 301.0 335 3.54 3.570 14.60  0  1    5    8
+#> 24: 21.4   4 121.0 109 4.11 2.780 18.60  1  1    4    2
+#>      mpg cyl  disp  hp drat    wt  qsec vs am gear carb
+
+#' clean up
+delete(mtcars.df)
+
+
+
+
-
- +
- - + + diff --git a/docs/reference/csv_to_disk.frame.html b/docs/reference/csv_to_disk.frame.html index 3f80f571..17b0d387 100644 --- a/docs/reference/csv_to_disk.frame.html +++ b/docs/reference/csv_to_disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Convert CSV file(s) to disk.frame format — csv_to_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Convert CSV file(s) to disk.frame format — csv_to_disk.frame • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,141 +95,115 @@

Convert CSV file(s) to disk.frame format

Convert CSV file(s) to disk.frame format

-
csv_to_disk.frame(
-  infile,
-  outdir = tempfile(fileext = ".df"),
-  inmapfn = base::I,
-  nchunks = recommend_nchunks(sum(file.size(infile))),
-  in_chunk_size = NULL,
-  shardby = NULL,
-  compress = 50,
-  overwrite = TRUE,
-  header = TRUE,
-  .progress = TRUE,
-  backend = c("data.table", "readr", "LaF"),
-  chunk_reader = c("bigreadr", "data.table", "readr", "readLines"),
-  ...
-)
+
+
csv_to_disk.frame(
+  infile,
+  outdir = tempfile(fileext = ".df"),
+  inmapfn = base::I,
+  nchunks = recommend_nchunks(sum(file.size(infile))),
+  in_chunk_size = NULL,
+  shardby = NULL,
+  compress = 50,
+  overwrite = TRUE,
+  header = TRUE,
+  .progress = TRUE,
+  backend = c("data.table", "readr", "LaF"),
+  chunk_reader = c("bigreadr", "data.table", "readr", "readLines"),
+  ...
+)
+
-

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
infile

The input CSV file or files

outdir

The directory to output the disk.frame to

inmapfn

A function to be applied to the chunk read in from CSV before +

+

Arguments

+
infile
+

The input CSV file or files

+
outdir
+

The directory to output the disk.frame to

+
inmapfn
+

A function to be applied to the chunk read in from CSV before the chunk is being written out. Commonly used to perform simple -transformations. Defaults to the identity function (ie. no transformation)

nchunks

Number of chunks to output

in_chunk_size

When reading in the file, how many lines to read in at +transformations. Defaults to the identity function (ie. no transformation)

+
nchunks
+

Number of chunks to output

+
in_chunk_size
+

When reading in the file, how many lines to read in at once. This is different to nchunks which controls how many chunks are -output

shardby

The column(s) to shard the data by. For example suppose +output

+
shardby
+

The column(s) to shard the data by. For example suppose `shardby = c("col1","col2")` then every row where the values `col1` and `col2` are the same will end up in the same chunk; this will allow merging -by `col1` and `col2` to be more efficient

compress

For fst backends it's a number between 0 and 100 where 100 is -the highest compression ratio.

overwrite

Whether to overwrite the existing directory

header

Whether the files have header. Defaults to TRUE

.progress

A logical, for whether or not to print a progress bar for -multiprocess, multisession, and multicore plans. From furrr

backend

The CSV reader backend to choose: "data.table" or "readr". +by `col1` and `col2` to be more efficient

+
compress
+

For fst backends it's a number between 0 and 100 where 100 is +the highest compression ratio.

+
overwrite
+

Whether to overwrite the existing directory

+
header
+

Whether the files have header. Defaults to TRUE

+
.progress
+

A logical, for whether or not to print a progress bar for +multiprocess, multisession, and multicore plans. From furrr

+
backend
+

The CSV reader backend to choose: "data.table" or "readr". disk.frame does not have its own CSV reader. It uses either data.table::fread or readr::read_delimited. It is worth noting that data.table::fread does not detect dates and all dates are imported as strings, and you are encouraged to use fasttime to convert the strings to date. You can use the `inmapfn` to do that. However, if you want automatic date detection, then backend="readr" may suit your needs. However, readr -is often slower than data.table, hence data.table is chosen as the default.

chunk_reader

Even if you choose a backend there can still be multiple +is often slower than data.table, hence data.table is chosen as the default.

+
chunk_reader
+

Even if you choose a backend there can still be multiple strategies on how to approach the CSV reads. For example, data.table::fread tries to mmap the whole file which can cause the whole read process to fail. In that case we can change the chunk_reader to "readLines" which uses the readLines function to read chunk by chunk and still use data.table::fread to process the chunks. There are currently no strategies for readr backend, -except the default one.

...

passed to data.table::fread, disk.frame::as.disk.frame, -disk.frame::shard

- -

See also

- -

Other ingesting data: -zip_to_disk.frame()

- -

Examples

-
tmpfile = tempfile() -write.csv(cars, tmpfile) -tmpdf = tempfile(fileext = ".df") -df = csv_to_disk.frame(tmpfile, outdir = tmpdf, overwrite = TRUE) +except the default one.

+
...
+

passed to data.table::fread, disk.frame::as.disk.frame, +disk.frame::shard

+
+
+

See also

+

Other ingesting data: +zip_to_disk.frame()

+
-# clean up -fs::file_delete(tmpfile) -delete(df)
+
+

Examples

+
tmpfile = tempfile()
+write.csv(cars, tmpfile)
+tmpdf = tempfile(fileext = ".df")
+df = csv_to_disk.frame(tmpfile, outdir = tmpdf, overwrite = TRUE)
+
+# clean up
+fs::file_delete(tmpfile)
+delete(df)
+
+
+
-
- +
- - + + diff --git a/docs/reference/delete.html b/docs/reference/delete.html index f44d0caf..2a238505 100644 --- a/docs/reference/delete.html +++ b/docs/reference/delete.html @@ -1,67 +1,12 @@ - - - - - - - -Delete a disk.frame — delete • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Delete a disk.frame — delete • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,46 +95,43 @@

Delete a disk.frame

Delete a disk.frame

-
delete(df)
- -

Arguments

- - - - - - -
df

a disk.frame

- +
+
delete(df)
+
-

Examples

-
cars.df = as.disk.frame(cars) -delete(cars.df)
+
+

Arguments

+
df
+

a disk.frame

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+delete(cars.df)
+
+
+
-
- +
- - + + diff --git a/docs/reference/df_ram_size.html b/docs/reference/df_ram_size.html index 6a7c7b25..57bfaa8d 100644 --- a/docs/reference/df_ram_size.html +++ b/docs/reference/df_ram_size.html @@ -1,67 +1,12 @@ - - - - - - - -Get the size of RAM in gigabytes — df_ram_size • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Get the size of RAM in gigabytes — df_ram_size • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,41 +95,43 @@

Get the size of RAM in gigabytes

Get the size of RAM in gigabytes

-
df_ram_size()
- - -

Value

+
+
df_ram_size()
+
+
+

Value

integer of RAM in gigabyte (GB)

+
-

Examples

-
# returns the RAM size in gigabyte (GB) -df_ram_size()
#> [1] 64
+
+

Examples

+
# returns the RAM size in gigabyte (GB)
+df_ram_size() 
+#> [1] 64
+
+
+
-
- +
- - + + diff --git a/docs/reference/dfglm.html b/docs/reference/dfglm.html index 75c7571c..1197ac98 100644 --- a/docs/reference/dfglm.html +++ b/docs/reference/dfglm.html @@ -1,68 +1,13 @@ - - - - - - - -Fit generalized linear models (glm) with disk.frame — dfglm • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Fit generalized linear models (glm) with disk.frame — dfglm • disk.frame - - + + - - -
-
- -
- -
+
@@ -164,37 +97,30 @@

Fit generalized linear models (glm) with disk.frame

those return by those functions. This is a convenience wrapper

-
dfglm(formula, data, ..., glm_backend = c("biglm", "speedglm", "biglmm"))
+
+
dfglm(formula, data, ..., glm_backend = c("biglm", "speedglm", "biglmm"))
+
-

Arguments

- - - - - - - - - - - - - - - - - - -
formula

A model formula

data

See Details below. Method dispatch is on this argument

...

Additional arguments

glm_backend

Which package to use for fitting GLMs. The default is +

+

Arguments

+
formula
+

A model formula

+
data
+

See Details below. Method dispatch is on this argument

+
...
+

Additional arguments

+
glm_backend
+

Which package to use for fitting GLMs. The default is "biglm", which has known issues with factor level if different levels are present in different chunks. The "speedglm" option is more robust, but does not -implement `predict` which makes prediction and implementation impossible.

- -

Value

- +implement `predict` which makes prediction and implementation impossible.

+
+
+

Value

An object of class bigglm

-

Details

- +
+
+

Details

The data argument may be a function, a data frame, or a SQLiteConnection or RODBC connection object.

When it is a function the function must take a single argument @@ -214,60 +140,66 @@

Details variables needed for the model, not the whole table. The code in the SQLiteConnection method should work for other DBI connections, but I do not have any of these to check it with.

-

References

- +
+
+

References

Algorithm AS274 Applied Statistics (1992) Vol.41, No. 2

-

See also

- -

Other Machine Learning (ML): -make_glm_streaming_fn()

+
+
+

See also

+

Other Machine Learning (ML): +make_glm_streaming_fn()

+
-

Examples

-
cars.df = as.disk.frame(cars) -m = dfglm(dist ~ speed, data = cars.df)
#> Loading required namespace: biglm
-# can use normal R functions -# Only works in version > R 3.6 -majorv = as.integer(version$major) -minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1]) -if(((majorv == 3) & (minorv >= 6)) | (majorv > 3)) { - summary(m) - predict(m, get_chunk(cars.df, 1)) - predict(m, collect(cars.df)) - # can use broom to tidy up the returned info - broom::tidy(m) -}
#> # A tibble: 2 x 4 -#> term estimate std.error p.value -#> <chr> <dbl> <dbl> <dbl> -#> 1 (Intercept) -17.6 6.76 9.29e- 3 -#> 2 speed 3.93 0.416 2.96e-21
-# clean up -delete(cars.df)
+
+

Examples

+
cars.df = as.disk.frame(cars)
+m = dfglm(dist ~ speed, data = cars.df)
+#> Loading required namespace: biglm
+
+# can use normal R functions
+# Only works in version > R 3.6
+majorv = as.integer(version$major)
+minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1])
+if(((majorv == 3) & (minorv >= 6)) | (majorv > 3)) {
+  summary(m)
+  predict(m, get_chunk(cars.df, 1))
+  predict(m, collect(cars.df))
+  # can use broom to tidy up the returned info
+  broom::tidy(m)
+}
+#> # A tibble: 2 x 4
+#>   term        estimate std.error  p.value
+#>   <chr>          <dbl>     <dbl>    <dbl>
+#> 1 (Intercept)   -17.6      6.76  9.29e- 3
+#> 2 speed           3.93     0.416 2.96e-21
+
+# clean up
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/disk.frame.html b/docs/reference/disk.frame.html index 5dd9de15..0d2320c2 100644 --- a/docs/reference/disk.frame.html +++ b/docs/reference/disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Create a disk.frame from a folder — disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Create a disk.frame from a folder — disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,63 +95,64 @@

Create a disk.frame from a folder

Create a disk.frame from a folder

-
disk.frame(path, backend = "fst")
- -

Arguments

- - - - - - - - - - -
path

The path to store the output file or to a directory

backend

The only available backend is fst at the moment

- - -

Examples

-
path = file.path(tempdir(),"cars") -as.disk.frame(cars, outdir=path, overwrite = TRUE, nchunks = 2)
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK/cars" -#> nchunks: 2 -#> nrow (at source): 50 -#> ncol (at source): 2 -#> nrow (post operations): ??? -#> ncol (post operations): ???
df = disk.frame(path) -head(df)
#> speed dist -#> 1: 4 2 -#> 2: 4 10 -#> 3: 7 4 -#> 4: 7 22 -#> 5: 8 16 -#> 6: 9 10
#> [1] 2
# clean up -delete(df)
+
+
disk.frame(path, backend = "fst")
+
+ +
+

Arguments

+
path
+

The path to store the output file or to a directory

+
backend
+

The only available backend is fst at the moment

+
+ +
+

Examples

+
path = file.path(tempdir(),"cars")
+as.disk.frame(cars, outdir=path, overwrite = TRUE, nchunks = 2)
+#> path: "C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5/cars"
+#> nchunks: 2
+#> nrow (at source): 50
+#> ncol (at source): 2
+#> nrow (post operations): ???
+#> ncol (post operations): ???
+df = disk.frame(path)
+head(df)
+#>    speed dist
+#> 1:     4    2
+#> 2:     4   10
+#> 3:     7    4
+#> 4:     7   22
+#> 5:     8   16
+#> 6:     9   10
+nchunks(df)
+#> [1] 2
+# clean up
+delete(df)
+
+
+
- - - + + diff --git a/docs/reference/dplyr_verbs.html b/docs/reference/dplyr_verbs.html index 00f29a9e..4cbb0612 100644 --- a/docs/reference/dplyr_verbs.html +++ b/docs/reference/dplyr_verbs.html @@ -1,68 +1,13 @@ - - - - - - - -The dplyr verbs implemented for disk.frame — select.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -The dplyr verbs implemented for disk.frame — select.disk.frame • disk.frame - - - - + + -
-
- -
- -
+
@@ -164,99 +97,88 @@

The dplyr verbs implemented for disk.frame

`chunk_arrange` performs the actions within each chunk

-
# S3 method for disk.frame
-select(.data, ...)
-
-# S3 method for disk.frame
-rename(.data, ...)
+    
+
# S3 method for disk.frame
+select(.data, ...)
 
-# S3 method for disk.frame
-filter(.data, ...)
+# S3 method for disk.frame
+rename(.data, ...)
 
-# S3 method for disk.frame
-mutate(.data, ...)
+# S3 method for disk.frame
+filter(.data, ...)
 
-# S3 method for disk.frame
-transmute(.data, ...)
+# S3 method for disk.frame
+mutate(.data, ...)
 
-# S3 method for disk.frame
-arrange(.data, ...)
+# S3 method for disk.frame
+transmute(.data, ...)
 
-chunk_arrange(.data, ...)
+# S3 method for disk.frame
+arrange(.data, ...)
 
-tally.disk.frame(.data, ...)
+chunk_arrange(.data, ...)
 
-count.disk.frame(.data, ...)
+add_tally.disk.frame(.data, ...)
 
-add_count.disk.frame(.data, ...)
+# S3 method for disk.frame
+do(.data, ...)
 
-add_tally.disk.frame(.data, ...)
+# S3 method for disk.frame
+distinct(...)
 
-# S3 method for disk.frame
-do(.data, ...)
+chunk_distinct(.data, ...)
 
-# S3 method for disk.frame
-distinct(...)
-
-chunk_distinct(.data, ...)
-
-# S3 method for disk.frame
-glimpse(.data, ...)
- -

Arguments

- - - - - - - - - - -
.data

a disk.frame

...

Same as the dplyr functions

- - -

Examples

-
library(dplyr) -cars.df = as.disk.frame(cars) -mult = 2 - -# use all any of the supported dplyr -cars2 = cars.df %>% - select(speed) %>% - mutate(speed2 = speed * mult) %>% - filter(speed < 50) %>% - rename(speed1 = speed) %>% - collect +# S3 method for disk.frame +glimpse(.data, ...)
+
-# clean up cars.df -delete(cars.df)
+
+

Arguments

+
.data
+

a disk.frame

+
...
+

Same as the dplyr functions

+
+ +
+

Examples

+
library(dplyr)
+cars.df = as.disk.frame(cars)
+mult = 2
+
+# use all any of the supported dplyr
+cars2 = cars.df %>% 
+  select(speed) %>% 
+  mutate(speed2 = speed * mult) %>% 
+  filter(speed < 50) %>% 
+  rename(speed1 = speed) %>% 
+  collect
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/evalparseglue.html b/docs/reference/evalparseglue.html index 60206d23..4172714e 100644 --- a/docs/reference/evalparseglue.html +++ b/docs/reference/evalparseglue.html @@ -1,67 +1,12 @@ - - - - - - - -Helper function to evalparse some `glue::glue` string — evalparseglue • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Helper function to evalparse some `glue::glue` string — evalparseglue • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,47 +95,39 @@

Helper function to evalparse some `glue::glue` string

Helper function to evalparse some `glue::glue` string

-
evalparseglue(code, env = parent.frame())
- -

Arguments

- - - - - - - - - - -
code

the code in character(string) format to evaluate

env

the environment in which to evaluate the code

+
+
evalparseglue(code, env = parent.frame())
+
+
+

Arguments

+
code
+

the code in character(string) format to evaluate

+
env
+

the environment in which to evaluate the code

+
+
- - - + + diff --git a/docs/reference/foverlaps.disk.frame.html b/docs/reference/foverlaps.disk.frame.html index 11ca11f6..19607792 100644 --- a/docs/reference/foverlaps.disk.frame.html +++ b/docs/reference/foverlaps.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Apply data.table's foverlaps to the disk.frame — foverlaps.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Apply data.table's foverlaps to the disk.frame — foverlaps.disk.frame • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,101 +95,81 @@

Apply data.table's foverlaps to the disk.frame

EXPERIMENTAL

-
foverlaps.disk.frame(
-  df1,
-  df2,
-  by.x = if (identical(shardkey(df1)$shardkey, "")) shardkey(df1)$shardkey else
-    shardkey(df2)$shardkey,
-  by.y = shardkey(df2)$shardkey,
-  ...,
-  outdir = tempfile("df_foverlaps_tmp", fileext = ".df"),
-  merge_by_chunk_id = FALSE,
-  compress = 50,
-  overwrite = TRUE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df1

A disk.frame

df2

A disk.frame or a data.frame

by.x

character/string vector. by.x used in foverlaps

by.y

character/string vector. by.x used in foverlaps

...

passed to data.table::foverlaps and disk.frame::cmap.disk.frame

outdir

The output directory of the disk.frame

merge_by_chunk_id

If TRUE then the merges will happen for chunks in df1 and df2 with the same chunk id which speed up processing. Otherwise every chunk of df1 is merged with every chunk of df2. Ignored with df2 is not a disk.frame

compress

The compression ratio for fst

overwrite

overwrite existing directory

- - -

Examples

-
library(data.table) - -## simple example: -x = as.disk.frame(data.table(start=c(5,31,22,16), end=c(8,50,25,18), val2 = 7:10)) -y = as.disk.frame(data.table(start=c(10, 20, 30), end=c(15, 35, 45), val1 = 1:3)) -byxy = c("val1", "start", "end") -xy.df = foverlaps.disk.frame( - x, y, by.x = byxy, by.y = byxy, - merge_by_chunk_id = TRUE, overwrite = TRUE) +
+
foverlaps.disk.frame(
+  df1,
+  df2,
+  by.x = if (identical(shardkey(df1)$shardkey, "")) shardkey(df1)$shardkey else
+    shardkey(df2)$shardkey,
+  by.y = shardkey(df2)$shardkey,
+  ...,
+  outdir = tempfile("df_foverlaps_tmp", fileext = ".df"),
+  merge_by_chunk_id = FALSE,
+  compress = 50,
+  overwrite = TRUE
+)
+
-# clean up -delete(x) -delete(y) -delete(xy.df)
+
+

Arguments

+
df1
+

A disk.frame

+
df2
+

A disk.frame or a data.frame

+
by.x
+

character/string vector. by.x used in foverlaps

+
by.y
+

character/string vector. by.x used in foverlaps

+
...
+

passed to data.table::foverlaps and disk.frame::cmap.disk.frame

+
outdir
+

The output directory of the disk.frame

+
merge_by_chunk_id
+

If TRUE then the merges will happen for chunks in df1 and df2 with the same chunk id which speed up processing. Otherwise every chunk of df1 is merged with every chunk of df2. Ignored with df2 is not a disk.frame

+
compress
+

The compression ratio for fst

+
overwrite
+

overwrite existing directory

+
+ +
+

Examples

+
library(data.table)
+
+## simple example:
+x = as.disk.frame(data.table(start=c(5,31,22,16), end=c(8,50,25,18), val2 = 7:10))
+y = as.disk.frame(data.table(start=c(10, 20, 30), end=c(15, 35, 45), val1 = 1:3))
+byxy = c("start", "end")
+xy.df = foverlaps.disk.frame(
+   x, y, by.x = byxy, by.y = byxy,
+  merge_by_chunk_id = TRUE, overwrite = TRUE)
+# clean up
+delete(x)
+delete(y)
+delete(xy.df)
+
+
+
- - - + + diff --git a/docs/reference/gen_datatable_synthetic.html b/docs/reference/gen_datatable_synthetic.html index c7eb7d31..608041f6 100644 --- a/docs/reference/gen_datatable_synthetic.html +++ b/docs/reference/gen_datatable_synthetic.html @@ -1,67 +1,12 @@ - - - - - - - -Generate synthetic dataset for testing — gen_datatable_synthetic • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Generate synthetic dataset for testing — gen_datatable_synthetic • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,47 +95,39 @@

Generate synthetic dataset for testing

Generate synthetic dataset for testing

-
gen_datatable_synthetic(N = 2e+08, K = 100)
- -

Arguments

- - - - - - - - - - -
N

number of rows. Defaults to 200 million

K

controls the number of unique values for id. Some ids will have K distinct values while others have N/K distinct values

+
+
gen_datatable_synthetic(N = 2e+08, K = 100)
+
+
+

Arguments

+
N
+

number of rows. Defaults to 200 million

+
K
+

controls the number of unique values for id. Some ids will have K distinct values while others have N/K distinct values

+
+
- - - + + diff --git a/docs/reference/get_chunk.html b/docs/reference/get_chunk.html index 5cf436cb..66df5c10 100644 --- a/docs/reference/get_chunk.html +++ b/docs/reference/get_chunk.html @@ -1,67 +1,12 @@ - - - - - - - -Obtain one chunk by chunk id — get_chunk • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Obtain one chunk by chunk id — get_chunk • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,173 +95,170 @@

Obtain one chunk by chunk id

Obtain one chunk by chunk id

-
get_chunk(...)
-
-# S3 method for disk.frame
-get_chunk(df, n, keep = NULL, full.names = FALSE, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - -
...

passed to fst::read_fst or whichever read function is used in the backend

df

a disk.frame

n

the chunk id. If numeric then matches by number, if character then returns the chunk with the same name as n

keep

the columns to keep

full.names

whether n is the full path to the chunks or just a relative path file name. Ignored if n is numeric

+
+
get_chunk(...)
 
+# S3 method for disk.frame
+get_chunk(df, n, keep = NULL, full.names = FALSE, ...)
+
-

Examples

-
cars.df = as.disk.frame(cars, nchunks = 2) -get_chunk(cars.df, 1)
#> speed dist -#> 1: 4 2 -#> 2: 4 10 -#> 3: 7 4 -#> 4: 7 22 -#> 5: 8 16 -#> 6: 9 10 -#> 7: 10 18 -#> 8: 10 26 -#> 9: 10 34 -#> 10: 11 17 -#> 11: 11 28 -#> 12: 12 14 -#> 13: 12 20 -#> 14: 12 24 -#> 15: 12 28 -#> 16: 13 26 -#> 17: 13 34 -#> 18: 13 34 -#> 19: 13 46 -#> 20: 14 26 -#> 21: 14 36 -#> 22: 14 60 -#> 23: 14 80 -#> 24: 15 20 -#> 25: 15 26 -#> speed dist
get_chunk(cars.df, 2)
#> speed dist -#> 1: 15 54 -#> 2: 16 32 -#> 3: 16 40 -#> 4: 17 32 -#> 5: 17 40 -#> 6: 17 50 -#> 7: 18 42 -#> 8: 18 56 -#> 9: 18 76 -#> 10: 18 84 -#> 11: 19 36 -#> 12: 19 46 -#> 13: 19 68 -#> 14: 20 32 -#> 15: 20 48 -#> 16: 20 52 -#> 17: 20 56 -#> 18: 20 64 -#> 19: 22 66 -#> 20: 23 54 -#> 21: 24 70 -#> 22: 24 92 -#> 23: 24 93 -#> 24: 24 120 -#> 25: 25 85 -#> speed dist
get_chunk(cars.df, 1, keep = "speed")
#> speed -#> 1: 4 -#> 2: 4 -#> 3: 7 -#> 4: 7 -#> 5: 8 -#> 6: 9 -#> 7: 10 -#> 8: 10 -#> 9: 10 -#> 10: 11 -#> 11: 11 -#> 12: 12 -#> 13: 12 -#> 14: 12 -#> 15: 12 -#> 16: 13 -#> 17: 13 -#> 18: 13 -#> 19: 13 -#> 20: 14 -#> 21: 14 -#> 22: 14 -#> 23: 14 -#> 24: 15 -#> 25: 15 -#> speed
-# if full.names = TRUE then the full path to the chunk need to be provided -get_chunk(cars.df, file.path(attr(cars.df, "path"), "1.fst"), full.names = TRUE)
#> speed dist -#> 1: 4 2 -#> 2: 4 10 -#> 3: 7 4 -#> 4: 7 22 -#> 5: 8 16 -#> 6: 9 10 -#> 7: 10 18 -#> 8: 10 26 -#> 9: 10 34 -#> 10: 11 17 -#> 11: 11 28 -#> 12: 12 14 -#> 13: 12 20 -#> 14: 12 24 -#> 15: 12 28 -#> 16: 13 26 -#> 17: 13 34 -#> 18: 13 34 -#> 19: 13 46 -#> 20: 14 26 -#> 21: 14 36 -#> 22: 14 60 -#> 23: 14 80 -#> 24: 15 20 -#> 25: 15 26 -#> speed dist
-# clean up cars.df -delete(cars.df)
+
+

Arguments

+
...
+

passed to fst::read_fst or whichever read function is used in the backend

+
df
+

a disk.frame

+
n
+

the chunk id. If numeric then matches by number, if character then returns the chunk with the same name as n

+
keep
+

the columns to keep

+
full.names
+

whether n is the full path to the chunks or just a relative path file name. Ignored if n is numeric

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars, nchunks = 2)
+get_chunk(cars.df, 1)
+#>     speed dist
+#>  1:     4    2
+#>  2:     4   10
+#>  3:     7    4
+#>  4:     7   22
+#>  5:     8   16
+#>  6:     9   10
+#>  7:    10   18
+#>  8:    10   26
+#>  9:    10   34
+#> 10:    11   17
+#> 11:    11   28
+#> 12:    12   14
+#> 13:    12   20
+#> 14:    12   24
+#> 15:    12   28
+#> 16:    13   26
+#> 17:    13   34
+#> 18:    13   34
+#> 19:    13   46
+#> 20:    14   26
+#> 21:    14   36
+#> 22:    14   60
+#> 23:    14   80
+#> 24:    15   20
+#> 25:    15   26
+#>     speed dist
+get_chunk(cars.df, 2)
+#>     speed dist
+#>  1:    15   54
+#>  2:    16   32
+#>  3:    16   40
+#>  4:    17   32
+#>  5:    17   40
+#>  6:    17   50
+#>  7:    18   42
+#>  8:    18   56
+#>  9:    18   76
+#> 10:    18   84
+#> 11:    19   36
+#> 12:    19   46
+#> 13:    19   68
+#> 14:    20   32
+#> 15:    20   48
+#> 16:    20   52
+#> 17:    20   56
+#> 18:    20   64
+#> 19:    22   66
+#> 20:    23   54
+#> 21:    24   70
+#> 22:    24   92
+#> 23:    24   93
+#> 24:    24  120
+#> 25:    25   85
+#>     speed dist
+get_chunk(cars.df, 1, keep = "speed")
+#>     speed
+#>  1:     4
+#>  2:     4
+#>  3:     7
+#>  4:     7
+#>  5:     8
+#>  6:     9
+#>  7:    10
+#>  8:    10
+#>  9:    10
+#> 10:    11
+#> 11:    11
+#> 12:    12
+#> 13:    12
+#> 14:    12
+#> 15:    12
+#> 16:    13
+#> 17:    13
+#> 18:    13
+#> 19:    13
+#> 20:    14
+#> 21:    14
+#> 22:    14
+#> 23:    14
+#> 24:    15
+#> 25:    15
+#>     speed
+
+# if full.names = TRUE then the full path to the chunk need to be provided
+get_chunk(cars.df, file.path(attr(cars.df, "path"), "1.fst"), full.names = TRUE)
+#>     speed dist
+#>  1:     4    2
+#>  2:     4   10
+#>  3:     7    4
+#>  4:     7   22
+#>  5:     8   16
+#>  6:     9   10
+#>  7:    10   18
+#>  8:    10   26
+#>  9:    10   34
+#> 10:    11   17
+#> 11:    11   28
+#> 12:    12   14
+#> 13:    12   20
+#> 14:    12   24
+#> 15:    12   28
+#> 16:    13   26
+#> 17:    13   34
+#> 18:    13   34
+#> 19:    13   46
+#> 20:    14   26
+#> 21:    14   36
+#> 22:    14   60
+#> 23:    14   80
+#> 24:    15   20
+#> 25:    15   26
+#>     speed dist
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/get_chunk_ids.html b/docs/reference/get_chunk_ids.html index 968aaa4b..d54c8f15 100644 --- a/docs/reference/get_chunk_ids.html +++ b/docs/reference/get_chunk_ids.html @@ -1,67 +1,12 @@ - - - - - - - -Get the chunk IDs and files names — get_chunk_ids • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Get the chunk IDs and files names — get_chunk_ids • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,71 +95,68 @@

Get the chunk IDs and files names

Get the chunk IDs and files names

-
get_chunk_ids(df, ..., full.names = FALSE, strip_extension = TRUE)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
df

a disk.frame

...

passed to list.files

full.names

If TRUE returns the full path to the file, Defaults to FALSE

strip_extension

If TRUE then the file extension in the chunk_id is removed. Defaults to TRUE

- - -

Examples

-
cars.df = as.disk.frame(cars) - -# return the integer-string chunk IDs -get_chunk_ids(cars.df)
#> [1] "1" "2" "3" "4" "5" "6"
-# return the file name chunk IDs -get_chunk_ids(cars.df, full.names = TRUE)
#> [1] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/1.fst" -#> [2] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/2.fst" -#> [3] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/3.fst" -#> [4] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/4.fst" -#> [5] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/5.fst" -#> [6] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\RtmpInritK\\file187ce9d748c.df/6.fst"
-# return the file name chunk IDs with file extension -get_chunk_ids(cars.df, strip_extension = FALSE)
#> [1] "1.fst" "2.fst" "3.fst" "4.fst" "5.fst" "6.fst"
-# clean up cars.df -delete(cars.df)
+
+
get_chunk_ids(df, ..., full.names = FALSE, strip_extension = TRUE)
+
+ +
+

Arguments

+
df
+

a disk.frame

+
...
+

passed to list.files

+
full.names
+

If TRUE returns the full path to the file, Defaults to FALSE

+
strip_extension
+

If TRUE then the file extension in the chunk_id is removed. Defaults to TRUE

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# return the integer-string chunk IDs
+get_chunk_ids(cars.df)
+#> [1] "1" "2" "3" "4" "5" "6"
+
+# return the file name chunk IDs
+get_chunk_ids(cars.df, full.names = TRUE)
+#> [1] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/1.fst"
+#> [2] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/2.fst"
+#> [3] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/3.fst"
+#> [4] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/4.fst"
+#> [5] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/5.fst"
+#> [6] "C:\\Users\\RTX2080\\AppData\\Local\\Temp\\Rtmp2rQjw5\\file56f46178545a.df/6.fst"
+
+# return the file name chunk IDs with file extension
+get_chunk_ids(cars.df, strip_extension = FALSE)
+#> [1] "1.fst" "2.fst" "3.fst" "4.fst" "5.fst" "6.fst"
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/group_by.html b/docs/reference/group_by.html index c2f6087d..a7d39c8e 100644 --- a/docs/reference/group_by.html +++ b/docs/reference/group_by.html @@ -1,70 +1,15 @@ - - - - - - - -A function to parse the summarize function — summarise.grouped_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -A function to parse the summarize function — summarise.grouped_disk.frame • disk.frame - - - - - - - - - - - + + - - -
-
- -
- -
+
@@ -168,71 +101,60 @@

A function to parse the summarize function

reorganizes the chunks by the shard key.

-
# S3 method for grouped_disk.frame
-summarise(.data, ...)
-
-# S3 method for grouped_disk.frame
-summarize(.data, ...)
-
-# S3 method for disk.frame
-group_by(.data, ..., add = FALSE, .drop = dplyr::group_by_drop_default(.data))
-
-# S3 method for disk.frame
-summarize(.data, ...)
-
-# S3 method for disk.frame
-summarise(.data, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
.data

a disk.frame

...

same as the dplyr::group_by

add

from dplyr

.drop

from dplyr

- -

See also

- -

hard_group_by

+
+
# S3 method for grouped_disk.frame
+summarise(.data, ...)
+
+# S3 method for grouped_disk.frame
+summarize(.data, ...)
+
+# S3 method for disk.frame
+group_by(.data, ..., add = FALSE, .drop = dplyr::group_by_drop_default(.data))
+
+# S3 method for disk.frame
+summarize(.data, ...)
+
+# S3 method for disk.frame
+summarise(.data, ...)
+
+ +
+

Arguments

+
.data
+

a disk.frame

+
...
+

same as the dplyr::group_by

+
add
+

from dplyr

+
.drop
+

from dplyr

+
+
+

See also

+

hard_group_by

+
+
- - - + + diff --git a/docs/reference/groups.disk.frame.html b/docs/reference/groups.disk.frame.html index dbe0e2dd..02be8acf 100644 --- a/docs/reference/groups.disk.frame.html +++ b/docs/reference/groups.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -The shard keys of the disk.frame — groups.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -The shard keys of the disk.frame — groups.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,47 +95,42 @@

The shard keys of the disk.frame

The shard keys of the disk.frame

-
# S3 method for disk.frame
-groups(x)
- -

Arguments

- - - - - - -
x

a disk.frame

- -

Value

+
+
# S3 method for disk.frame
+groups(x)
+
+
+

Arguments

+
x
+

a disk.frame

+
+
+

Value

character

+
+
- - - + + diff --git a/docs/reference/hard_arrange.html b/docs/reference/hard_arrange.html index cb5c473d..c880a71b 100644 --- a/docs/reference/hard_arrange.html +++ b/docs/reference/hard_arrange.html @@ -1,69 +1,14 @@ - - - - - - - -Perform a hard arrange — hard_arrange • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Perform a hard arrange — hard_arrange • disk.frame - - - - - - - - - - + + - - - -
-
- -
- -
+
@@ -166,116 +99,107 @@

Perform a hard arrange

row that share the same `by` value will end up in the same chunk.

-
hard_arrange(df, ..., add = FALSE, .drop = FALSE)
-
-# S3 method for data.frame
-hard_arrange(df, ...)
-
-# S3 method for disk.frame
-hard_arrange(
-  df,
-  ...,
-  outdir = tempfile("tmp_disk_frame_hard_arrange"),
-  nchunks = disk.frame::nchunks(df),
-  overwrite = TRUE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

a disk.frame

...

grouping variables

add

same as dplyr::arrange

.drop

same as dplyr::arrange

outdir

the output directory

nchunks

The number of chunks in the output. Defaults = nchunks.disk.frame(df)

overwrite

overwrite the out put directory

+
+
hard_arrange(df, ..., add = FALSE, .drop = FALSE)
 
+# S3 method for data.frame
+hard_arrange(df, ...)
 
-    

Examples

-
iris.df = as.disk.frame(iris, nchunks = 2) +# S3 method for disk.frame +hard_arrange( + df, + ..., + outdir = tempfile("tmp_disk_frame_hard_arrange"), + nchunks = disk.frame::nchunks(df), + overwrite = TRUE +)
+
-# arrange iris.df by specifies and ensure rows with the same specifies are in the same chunk -iris_hard.df = hard_arrange(iris.df, Species)
#> Appending disk.frames:
-get_chunk(iris_hard.df, 1)
#> # A tibble: 50 x 5 -#> # Groups: Species [1] -#> Sepal.Length Sepal.Width Petal.Length Petal.Width Species -#> <dbl> <dbl> <dbl> <dbl> <fct> -#> 1 6.3 3.3 6 2.5 virginica -#> 2 5.8 2.7 5.1 1.9 virginica -#> 3 7.1 3 5.9 2.1 virginica -#> 4 6.3 2.9 5.6 1.8 virginica -#> 5 6.5 3 5.8 2.2 virginica -#> 6 7.6 3 6.6 2.1 virginica -#> 7 4.9 2.5 4.5 1.7 virginica -#> 8 7.3 2.9 6.3 1.8 virginica -#> 9 6.7 2.5 5.8 1.8 virginica -#> 10 7.2 3.6 6.1 2.5 virginica -#> # ... with 40 more rows
get_chunk(iris_hard.df, 2)
#> # A tibble: 50 x 5 -#> # Groups: Species [1] -#> Sepal.Length Sepal.Width Petal.Length Petal.Width Species -#> <dbl> <dbl> <dbl> <dbl> <fct> -#> 1 6.3 3.3 6 2.5 virginica -#> 2 5.8 2.7 5.1 1.9 virginica -#> 3 7.1 3 5.9 2.1 virginica -#> 4 6.3 2.9 5.6 1.8 virginica -#> 5 6.5 3 5.8 2.2 virginica -#> 6 7.6 3 6.6 2.1 virginica -#> 7 4.9 2.5 4.5 1.7 virginica -#> 8 7.3 2.9 6.3 1.8 virginica -#> 9 6.7 2.5 5.8 1.8 virginica -#> 10 7.2 3.6 6.1 2.5 virginica -#> # ... with 40 more rows
-# clean up cars.df -delete(iris.df) -delete(iris_hard.df)
+
+

Arguments

+
df
+

a disk.frame

+
...
+

grouping variables

+
add
+

same as dplyr::arrange

+
.drop
+

same as dplyr::arrange

+
outdir
+

the output directory

+
nchunks
+

The number of chunks in the output. Defaults = nchunks.disk.frame(df)

+
overwrite
+

overwrite the out put directory

+
+ +
+

Examples

+
iris.df = as.disk.frame(iris, nchunks = 2)
+
+# arrange iris.df by specifies and ensure rows with the same specifies are in the same chunk
+iris_hard.df = hard_arrange(iris.df, Species)
+#> Appending disk.frames: 
+
+get_chunk(iris_hard.df, 1)
+#> # A tibble: 50 x 5
+#> # Groups:   Species [1]
+#>    Sepal.Length Sepal.Width Petal.Length Petal.Width Species  
+#>           <dbl>       <dbl>        <dbl>       <dbl> <fct>    
+#>  1          6.3         3.3          6           2.5 virginica
+#>  2          5.8         2.7          5.1         1.9 virginica
+#>  3          7.1         3            5.9         2.1 virginica
+#>  4          6.3         2.9          5.6         1.8 virginica
+#>  5          6.5         3            5.8         2.2 virginica
+#>  6          7.6         3            6.6         2.1 virginica
+#>  7          4.9         2.5          4.5         1.7 virginica
+#>  8          7.3         2.9          6.3         1.8 virginica
+#>  9          6.7         2.5          5.8         1.8 virginica
+#> 10          7.2         3.6          6.1         2.5 virginica
+#> # ... with 40 more rows
+get_chunk(iris_hard.df, 2)
+#> # A tibble: 50 x 5
+#> # Groups:   Species [1]
+#>    Sepal.Length Sepal.Width Petal.Length Petal.Width Species  
+#>           <dbl>       <dbl>        <dbl>       <dbl> <fct>    
+#>  1          6.3         3.3          6           2.5 virginica
+#>  2          5.8         2.7          5.1         1.9 virginica
+#>  3          7.1         3            5.9         2.1 virginica
+#>  4          6.3         2.9          5.6         1.8 virginica
+#>  5          6.5         3            5.8         2.2 virginica
+#>  6          7.6         3            6.6         2.1 virginica
+#>  7          4.9         2.5          4.5         1.7 virginica
+#>  8          7.3         2.9          6.3         1.8 virginica
+#>  9          6.7         2.5          5.8         1.8 virginica
+#> 10          7.2         3.6          6.1         2.5 virginica
+#> # ... with 40 more rows
+
+# clean up cars.df
+delete(iris.df)
+delete(iris_hard.df)
+
+
+
- - - + + diff --git a/docs/reference/hard_group_by.html b/docs/reference/hard_group_by.html index 1b6f636c..8dd5247b 100644 --- a/docs/reference/hard_group_by.html +++ b/docs/reference/hard_group_by.html @@ -1,69 +1,14 @@ - - - - - - - -Perform a hard group — hard_group_by • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Perform a hard group — hard_group_by • disk.frame - - - - - - - - - - - + + - - -
-
- -
- -
+
@@ -166,122 +99,108 @@

Perform a hard group

row that share the same `by` value will end up in the same chunk.

-
hard_group_by(df, ..., .add = FALSE, .drop = FALSE)
-
-# S3 method for data.frame
-hard_group_by(df, ..., .add = FALSE, .drop = FALSE)
-
-# S3 method for disk.frame
-hard_group_by(
-  df,
-  ...,
-  outdir = tempfile("tmp_disk_frame_hard_group_by"),
-  nchunks = disk.frame::nchunks(df),
-  overwrite = TRUE,
-  shardby_function = "hash",
-  sort_splits = NULL,
-  desc_vars = NULL,
-  sort_split_sample_size = 100
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

a disk.frame

...

grouping variables

.add

same as dplyr::group_by

.drop

same as dplyr::group_by

outdir

the output directory

nchunks

The number of chunks in the output. Defaults = nchunks.disk.frame(df)

overwrite

overwrite the out put directory

shardby_function

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

sort_splits

for the "sort" shardby function, a dataframe with the split values.

desc_vars

for the "sort" shardby function, the variables to sort descending.

sort_split_sample_size

for the "sort" shardby function, if sort_splits is null, the number of rows to sample per chunk for random splits.

- - -

Examples

-
iris.df = as.disk.frame(iris, nchunks = 2) +
+
hard_group_by(df, ..., .add = FALSE, .drop = FALSE)
+
+# S3 method for data.frame
+hard_group_by(df, ..., .add = FALSE, .drop = FALSE)
+
+# S3 method for disk.frame
+hard_group_by(
+  df,
+  ...,
+  outdir = tempfile("tmp_disk_frame_hard_group_by"),
+  nchunks = disk.frame::nchunks(df),
+  overwrite = TRUE,
+  shardby_function = "hash",
+  sort_splits = NULL,
+  desc_vars = NULL,
+  sort_split_sample_size = 100
+)
+
-# group_by iris.df by specifies and ensure rows with the same specifies are in the same chunk -iris_hard.df = hard_group_by(iris.df, Species)
#> Hashing...
#> Hashing...
#> Appending disk.frames:
-get_chunk(iris_hard.df, 1)
#> # A tibble: 150 x 5 -#> # Groups: Species [3] -#> Sepal.Length Sepal.Width Petal.Length Petal.Width Species -#> <dbl> <dbl> <dbl> <dbl> <fct> -#> 1 5.1 3.5 1.4 0.2 setosa -#> 2 4.9 3 1.4 0.2 setosa -#> 3 4.7 3.2 1.3 0.2 setosa -#> 4 4.6 3.1 1.5 0.2 setosa -#> 5 5 3.6 1.4 0.2 setosa -#> 6 5.4 3.9 1.7 0.4 setosa -#> 7 4.6 3.4 1.4 0.3 setosa -#> 8 5 3.4 1.5 0.2 setosa -#> 9 4.4 2.9 1.4 0.2 setosa -#> 10 4.9 3.1 1.5 0.1 setosa -#> # ... with 140 more rows
get_chunk(iris_hard.df, 2)
#> Warning: The chunk NA does not exist; returning an empty data.table
#> Null data.table (0 rows and 0 cols)
-# clean up cars.df -delete(iris.df) -delete(iris_hard.df)
+
+

Arguments

+
df
+

a disk.frame

+
...
+

grouping variables

+
.add
+

same as dplyr::group_by

+
.drop
+

same as dplyr::group_by

+
outdir
+

the output directory

+
nchunks
+

The number of chunks in the output. Defaults = nchunks.disk.frame(df)

+
overwrite
+

overwrite the out put directory

+
shardby_function
+

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

+
sort_splits
+

for the "sort" shardby function, a dataframe with the split values.

+
desc_vars
+

for the "sort" shardby function, the variables to sort descending.

+
sort_split_sample_size
+

for the "sort" shardby function, if sort_splits is null, the number of rows to sample per chunk for random splits.

+
+ +
+

Examples

+
iris.df = as.disk.frame(iris, nchunks = 2)
+
+# group_by iris.df by specifies and ensure rows with the same specifies are in the same chunk
+iris_hard.df = hard_group_by(iris.df, Species)
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+
+get_chunk(iris_hard.df, 1)
+#> # A tibble: 150 x 5
+#> # Groups:   Species [3]
+#>    Sepal.Length Sepal.Width Petal.Length Petal.Width Species
+#>           <dbl>       <dbl>        <dbl>       <dbl> <fct>  
+#>  1          5.1         3.5          1.4         0.2 setosa 
+#>  2          4.9         3            1.4         0.2 setosa 
+#>  3          4.7         3.2          1.3         0.2 setosa 
+#>  4          4.6         3.1          1.5         0.2 setosa 
+#>  5          5           3.6          1.4         0.2 setosa 
+#>  6          5.4         3.9          1.7         0.4 setosa 
+#>  7          4.6         3.4          1.4         0.3 setosa 
+#>  8          5           3.4          1.5         0.2 setosa 
+#>  9          4.4         2.9          1.4         0.2 setosa 
+#> 10          4.9         3.1          1.5         0.1 setosa 
+#> # ... with 140 more rows
+get_chunk(iris_hard.df, 2)
+#> Warning: The chunk NA does not exist; returning an empty data.table
+#> Null data.table (0 rows and 0 cols)
+
+# clean up cars.df
+delete(iris.df)
+delete(iris_hard.df)
+
+
+
- - - + + diff --git a/docs/reference/head_tail.html b/docs/reference/head_tail.html index da4adf74..6312a2b2 100644 --- a/docs/reference/head_tail.html +++ b/docs/reference/head_tail.html @@ -1,67 +1,12 @@ - - - - - - - -Head and tail of the disk.frame — head.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Head and tail of the disk.frame — head.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,71 +95,68 @@

Head and tail of the disk.frame

Head and tail of the disk.frame

-
# S3 method for disk.frame
-head(x, n = 6L, ...)
-
-# S3 method for disk.frame
-tail(x, n = 6L, ...)
- -

Arguments

- - - - - - - - - - - - - - -
x

a disk.frame

n

number of rows to include

...

passed to base::head or base::tail

- - -

Examples

-
cars.df = as.disk.frame(cars) -head(cars.df)
#> speed dist -#> 1: 4 2 -#> 2: 4 10 -#> 3: 7 4 -#> 4: 7 22 -#> 5: 8 16 -#> 6: 9 10
tail(cars.df)
#> speed dist -#> 1: 24 70 -#> 2: 24 92 -#> 3: 24 93 -#> 4: 24 120 -#> 5: 25 85
-# clean up -delete(cars.df)
+
+
# S3 method for disk.frame
+head(x, n = 6L, ...)
+
+# S3 method for disk.frame
+tail(x, n = 6L, ...)
+
+ +
+

Arguments

+
x
+

a disk.frame

+
n
+

number of rows to include

+
...
+

passed to base::head or base::tail

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+head(cars.df)
+#>    speed dist
+#> 1:     4    2
+#> 2:     4   10
+#> 3:     7    4
+#> 4:     7   22
+#> 5:     8   16
+#> 6:     9   10
+tail(cars.df)
+#>    speed dist
+#> 1:    24   70
+#> 2:    24   92
+#> 3:    24   93
+#> 4:    24  120
+#> 5:    25   85
+
+# clean up 
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/index.html b/docs/reference/index.html index 7a9bcfdc..482f042c 100644 --- a/docs/reference/index.html +++ b/docs/reference/index.html @@ -1,66 +1,12 @@ - - - - - - - -Function reference • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Function reference • disk.frame - + + - - - -
-
- -
- -
+
- - - - - - - - - - -
-

All functions

+ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
+

All functions

+

add_chunk()

Add a chunk to the disk.frame

+

as.data.frame(<disk.frame>)

Convert disk.frame to data.frame by collecting all chunks

+

as.data.table(<disk.frame>)

Convert disk.frame to data.table by collecting all chunks

+

as.disk.frame()

Make a data.frame into a disk.frame

+

chunk_summarize() chunk_summarise() chunk_group_by() chunk_ungroup()

Group by within each disk.frame

+

cmap() cmap_dfr() cimap() cimap_dfr() lazy() delayed() chunk_lapply() map() imap_dfr() imap() map_dfr(<disk.frame>) map_dfr(<default>)

Apply the same function to all chunks

+

cmap2() map2() map_by_chunk_id()

`cmap2` a function to two disk.frames

+

collect(<disk.frame>) collect_list() collect(<summarized_disk.frame>)

Bring the disk.frame into R

+

colnames() names(<disk.frame>)

Return the column names of the disk.frame

+

compute(<disk.frame>)

Compute without writing

+

create_chunk_mapper()

Create function that applies to each chunk if disk.frame

-

create_dplyr_mapper()

-

Kept for backwards-compatibility to be removed in 0.3

+

csv_to_disk.frame()

Convert CSV file(s) to disk.frame format

+

delete()

Delete a disk.frame

+

dfglm()

Fit generalized linear models (glm) with disk.frame

+

df_ram_size()

Get the size of RAM in gigabytes

+

disk.frame()

Create a disk.frame from a folder

-

select(<disk.frame>) rename(<disk.frame>) filter(<disk.frame>) mutate(<disk.frame>) transmute(<disk.frame>) arrange(<disk.frame>) chunk_arrange() tally.disk.frame() count.disk.frame() add_count.disk.frame() add_tally.disk.frame() do(<disk.frame>) distinct(<disk.frame>) chunk_distinct() glimpse(<disk.frame>)

+
+

select(<disk.frame>) rename(<disk.frame>) filter(<disk.frame>) mutate(<disk.frame>) transmute(<disk.frame>) arrange(<disk.frame>) chunk_arrange() add_tally.disk.frame() do(<disk.frame>) distinct(<disk.frame>) chunk_distinct() glimpse(<disk.frame>)

The dplyr verbs implemented for disk.frame

+

evalparseglue()

Helper function to evalparse some `glue::glue` string

+

foverlaps.disk.frame()

Apply data.table's foverlaps to the disk.frame

+

gen_datatable_synthetic()

Generate synthetic dataset for testing

+

get_chunk()

Obtain one chunk by chunk id

+

get_chunk_ids()

Get the chunk IDs and files names

+

groups(<disk.frame>)

The shard keys of the disk.frame

+

summarise(<grouped_disk.frame>) summarize(<grouped_disk.frame>) group_by(<disk.frame>) summarize(<disk.frame>) summarise(<disk.frame>)

A function to parse the summarize function

+

hard_arrange()

Perform a hard arrange

+

hard_group_by()

Perform a hard group

+

head(<disk.frame>) tail(<disk.frame>)

Head and tail of the disk.frame

+

is_disk.frame()

Checks if a folder is a disk.frame

+

anti_join(<disk.frame>) full_join(<disk.frame>) inner_join(<disk.frame>) left_join(<disk.frame>) semi_join(<disk.frame>)

Performs join/merge for disk.frames

+

make_glm_streaming_fn()

A streaming function for speedglm

+

merge(<disk.frame>)

Merge function for disk.frames

+

move_to() copy_df_to()

Move or copy a disk.frame to another location

+

nchunks() nchunk()

Returns the number of chunks in a disk.frame

+

nrow() ncol()

Number of rows or columns

+

var_df.chunk_agg.disk.frame() var_df.collected_agg.disk.frame() sd_df.chunk_agg.disk.frame() sd_df.collected_agg.disk.frame() mean_df.chunk_agg.disk.frame() mean_df.collected_agg.disk.frame() sum_df.chunk_agg.disk.frame() sum_df.collected_agg.disk.frame() min_df.chunk_agg.disk.frame() min_df.collected_agg.disk.frame() max_df.chunk_agg.disk.frame() max_df.collected_agg.disk.frame() median_df.chunk_agg.disk.frame() median_df.collected_agg.disk.frame() n_df.chunk_agg.disk.frame() n_df.collected_agg.disk.frame() length_df.chunk_agg.disk.frame() length_df.collected_agg.disk.frame() any_df.chunk_agg.disk.frame() any_df.collected_agg.disk.frame() all_df.chunk_agg.disk.frame() all_df.collected_agg.disk.frame() n_distinct_df.chunk_agg.disk.frame() n_distinct_df.collected_agg.disk.frame() quantile_df.chunk_agg.disk.frame() quantile_df.collected_agg.disk.frame() IQR_df.chunk_agg.disk.frame() IQR_df.collected_agg.disk.frame()

One Stage function

+

overwrite_check()

Check if the outdir exists or not

+

print(<disk.frame>)

Print disk.frame

+

pull(<disk.frame>)

Pull a column from table similar to `dplyr::pull`.

+

rbindlist.disk.frame()

rbindlist disk.frames together

+

rechunk()

Increase or decrease the number of chunks in the disk.frame

+

recommend_nchunks()

Recommend number of chunks based on input size

+

remove_chunk()

Removes a chunk from the disk.frame

+

sample_frac(<disk.frame>)

Sample n rows from a disk.frame

+

setup_disk.frame()

Set up disk.frame environment

+

shard() distribute()

Shard a data.frame/data.table or disk.frame into chunk and saves it into a disk.frame

+

shardkey()

Returns the shardkey (not implemented yet)

+

shardkey_equal()

Compare two disk.frame shardkeys

+

show_ceremony() ceremony_text() show_boilerplate() insert_ceremony()

Show the code to setup disk.frame

+

srckeep() srckeepchunks()

Keep only the variables from the input listed in selections

+

`[`(<disk.frame>)

[ interface for disk.frame using fst backend

+

tbl_vars(<disk.frame>) group_vars(<disk.frame>)

Column names for RStudio auto-complete

+

write_disk.frame() output_disk.frame()

Write disk.frame to disk

+

zip_to_disk.frame()

`zip_to_disk.frame` is used to read and convert every CSV file within the zip file to disk.frame format

- +
+
-
- +
- - + + diff --git a/docs/reference/is_disk.frame.html b/docs/reference/is_disk.frame.html index 3b294687..c56ab38f 100644 --- a/docs/reference/is_disk.frame.html +++ b/docs/reference/is_disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Checks if a folder is a disk.frame — is_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Checks if a folder is a disk.frame — is_disk.frame • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,49 +95,50 @@

Checks if a folder is a disk.frame

Checks if a folder is a disk.frame

-
is_disk.frame(df)
- -

Arguments

- - - - - - -
df

a disk.frame or directory to check

- - -

Examples

-
cars.df = as.disk.frame(cars) +
+
is_disk.frame(df)
+
-is_disk.frame(cars) # FALSE
#> [1] FALSE
is_disk.frame(cars.df) # TRUE
#> [1] TRUE
-# clean up cars.df -delete(cars.df)
+
+

Arguments

+
df
+

a disk.frame or directory to check

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+is_disk.frame(cars) # FALSE
+#> [1] FALSE
+is_disk.frame(cars.df) # TRUE
+#> [1] TRUE
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/join.html b/docs/reference/join.html index 3caac2ed..6bdc7ff7 100644 --- a/docs/reference/join.html +++ b/docs/reference/join.html @@ -1,67 +1,12 @@ - - - - - - - -Performs join/merge for disk.frames — anti_join.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Performs join/merge for disk.frames — anti_join.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,179 +95,208 @@

Performs join/merge for disk.frames

Performs join/merge for disk.frames

-
# S3 method for disk.frame
-anti_join(
-  x,
-  y,
-  by = NULL,
-  copy = FALSE,
-  ...,
-  outdir = tempfile("tmp_disk_frame_anti_join"),
-  merge_by_chunk_id = FALSE,
-  overwrite = TRUE,
-  .progress = FALSE
-)
-
-# S3 method for disk.frame
-full_join(
-  x,
-  y,
-  by = NULL,
-  copy = FALSE,
-  ...,
-  outdir = tempfile("tmp_disk_frame_full_join"),
-  overwrite = TRUE,
-  merge_by_chunk_id,
-  .progress = FALSE
-)
-
-# S3 method for disk.frame
-inner_join(
-  x,
-  y,
-  by = NULL,
-  copy = FALSE,
-  ...,
-  outdir = tempfile("tmp_disk_frame_inner_join"),
-  merge_by_chunk_id = NULL,
-  overwrite = TRUE,
-  .progress = FALSE
-)
-
-# S3 method for disk.frame
-left_join(
-  x,
-  y,
-  by = NULL,
-  copy = FALSE,
-  ...,
-  outdir = tempfile("tmp_disk_frame_left_join"),
-  merge_by_chunk_id = FALSE,
-  overwrite = TRUE,
-  .progress = FALSE
-)
-
-# S3 method for disk.frame
-semi_join(
-  x,
-  y,
-  by = NULL,
-  copy = FALSE,
-  ...,
-  outdir = tempfile("tmp_disk_frame_semi_join"),
-  merge_by_chunk_id = FALSE,
-  overwrite = TRUE,
-  .progress = FALSE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
x

a disk.frame

y

a data.frame or disk.frame. If data.frame then returns lazily; if disk.frame it performs the join eagerly and return a disk.frame

by

join by

copy

same as dplyr::anti_join

...

same as dplyr's joins

outdir

output directory for disk.frame

merge_by_chunk_id

the merge is performed by chunk id

overwrite

overwrite output directory

.progress

Show progress or not. Defaults to FALSE

- -

Value

+
+
# S3 method for disk.frame
+anti_join(
+  x,
+  y,
+  by = NULL,
+  copy = FALSE,
+  ...,
+  outdir = tempfile("tmp_disk_frame_anti_join"),
+  merge_by_chunk_id = FALSE,
+  overwrite = TRUE,
+  .progress = FALSE
+)
+
+# S3 method for disk.frame
+full_join(
+  x,
+  y,
+  by = NULL,
+  copy = FALSE,
+  ...,
+  outdir = tempfile("tmp_disk_frame_full_join"),
+  overwrite = TRUE,
+  merge_by_chunk_id,
+  .progress = FALSE
+)
+
+# S3 method for disk.frame
+inner_join(
+  x,
+  y,
+  by = NULL,
+  copy = FALSE,
+  ...,
+  outdir = tempfile("tmp_disk_frame_inner_join"),
+  merge_by_chunk_id = NULL,
+  overwrite = TRUE,
+  .progress = FALSE
+)
+
+# S3 method for disk.frame
+left_join(
+  x,
+  y,
+  by = NULL,
+  copy = FALSE,
+  ...,
+  outdir = tempfile("tmp_disk_frame_left_join"),
+  merge_by_chunk_id = FALSE,
+  overwrite = TRUE,
+  .progress = FALSE
+)
+
+# S3 method for disk.frame
+semi_join(
+  x,
+  y,
+  by = NULL,
+  copy = FALSE,
+  ...,
+  outdir = tempfile("tmp_disk_frame_semi_join"),
+  merge_by_chunk_id = FALSE,
+  overwrite = TRUE,
+  .progress = FALSE
+)
+
+
+

Arguments

+
x
+

a disk.frame

+
y
+

a data.frame or disk.frame. If data.frame then returns lazily; if disk.frame it performs the join eagerly and return a disk.frame

+
by
+

join by

+
copy
+

same as dplyr::anti_join

+
...
+

same as dplyr's joins

+
outdir
+

output directory for disk.frame

+
merge_by_chunk_id
+

the merge is performed by chunk id

+
overwrite
+

overwrite output directory

+
.progress
+

Show progress or not. Defaults to FALSE

+
+
+

Value

disk.frame or data.frame/data.table

+
-

Examples

-
df.df = as.disk.frame(data.frame(x = 1:3, y = 4:6), overwrite = TRUE) -df2.df = as.disk.frame(data.frame(x = 1:2, z = 10:11), overwrite = TRUE) - -anti_joined.df = anti_join(df.df, df2.df)
#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
#> Hashing...
#> Hashing...
#> Appending disk.frames:
-anti_joined.df %>% collect
#> x y -#> 1: 3 6
-anti_joined.data.frame = anti_join(df.df, data.frame(x = 1:2, z = 10:11))
#> Joining, by = "x"
#> Joining, by = "x"
#> Joining, by = "x"
-# clean up -delete(df.df) -delete(df2.df) -delete(anti_joined.df) -cars.df = as.disk.frame(cars) - -join.df = full_join(cars.df, cars.df, merge_by_chunk_id = TRUE) - -# clean up cars.df -delete(cars.df) -delete(join.df) -cars.df = as.disk.frame(cars) - -join.df = inner_join(cars.df, cars.df, merge_by_chunk_id = TRUE) - -# clean up cars.df -delete(cars.df) -delete(join.df) -cars.df = as.disk.frame(cars) - -join.df = left_join(cars.df, cars.df)
#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
-# clean up cars.df -delete(cars.df) -delete(join.df) -cars.df = as.disk.frame(cars) - -join.df = semi_join(cars.df, cars.df)
#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
-# clean up cars.df -delete(cars.df) -delete(join.df)
+
+

Examples

+
df.df = as.disk.frame(data.frame(x = 1:3, y = 4:6), overwrite = TRUE)
+df2.df = as.disk.frame(data.frame(x = 1:2, z = 10:11), overwrite = TRUE)
+
+anti_joined.df = anti_join(df.df, df2.df) 
+#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+
+anti_joined.df %>% collect
+#>    x y
+#> 1: 3 6
+
+anti_joined.data.frame = anti_join(df.df, data.frame(x = 1:2, z = 10:11))
+#> Joining, by = "x"
+#> Joining, by = "x"
+#> Joining, by = "x"
+
+# clean up
+delete(df.df)
+delete(df2.df)
+delete(anti_joined.df)
+cars.df = as.disk.frame(cars)
+
+join.df = full_join(cars.df, cars.df, merge_by_chunk_id = TRUE)
+
+# clean up cars.df
+delete(cars.df)
+delete(join.df)
+cars.df = as.disk.frame(cars)
+
+join.df = inner_join(cars.df, cars.df, merge_by_chunk_id = TRUE)
+
+# clean up cars.df
+delete(cars.df)
+delete(join.df)
+cars.df = as.disk.frame(cars)
+
+join.df = left_join(cars.df, cars.df)
+#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+
+# clean up cars.df
+delete(cars.df)
+delete(join.df)
+cars.df = as.disk.frame(cars)
+
+join.df = semi_join(cars.df, cars.df)
+#> Warning: merge_by_chunk_id = FALSE. This will take significantly longer and the preparations needed are performed eagerly which may lead to poor performance. Consider making y a data.frame or set merge_by_chunk_id = TRUE for better performance.
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+
+# clean up cars.df
+delete(cars.df)
+delete(join.df)
+
+
+
- - - + + diff --git a/docs/reference/make_glm_streaming_fn.html b/docs/reference/make_glm_streaming_fn.html index e6df5579..91b68bc6 100644 --- a/docs/reference/make_glm_streaming_fn.html +++ b/docs/reference/make_glm_streaming_fn.html @@ -1,67 +1,12 @@ - - - - - - - -A streaming function for speedglm — make_glm_streaming_fn • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -A streaming function for speedglm — make_glm_streaming_fn • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,118 +95,116 @@

A streaming function for speedglm

Define a function that can be used to feed data into speedglm and biglm

-
make_glm_streaming_fn(data, verbose = FALSE)
- -

Arguments

- - - - - - - - - - -
data

a disk.frame

verbose

Whether to print the status of data loading. Default to FALSE

- -

Value

+
+
make_glm_streaming_fn(data, verbose = FALSE)
+
+
+

Arguments

+
data
+

a disk.frame

+
verbose
+

Whether to print the status of data loading. Default to FALSE

+
+
+

Value

return a function, fn, that can be used as the data argument in biglm::bigglm or speedglm::shglm

-

See also

- -

Other Machine Learning (ML): -dfglm()

- -

Examples

-
cars.df = as.disk.frame(cars) -streamacq = make_glm_streaming_fn(cars.df, verbose = FALSE) +
+
+

See also

+

Other Machine Learning (ML): +dfglm()

+
-majorv = as.integer(version$major) -minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1]) -if(((majorv == 3) & (minorv >= 6)) | (majorv > 3)) { - m = biglm::bigglm(dist ~ speed, data = streamacq) - summary(m) - predict(m, get_chunk(cars.df, 1)) - predict(m, collect(cars.df, 1)) -} else { - m = speedglm::shglm(dist ~ speed, data = streamacq) -}
#> [,1] -#> 1 -1.849460 -#> 2 -1.849460 -#> 3 9.947766 -#> 4 9.947766 -#> 5 13.880175 -#> 6 17.812584 -#> 7 21.744993 -#> 8 21.744993 -#> 9 21.744993 -#> 10 25.677401 -#> 11 25.677401 -#> 12 29.609810 -#> 13 29.609810 -#> 14 29.609810 -#> 15 29.609810 -#> 16 33.542219 -#> 17 33.542219 -#> 18 33.542219 -#> 19 33.542219 -#> 20 37.474628 -#> 21 37.474628 -#> 22 37.474628 -#> 23 37.474628 -#> 24 41.407036 -#> 25 41.407036 -#> 26 41.407036 -#> 27 45.339445 -#> 28 45.339445 -#> 29 49.271854 -#> 30 49.271854 -#> 31 49.271854 -#> 32 53.204263 -#> 33 53.204263 -#> 34 53.204263 -#> 35 53.204263 -#> 36 57.136672 -#> 37 57.136672 -#> 38 57.136672 -#> 39 61.069080 -#> 40 61.069080 -#> 41 61.069080 -#> 42 61.069080 -#> 43 61.069080 -#> 44 68.933898 -#> 45 72.866307 -#> 46 76.798715 -#> 47 76.798715 -#> 48 76.798715 -#> 49 76.798715 -#> 50 80.731124
+
+

Examples

+
cars.df = as.disk.frame(cars)
+streamacq = make_glm_streaming_fn(cars.df, verbose = FALSE)
+
+majorv = as.integer(version$major)
+minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1])
+if(((majorv == 3) & (minorv >= 6)) | (majorv > 3)) {
+  m = biglm::bigglm(dist ~ speed, data = streamacq)
+  summary(m)
+  predict(m, get_chunk(cars.df, 1))
+  predict(m, collect(cars.df, 1))
+} else {
+  m = speedglm::shglm(dist ~ speed, data = streamacq)
+}
+#>         [,1]
+#> 1  -1.849460
+#> 2  -1.849460
+#> 3   9.947766
+#> 4   9.947766
+#> 5  13.880175
+#> 6  17.812584
+#> 7  21.744993
+#> 8  21.744993
+#> 9  21.744993
+#> 10 25.677401
+#> 11 25.677401
+#> 12 29.609810
+#> 13 29.609810
+#> 14 29.609810
+#> 15 29.609810
+#> 16 33.542219
+#> 17 33.542219
+#> 18 33.542219
+#> 19 33.542219
+#> 20 37.474628
+#> 21 37.474628
+#> 22 37.474628
+#> 23 37.474628
+#> 24 41.407036
+#> 25 41.407036
+#> 26 41.407036
+#> 27 45.339445
+#> 28 45.339445
+#> 29 49.271854
+#> 30 49.271854
+#> 31 49.271854
+#> 32 53.204263
+#> 33 53.204263
+#> 34 53.204263
+#> 35 53.204263
+#> 36 57.136672
+#> 37 57.136672
+#> 38 57.136672
+#> 39 61.069080
+#> 40 61.069080
+#> 41 61.069080
+#> 42 61.069080
+#> 43 61.069080
+#> 44 68.933898
+#> 45 72.866307
+#> 46 76.798715
+#> 47 76.798715
+#> 48 76.798715
+#> 49 76.798715
+#> 50 80.731124
+
+
+
- - - + + diff --git a/docs/reference/merge.disk.frame.html b/docs/reference/merge.disk.frame.html index 7e9d9792..26cafba5 100644 --- a/docs/reference/merge.disk.frame.html +++ b/docs/reference/merge.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Merge function for disk.frames — merge.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Merge function for disk.frames — merge.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,85 +95,70 @@

Merge function for disk.frames

Merge function for disk.frames

-
# S3 method for disk.frame
-merge(
-  x,
-  y,
-  by,
-  outdir = tempfile(fileext = ".df"),
-  ...,
-  merge_by_chunk_id = FALSE,
-  overwrite = FALSE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
x

a disk.frame

y

a disk.frame or data.frame

by

the merge by keys

outdir

The output directory for the disk.frame

...

passed to merge and cmap.disk.frame

merge_by_chunk_id

if TRUE then only chunks in df1 and df2 with the same chunk id will get merged

overwrite

overwrite the outdir or not

- - -

Examples

-
b = as.disk.frame(data.frame(a = 51:150, b = 1:100)) -d = as.disk.frame(data.frame(a = 151:250, b = 1:100)) -bd.df = merge(b, d, by = "b", merge_by_chunk_id = TRUE) - -# clean up cars.df -delete(b) -delete(d) -delete(bd.df)
+
+
# S3 method for disk.frame
+merge(
+  x,
+  y,
+  by,
+  outdir = tempfile(fileext = ".df"),
+  ...,
+  merge_by_chunk_id = FALSE,
+  overwrite = FALSE
+)
+
+ +
+

Arguments

+
x
+

a disk.frame

+
y
+

a disk.frame or data.frame

+
by
+

the merge by keys

+
outdir
+

The output directory for the disk.frame

+
...
+

passed to merge and cmap.disk.frame

+
merge_by_chunk_id
+

if TRUE then only chunks in df1 and df2 with the same chunk id will get merged

+
overwrite
+

overwrite the outdir or not

+
+ +
+

Examples

+
b = as.disk.frame(data.frame(a = 51:150, b = 1:100))
+d = as.disk.frame(data.frame(a = 151:250, b = 1:100))
+bd.df = merge(b, d, by = "b", merge_by_chunk_id = TRUE)
+
+# clean up cars.df
+delete(b)
+delete(d)
+delete(bd.df)
+
+
+
- - - + + diff --git a/docs/reference/move_to.html b/docs/reference/move_to.html index 4755299f..9037467e 100644 --- a/docs/reference/move_to.html +++ b/docs/reference/move_to.html @@ -1,67 +1,12 @@ - - - - - - - -Move or copy a disk.frame to another location — move_to • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Move or copy a disk.frame to another location — move_to • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,70 +95,62 @@

Move or copy a disk.frame to another location

Move or copy a disk.frame to another location

-
move_to(df, outdir, ..., copy = FALSE)
-
-copy_df_to(df, outdir, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
df

The disk.frame

outdir

The new location

...

NOT USED

copy

Merely copy and not move

- -

Value

- -

a disk.frame

+
+
move_to(df, outdir, ..., copy = FALSE)
 
-    

Examples

-
cars.df = as.disk.frame(cars) - -cars_copy.df = copy_df_to(cars.df, outdir = tempfile(fileext=".df")) +copy_df_to(df, outdir, ...)
+
-cars2.df = move_to(cars.df, outdir = tempfile(fileext=".df")) +
+

Arguments

+
df
+

The disk.frame

+
outdir
+

The new location

+
...
+

NOT USED

+
copy
+

Merely copy and not move

+
+
+

Value

+

a disk.frame

+
-# clean up -delete(cars_copy.df) -delete(cars2.df)
+
+

Examples

+
cars.df = as.disk.frame(cars)
+
+cars_copy.df = copy_df_to(cars.df, outdir = tempfile(fileext=".df"))
+
+cars2.df = move_to(cars.df, outdir = tempfile(fileext=".df"))
+
+# clean up
+delete(cars_copy.df)
+delete(cars2.df)
+
+
+
- - - + + diff --git a/docs/reference/nchunks.html b/docs/reference/nchunks.html index 19440550..988619c1 100644 --- a/docs/reference/nchunks.html +++ b/docs/reference/nchunks.html @@ -1,67 +1,12 @@ - - - - - - - -Returns the number of chunks in a disk.frame — nchunks • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Returns the number of chunks in a disk.frame — nchunks • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,66 +95,63 @@

Returns the number of chunks in a disk.frame

Returns the number of chunks in a disk.frame

-
nchunks(df, ...)
-
-nchunk(df, ...)
-
-# S3 method for disk.frame
-nchunk(df, ...)
-
-# S3 method for disk.frame
-nchunks(df, skip.ready.check = FALSE, ...)
- -

Arguments

- - - - - - - - - - - - - - -
df

a disk.frame

...

not used

skip.ready.check

NOT implemented

- - -

Examples

-
cars.df = as.disk.frame(cars) - -# return the number of chunks -nchunks(cars.df)
#> [1] 6
nchunk(cars.df)
#> [1] 6
-# clean up cars.df -delete(cars.df)
+
+
nchunks(df, ...)
+
+nchunk(df, ...)
+
+# S3 method for disk.frame
+nchunk(df, ...)
+
+# S3 method for disk.frame
+nchunks(df, skip.ready.check = FALSE, ...)
+
+ +
+

Arguments

+
df
+

a disk.frame

+
...
+

not used

+
skip.ready.check
+

NOT implemented

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# return the number of chunks
+nchunks(cars.df)
+#> [1] 6
+nchunk(cars.df)
+#> [1] 6
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/ncol_nrow.html b/docs/reference/ncol_nrow.html index 3b071e74..a8a9d09a 100644 --- a/docs/reference/ncol_nrow.html +++ b/docs/reference/ncol_nrow.html @@ -1,67 +1,12 @@ - - - - - - - -Number of rows or columns — nrow • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Number of rows or columns — nrow • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,62 +95,61 @@

Number of rows or columns

Number of rows or columns

-
nrow(df, ...)
-
-# S3 method for disk.frame
-nrow(df, ...)
-
-ncol(df)
-
-# S3 method for disk.frame
-ncol(df)
+
+
nrow(df, ...)
 
-    

Arguments

- - - - - - - - - - -
df

a disk.frame

...

passed to base::nrow

+# S3 method for disk.frame +nrow(df, ...) +ncol(df) -

Examples

-
cars.df = as.disk.frame(cars) +# S3 method for disk.frame +ncol(df)
+
-# return total number of column and rows -ncol(cars.df)
#> [1] 2
nrow(cars.df)
#> [1] 50
-# clean up cars.df -delete(cars.df)
+
+

Arguments

+
df
+

a disk.frame

+
...
+

passed to base::nrow

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# return total number of column and rows
+ncol(cars.df)
+#> [1] 2
+nrow(cars.df)
+#> [1] 50
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/one-stage-group-by-verbs.html b/docs/reference/one-stage-group-by-verbs.html index 5aa4d240..22b7a93c 100644 --- a/docs/reference/one-stage-group-by-verbs.html +++ b/docs/reference/one-stage-group-by-verbs.html @@ -1,69 +1,14 @@ - - - - - - - -One Stage function — var_df.chunk_agg.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -One Stage function — var_df.chunk_agg.disk.frame • disk.frame - - - - - - - - - - - + + - - -
-
- -
- -
+
@@ -166,109 +99,97 @@

One Stage function

mean collected_agg

-
var_df.chunk_agg.disk.frame(x, na.rm = FALSE)
+    
+
var_df.chunk_agg.disk.frame(x, na.rm = FALSE)
 
-var_df.collected_agg.disk.frame(listx)
+var_df.collected_agg.disk.frame(listx)
 
-sd_df.chunk_agg.disk.frame(x, na.rm = FALSE)
+sd_df.chunk_agg.disk.frame(x, na.rm = FALSE)
 
-sd_df.collected_agg.disk.frame(listx)
+sd_df.collected_agg.disk.frame(listx)
 
-mean_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
+mean_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
 
-mean_df.collected_agg.disk.frame(listx)
+mean_df.collected_agg.disk.frame(listx)
 
-sum_df.chunk_agg.disk.frame(x, ...)
+sum_df.chunk_agg.disk.frame(x, ...)
 
-sum_df.collected_agg.disk.frame(listx, ...)
+sum_df.collected_agg.disk.frame(listx, ...)
 
-min_df.chunk_agg.disk.frame(x, ...)
+min_df.chunk_agg.disk.frame(x, ...)
 
-min_df.collected_agg.disk.frame(listx, ...)
+min_df.collected_agg.disk.frame(listx, ...)
 
-max_df.chunk_agg.disk.frame(x, ...)
+max_df.chunk_agg.disk.frame(x, ...)
 
-max_df.collected_agg.disk.frame(listx, ...)
+max_df.collected_agg.disk.frame(listx, ...)
 
-median_df.chunk_agg.disk.frame(x, ...)
+median_df.chunk_agg.disk.frame(x, ...)
 
-median_df.collected_agg.disk.frame(listx, ...)
+median_df.collected_agg.disk.frame(listx, ...)
 
-n_df.chunk_agg.disk.frame(...)
+n_df.chunk_agg.disk.frame(...)
 
-n_df.collected_agg.disk.frame(listx, ...)
+n_df.collected_agg.disk.frame(listx, ...)
 
-length_df.chunk_agg.disk.frame(x, ...)
+length_df.chunk_agg.disk.frame(x, ...)
 
-length_df.collected_agg.disk.frame(listx, ...)
+length_df.collected_agg.disk.frame(listx, ...)
 
-any_df.chunk_agg.disk.frame(x, ...)
+any_df.chunk_agg.disk.frame(x, ...)
 
-any_df.collected_agg.disk.frame(listx, ...)
+any_df.collected_agg.disk.frame(listx, ...)
 
-all_df.chunk_agg.disk.frame(x, ...)
+all_df.chunk_agg.disk.frame(x, ...)
 
-all_df.collected_agg.disk.frame(listx, ...)
+all_df.collected_agg.disk.frame(listx, ...)
 
-n_distinct_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
+n_distinct_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
 
-n_distinct_df.collected_agg.disk.frame(listx, ...)
+n_distinct_df.collected_agg.disk.frame(listx, ...)
 
-quantile_df.chunk_agg.disk.frame(x, ...)
+quantile_df.chunk_agg.disk.frame(x, ...)
 
-quantile_df.collected_agg.disk.frame(listx, ...)
+quantile_df.collected_agg.disk.frame(listx, ...)
 
-IQR_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
+IQR_df.chunk_agg.disk.frame(x, na.rm = FALSE, ...)
 
-IQR_df.collected_agg.disk.frame(listx, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
x

the input

na.rm

Remove NAs. TRUE of FALSE

listx

a list

...

additional options

+IQR_df.collected_agg.disk.frame(listx, ...)
+
+
+

Arguments

+
x
+

the input

+
na.rm
+

Remove NAs. TRUE of FALSE

+
listx
+

a list

+
...
+

additional options

+
+ - - - + + diff --git a/docs/reference/overwrite_check.html b/docs/reference/overwrite_check.html index 235c9466..f4d07be2 100644 --- a/docs/reference/overwrite_check.html +++ b/docs/reference/overwrite_check.html @@ -1,67 +1,12 @@ - - - - - - - -Check if the outdir exists or not — overwrite_check • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Check if the outdir exists or not — overwrite_check • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,54 +95,49 @@

Check if the outdir exists or not

If the overwrite is TRUE then the folder will be deleted, otherwise the folder will be created.

-
overwrite_check(outdir, overwrite)
- -

Arguments

- - - - - - - - - - -
outdir

the output directory

overwrite

TRUE or FALSE if `outdir`` exists and overwrite = FALSE then throw an error

- - -

Examples

-
tf = tempfile() -overwrite_check(tf, overwrite = FALSE) -overwrite_check(tf, overwrite = TRUE) - -# clean up -fs::dir_delete(tf)
+
+
overwrite_check(outdir, overwrite)
+
+ +
+

Arguments

+
outdir
+

the output directory

+
overwrite
+

TRUE or FALSE if `outdir`` exists and overwrite = FALSE then throw an error

+
+ +
+

Examples

+
tf = tempfile()
+overwrite_check(tf, overwrite = FALSE)
+overwrite_check(tf, overwrite = TRUE)
+
+# clean up
+fs::dir_delete(tf)
+
+
+
- - - + + diff --git a/docs/reference/print.disk.frame.html b/docs/reference/print.disk.frame.html index b8402b06..a0ef8db4 100644 --- a/docs/reference/print.disk.frame.html +++ b/docs/reference/print.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Print disk.frame — print.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Print disk.frame — print.disk.frame • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,48 +95,40 @@

Print disk.frame

a new print method for disk.frame

-
# S3 method for disk.frame
-print(x, ...)
- -

Arguments

- - - - - - - - - - -
x

disk.frame

...

not used

+
+
# S3 method for disk.frame
+print(x, ...)
+
+
+

Arguments

+
x
+

disk.frame

+
...
+

not used

+
+
- - - + + diff --git a/docs/reference/pull.disk.frame.html b/docs/reference/pull.disk.frame.html index e22e0329..ff438239 100644 --- a/docs/reference/pull.disk.frame.html +++ b/docs/reference/pull.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Pull a column from table similar to `dplyr::pull`. — pull.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Pull a column from table similar to `dplyr::pull`. — pull.disk.frame • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,56 +95,44 @@

Pull a column from table similar to `dplyr::pull`.

Pull a column from table similar to `dplyr::pull`.

-
# S3 method for disk.frame
-pull(.data, var = -1, name = NULL, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
.data

The disk.frame

var

can be an positive or negative integer or a character/string. See dplyr::pull documentation

name

See dplyr::pull documentation

...

Not used, kept for compatibility with `dplyr::pull`

+
+
# S3 method for disk.frame
+pull(.data, var = -1, name = NULL, ...)
+
+
+

Arguments

+
.data
+

The disk.frame

+
var
+

can be an positive or negative integer or a character/string. See dplyr::pull documentation

+
name
+

See dplyr::pull documentation

+
...
+

Not used, kept for compatibility with `dplyr::pull`

+
+
- - - + + diff --git a/docs/reference/rbindlist.disk.frame.html b/docs/reference/rbindlist.disk.frame.html index 9226c689..081dadec 100644 --- a/docs/reference/rbindlist.disk.frame.html +++ b/docs/reference/rbindlist.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -rbindlist disk.frames together — rbindlist.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -rbindlist disk.frames together — rbindlist.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,83 +95,70 @@

rbindlist disk.frames together

rbindlist disk.frames together

-
rbindlist.disk.frame(
-  df_list,
-  outdir = tempfile(fileext = ".df"),
-  by_chunk_id = TRUE,
-  parallel = TRUE,
-  compress = 50,
-  overwrite = TRUE,
-  .progress = TRUE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df_list

A list of disk.frames

outdir

Output directory of the row-bound disk.frames

by_chunk_id

If TRUE then only the chunks with the same chunk IDs will be bound

parallel

if TRUE then bind multiple disk.frame simultaneously, Defaults to TRUE

compress

0-100, 100 being the highest compression rate.

overwrite

overwrite the output directory

.progress

A logical, for whether or not to print a progress bar for multiprocess, multisession, and multicore plans. From furrr

- - -

Examples

-
cars.df = as.disk.frame(cars) - -# row-bind two disk.frames -cars2.df = rbindlist.disk.frame(list(cars.df, cars.df))
#> Appending disk.frames:
-# clean up cars.df -delete(cars.df) -delete(cars2.df)
+
+
rbindlist.disk.frame(
+  df_list,
+  outdir = tempfile(fileext = ".df"),
+  by_chunk_id = TRUE,
+  parallel = TRUE,
+  compress = 50,
+  overwrite = TRUE,
+  .progress = TRUE
+)
+
+ +
+

Arguments

+
df_list
+

A list of disk.frames

+
outdir
+

Output directory of the row-bound disk.frames

+
by_chunk_id
+

If TRUE then only the chunks with the same chunk IDs will be bound

+
parallel
+

if TRUE then bind multiple disk.frame simultaneously, Defaults to TRUE

+
compress
+

0-100, 100 being the highest compression rate.

+
overwrite
+

overwrite the output directory

+
.progress
+

A logical, for whether or not to print a progress bar for multiprocess, multisession, and multicore plans. From furrr

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# row-bind two disk.frames
+cars2.df = rbindlist.disk.frame(list(cars.df, cars.df))
+#> Appending disk.frames: 
+
+# clean up cars.df
+delete(cars.df)
+delete(cars2.df)
+
+
+
- - - + + diff --git a/docs/reference/rechunk.html b/docs/reference/rechunk.html index 2abbba00..1ad617e3 100644 --- a/docs/reference/rechunk.html +++ b/docs/reference/rechunk.html @@ -1,67 +1,12 @@ - - - - - - - -Increase or decrease the number of chunks in the disk.frame — rechunk • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Increase or decrease the number of chunks in the disk.frame — rechunk • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,97 +95,88 @@

Increase or decrease the number of chunks in the disk.frame

Increase or decrease the number of chunks in the disk.frame

-
rechunk(
-  df,
-  nchunks,
-  outdir = attr(df, "path", exact = TRUE),
-  shardby = NULL,
-  overwrite = TRUE,
-  shardby_function = "hash",
-  sort_splits = NULL,
-  desc_vars = NULL
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

the disk.frame to rechunk

nchunks

number of chunks

outdir

the output directory

shardby

the shardkeys

overwrite

overwrite the output directory

shardby_function

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

sort_splits

for the "sort" shardby function, a dataframe with the split values.

desc_vars

for the "sort" shardby function, the variables to sort descending.

- - -

Examples

-
# create a disk.frame with 2 chunks in tempdir() -cars.df = as.disk.frame(cars, nchunks = 2) +
+
rechunk(
+  df,
+  nchunks,
+  outdir = attr(df, "path", exact = TRUE),
+  shardby = NULL,
+  overwrite = TRUE,
+  shardby_function = "hash",
+  sort_splits = NULL,
+  desc_vars = NULL
+)
+
-# re-chunking cars.df to 3 chunks, done "in-place" to the same folder as cars.df -rechunk(cars.df, 3)
#> files have been backed up to temporary dir C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\back_up_tmp_dir187c185718b5. You can recover there files until you restart your R session
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\file187c36421ee.df" -#> nchunks: 3 -#> nrow (at source): 50 -#> ncol (at source): 2 -#> nrow (post operations): ??? -#> ncol (post operations): ???
-new_path = tempfile(fileext = ".df") -# re-chunking cars.df to 4 chunks, shard by speed, and done "out-of-place" to a new directory -cars2.df = rechunk(cars.df, 4, outdir=new_path, shardby = "speed")
#> Hashing...
#> Hashing...
#> Hashing...
#> Appending disk.frames:
-# clean up cars.df -delete(cars.df) -delete(cars2.df)
+
+

Arguments

+
df
+

the disk.frame to rechunk

+
nchunks
+

number of chunks

+
outdir
+

the output directory

+
shardby
+

the shardkeys

+
overwrite
+

overwrite the output directory

+
shardby_function
+

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

+
sort_splits
+

for the "sort" shardby function, a dataframe with the split values.

+
desc_vars
+

for the "sort" shardby function, the variables to sort descending.

+
+ +
+

Examples

+
# create a disk.frame with 2 chunks in tempdir()
+cars.df = as.disk.frame(cars, nchunks = 2)
+
+# re-chunking cars.df to 3 chunks, done "in-place" to the same folder as cars.df
+rechunk(cars.df, 3)
+#> files have been backed up to temporary dir C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\back_up_tmp_dir56f4356b56cb. You can recover there files until you restart your R session
+#> path: "C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\file56f4c8a34c9.df"
+#> nchunks: 3
+#> nrow (at source): 50
+#> ncol (at source): 2
+#> nrow (post operations): ???
+#> ncol (post operations): ???
+
+new_path = tempfile(fileext = ".df")
+# re-chunking cars.df to 4 chunks, shard by speed, and done "out-of-place" to a new directory
+cars2.df = rechunk(cars.df, 4, outdir=new_path, shardby = "speed")
+#> Hashing...
+#> Hashing...
+#> Hashing...
+#> Appending disk.frames: 
+
+# clean up cars.df
+delete(cars.df)
+delete(cars2.df)
+
+
+
- - - + + diff --git a/docs/reference/recommend_nchunks.html b/docs/reference/recommend_nchunks.html index f0c9e401..e549d81c 100644 --- a/docs/reference/recommend_nchunks.html +++ b/docs/reference/recommend_nchunks.html @@ -1,68 +1,13 @@ - - - - - - - -Recommend number of chunks based on input size — recommend_nchunks • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Recommend number of chunks based on input size — recommend_nchunks • disk.frame + + - - - - -
-
- -
- -
+
@@ -164,75 +97,67 @@

Recommend number of chunks based on input size

into. It can accept filesizes in bytes (as integer) or a data.frame

-
recommend_nchunks(
-  df,
-  type = "csv",
-  minchunks = data.table::getDTthreads(),
-  conservatism = 8,
-  ram_size = df_ram_size()
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - -
df

a disk.frame or the file size in bytes of a CSV file holding the -data

type

only = "csv" is supported. It indicates the file type -corresponding to file size `df`

minchunks

the minimum number of chunks. Defaults to the number of CPU -cores (without hyper-threading)

conservatism

a multiplier to the recommended number of chunks. The +

+
recommend_nchunks(
+  df,
+  type = "csv",
+  minchunks = data.table::getDTthreads(),
+  conservatism = 8,
+  ram_size = df_ram_size()
+)
+
+ +
+

Arguments

+
df
+

a disk.frame or the file size in bytes of a CSV file holding the +data

+
type
+

only = "csv" is supported. It indicates the file type +corresponding to file size `df`

+
minchunks
+

the minimum number of chunks. Defaults to the number of CPU +cores (without hyper-threading)

+
conservatism
+

a multiplier to the recommended number of chunks. The more chunks the smaller the chunk size and more likely that each chunk can -fit into RAM

ram_size

The amount of RAM available which is usually computed. Except on RStudio with R3.6+

- - -

Examples

-
# recommend nchunks based on data.frame -recommend_nchunks(cars)
#> [1] 6
-# recommend nchunks based on file size ONLY CSV is implemented at the moment -recommend_nchunks(1024^3)
#> [1] 6
+fit into RAM

+
ram_size
+

The amount of RAM available which is usually computed. Except on RStudio with R3.6+

+
+ +
+

Examples

+
# recommend nchunks based on data.frame
+recommend_nchunks(cars)
+#> [1] 6
+
+# recommend nchunks based on file size ONLY CSV is implemented at the moment
+recommend_nchunks(1024^3)
+#> [1] 6
+
+
+
- - - + + diff --git a/docs/reference/remove_chunk.html b/docs/reference/remove_chunk.html index 00048845..974ae319 100644 --- a/docs/reference/remove_chunk.html +++ b/docs/reference/remove_chunk.html @@ -1,67 +1,12 @@ - - - - - - - -Removes a chunk from the disk.frame — remove_chunk • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Removes a chunk from the disk.frame — remove_chunk • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,78 +95,83 @@

Removes a chunk from the disk.frame

Removes a chunk from the disk.frame

-
remove_chunk(df, chunk_id, full.names = FALSE)
- -

Arguments

- - - - - - - - - - - - - - -
df

a disk.frame

chunk_id

the chunk ID of the chunk to remove. If it's a number then return number.fst

full.names

TRUE or FALSE. Defaults to FALSE. If true then chunk_id is the full path to the chunk otherwise it's the relative path

- - -

Examples

-
# TODO add these to tests -cars.df = as.disk.frame(cars, nchunks = 4) - -# removes 3rd chunk -remove_chunk(cars.df, 3)
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\file187c1fad1470.df" -#> nchunks: 3 -#> nrow (at source): 37 -#> ncol (at source): 2 -#> nrow (post operations): ??? -#> ncol (post operations): ???
nchunks(cars.df) # 3
#> [1] 3
-# removes 4th chunk -remove_chunk(cars.df, "4.fst")
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\file187c1fad1470.df" -#> nchunks: 2 -#> nrow (at source): 26 -#> ncol (at source): 2 -#> nrow (post operations): ??? -#> ncol (post operations): ???
nchunks(cars.df) # 3
#> [1] 2
-# removes 2nd chunk -remove_chunk(cars.df, file.path(attr(cars.df, "path", exact=TRUE), "2.fst"), full.names = TRUE)
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\file187c1fad1470.df" -#> nchunks: 1 -#> nrow (at source): 13 -#> ncol (at source): 2 -#> nrow (post operations): ??? -#> ncol (post operations): ???
nchunks(cars.df) # 1
#> [1] 1
-# clean up cars.df -delete(cars.df)
+
+
remove_chunk(df, chunk_id, full.names = FALSE)
+
+ +
+

Arguments

+
df
+

a disk.frame

+
chunk_id
+

the chunk ID of the chunk to remove. If it's a number, then the chunk file number.fst is removed

+
full.names
+

TRUE or FALSE. Defaults to FALSE. If true then chunk_id is the full path to the chunk otherwise it's the relative path

+
+ +
+

Examples

+
# TODO add these to tests
+cars.df = as.disk.frame(cars, nchunks = 4)
+
+# removes 3rd chunk
+remove_chunk(cars.df, 3)
+#> path: "C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\file56f45e4b14bd.df"
+#> nchunks: 3
+#> nrow (at source): 37
+#> ncol (at source): 2
+#> nrow (post operations): ???
+#> ncol (post operations): ???
+nchunks(cars.df) # 3
+#> [1] 3
+
+# removes 4th chunk
+remove_chunk(cars.df, "4.fst")
+#> path: "C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\file56f45e4b14bd.df"
+#> nchunks: 2
+#> nrow (at source): 26
+#> ncol (at source): 2
+#> nrow (post operations): ???
+#> ncol (post operations): ???
+nchunks(cars.df) # 2
+#> [1] 2
+
+# removes 2nd chunk
+remove_chunk(cars.df, file.path(attr(cars.df, "path", exact=TRUE), "2.fst"), full.names = TRUE)
+#> path: "C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\file56f45e4b14bd.df"
+#> nchunks: 1
+#> nrow (at source): 13
+#> ncol (at source): 2
+#> nrow (post operations): ???
+#> ncol (post operations): ???
+nchunks(cars.df) # 1
+#> [1] 1
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/sample.html b/docs/reference/sample.html index 161546d8..719d4244 100644 --- a/docs/reference/sample.html +++ b/docs/reference/sample.html @@ -1,67 +1,12 @@ - - - - - - - -Sample n rows from a disk.frame — sample_frac.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Sample n rows from a disk.frame — sample_frac.disk.frame • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,97 +95,87 @@

Sample n rows from a disk.frame

Sample n rows from a disk.frame

-
# S3 method for disk.frame
-sample_frac(tbl, size = 1, replace = FALSE, weight = NULL, .env = NULL, ...)
+
+
# S3 method for disk.frame
+sample_frac(tbl, size = 1, replace = FALSE, weight = NULL, .env = NULL, ...)
+
-

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - -
tbl

A data.frame.

size

<tidy-select> -For sample_n(), the number of rows to select. -For sample_frac(), the fraction of rows to select. -If tbl is grouped, size applies to each group.

replace

Sample with or without replacement?

weight

<tidy-select> Sampling weights. +

+

Arguments

+
tbl
+

A data.frame.

+
size
+

<tidy-select> +For sample_n(), the number of rows to select. +For sample_frac(), the fraction of rows to select. +If tbl is grouped, size applies to each group.

+
replace
+

Sample with or without replacement?

+
weight
+

<tidy-select> Sampling weights. This must evaluate to a vector of non-negative numbers the same length as -the input. Weights are automatically standardised to sum to 1.

.env

DEPRECATED.

...

ignored

- - -

Examples

-
cars.df = as.disk.frame(cars) - -collect(sample_frac(cars.df, 0.5))
#> speed dist -#> 1 10 34 -#> 2 8 16 -#> 3 4 10 -#> 4 10 26 -#> 5 12 14 -#> 6 13 26 -#> 7 11 28 -#> 8 13 34 -#> 9 13 46 -#> 10 15 26 -#> 11 16 32 -#> 12 15 54 -#> 13 18 42 -#> 14 17 32 -#> 15 18 84 -#> 16 17 40 -#> 17 22 66 -#> 18 19 68 -#> 19 20 48 -#> 20 20 52 -#> 21 24 120 -#> 22 25 85
-# clean up cars.df -delete(cars.df)
+the input. Weights are automatically standardised to sum to 1.

+
.env
+

DEPRECATED.

+
...
+

ignored

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+collect(sample_frac(cars.df, 0.5))
+#>     speed dist
+#>  1:     7   22
+#>  2:     7    4
+#>  3:     9   10
+#>  4:    10   26
+#>  5:    13   34
+#>  6:    11   17
+#>  7:    12   20
+#>  8:    11   28
+#>  9:    14   26
+#> 10:    14   36
+#> 11:    15   26
+#> 12:    14   80
+#> 13:    18   84
+#> 14:    18   56
+#> 15:    18   76
+#> 16:    17   50
+#> 17:    20   56
+#> 18:    19   46
+#> 19:    19   68
+#> 20:    20   32
+#> 21:    25   85
+#> 22:    24   70
+#>     speed dist
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/setup_disk.frame.html b/docs/reference/setup_disk.frame.html index 2c8a7cda..4b1ee1c7 100644 --- a/docs/reference/setup_disk.frame.html +++ b/docs/reference/setup_disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -Set up disk.frame environment — setup_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Set up disk.frame environment — setup_disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,76 +95,71 @@

Set up disk.frame environment

Set up disk.frame environment

-
setup_disk.frame(
-  workers = data.table::getDTthreads(),
-  future_backend = future::multisession,
-  ...,
-  gui = FALSE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
workers

the number of workers (background R processes in the

future_backend

which future backend to use for parallelization

...

passed to `future::plan`

gui

Whether to use a Graphical User Interface (GUI) for selecting the options. Defaults to FALSE

- - -

Examples

-
if (interactive()) { - # setup disk.frame to use multiple workers these may use more than two - # cores, and is therefore not allowed on CRAN. Hence it's set to run only in - # interactive session - setup_disk.frame() - - # use a Shiny GUI to adjust settings - # only run in interactive() - setup_disk.frame(gui = TRUE) -} - -# set the number workers to 2 -setup_disk.frame(2)
#> The number of workers available for disk.frame is 2
-# if you do not wish to use multiple workers you can set it to sequential -setup_disk.frame(future_backend=future::sequential)
#> Warning: Ignored 2 unknown arguments: 'workers', 'gc'
#> The number of workers available for disk.frame is 1
+
+
setup_disk.frame(
+  workers = data.table::getDTthreads(),
+  future_backend = future::multisession,
+  ...,
+  gui = FALSE
+)
+
+ +
+

Arguments

+
workers
+

the number of workers (background R processes) to use

+
future_backend
+

which future backend to use for parallelization

+
...
+

passed to `future::plan`

+
gui
+

Whether to use a Graphical User Interface (GUI) for selecting the options. Defaults to FALSE

+
+ +
+

Examples

+
if (interactive()) {
+  # setup disk.frame to use multiple workers these may use more than two
+  # cores, and is therefore not allowed on CRAN. Hence it's set to run only in
+  # interactive session
+  setup_disk.frame()
+  
+  # use a Shiny GUI to adjust settings
+  # only run in interactive()
+  setup_disk.frame(gui = TRUE)
+}
+
+# set the number workers to 2
+setup_disk.frame(2)
+#> The number of workers available for disk.frame is 2
+
+# if you do not wish to use multiple workers you can set it to sequential
+setup_disk.frame(future_backend=future::sequential)
+#> Warning: Detected 1 unknown future arguments: 'workers'
+#> The number of workers available for disk.frame is 1
+
+
+
- - - + + diff --git a/docs/reference/shard.html b/docs/reference/shard.html index 13f9501d..eca41f84 100644 --- a/docs/reference/shard.html +++ b/docs/reference/shard.html @@ -1,68 +1,13 @@ - - - - - - - -Shard a data.frame/data.table or disk.frame into chunk and saves it into a disk.frame — shard • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Shard a data.frame/data.table or disk.frame into chunk and saves it into a disk.frame — shard • disk.frame - + + - - - -
-
- -
- -
+
@@ -164,93 +97,76 @@

Shard a data.frame/data.table or disk.frame into chunk and saves it into a d

`distribute` is an alias for `shard`

-
shard(
-  df,
-  shardby,
-  outdir = tempfile(fileext = ".df"),
-  ...,
-  nchunks = recommend_nchunks(df),
-  overwrite = FALSE,
-  shardby_function = "hash",
-  sort_splits = NULL,
-  desc_vars = NULL
-)
-
-distribute(...)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

A data.frame/data.table or disk.frame. If disk.frame, then rechunk(df, ...) is run

shardby

The column(s) to shard the data by.

outdir

The output directory of the disk.frame

...

not used

nchunks

The number of chunks

overwrite

If TRUE then the chunks are overwritten

shardby_function

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

sort_splits

If shardby_function is "sort", the split values for sharding

desc_vars

for the "sort" shardby function, the variables to sort descending.

- +
+
shard(
+  df,
+  shardby,
+  outdir = tempfile(fileext = ".df"),
+  ...,
+  nchunks = recommend_nchunks(df),
+  overwrite = FALSE,
+  shardby_function = "hash",
+  sort_splits = NULL,
+  desc_vars = NULL
+)
+
+distribute(...)
+
-

Examples

-
-# shard the cars data.frame by speed so that rows with the same speed are in the same chunk -iris.df = shard(iris, "Species")
#> Hashing...
-# clean up cars.df -delete(iris.df)
+
+

Arguments

+
df
+

A data.frame/data.table or disk.frame. If disk.frame, then rechunk(df, ...) is run

+
shardby
+

The column(s) to shard the data by.

+
outdir
+

The output directory of the disk.frame

+
...
+

not used

+
nchunks
+

The number of chunks

+
overwrite
+

If TRUE then the chunks are overwritten

+
shardby_function
+

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

+
sort_splits
+

If shardby_function is "sort", the split values for sharding

+
desc_vars
+

for the "sort" shardby function, the variables to sort descending.

+
+ +
+

Examples

+

+# shard the iris data.frame by Species so that rows with the same Species are in the same chunk
+iris.df = shard(iris, "Species")
+#> Hashing...
+
+# clean up iris.df
+delete(iris.df)
+
+
+
- - - + + diff --git a/docs/reference/shardkey.html b/docs/reference/shardkey.html index 4e99bbca..eeca73d7 100644 --- a/docs/reference/shardkey.html +++ b/docs/reference/shardkey.html @@ -1,67 +1,12 @@ - - - - - - - -Returns the shardkey (not implemented yet) — shardkey • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Returns the shardkey (not implemented yet) — shardkey • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,43 +95,37 @@

Returns the shardkey (not implemented yet)

Returns the shardkey (not implemented yet)

-
shardkey(df)
- -

Arguments

- - - - - - -
df

a disk.frame

+
+
shardkey(df)
+
+
+

Arguments

+
df
+

a disk.frame

+
+
- - - + + diff --git a/docs/reference/shardkey_equal.html b/docs/reference/shardkey_equal.html index 5c4e1ad8..e51669c5 100644 --- a/docs/reference/shardkey_equal.html +++ b/docs/reference/shardkey_equal.html @@ -1,67 +1,12 @@ - - - - - - - -Compare two disk.frame shardkeys — shardkey_equal • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Compare two disk.frame shardkeys — shardkey_equal • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,47 +95,39 @@

Compare two disk.frame shardkeys

Compare two disk.frame shardkeys

-
shardkey_equal(sk1, sk2)
- -

Arguments

- - - - - - - - - - -
sk1

shardkey1

sk2

shardkey2

+
+
shardkey_equal(sk1, sk2)
+
+
+

Arguments

+
sk1
+

shardkey1

+
sk2
+

shardkey2

+
+
- - - + + diff --git a/docs/reference/show_ceremony.html b/docs/reference/show_ceremony.html index 7481dc90..a4e1badc 100644 --- a/docs/reference/show_ceremony.html +++ b/docs/reference/show_ceremony.html @@ -1,67 +1,12 @@ - - - - - - - -Show the code to setup disk.frame — show_ceremony • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Show the code to setup disk.frame — show_ceremony • disk.frame - - + + - - -
-
- -
- -
+
@@ -162,41 +95,38 @@

Show the code to setup disk.frame

Show the code to setup disk.frame

-
show_ceremony()
+    
+
show_ceremony()
 
-ceremony_text()
+ceremony_text()
 
-show_boilerplate()
-
-insert_ceremony()
+show_boilerplate() +insert_ceremony()
+
+ - - - + + diff --git a/docs/reference/srckeep.html b/docs/reference/srckeep.html index fe997fbd..934352ba 100644 --- a/docs/reference/srckeep.html +++ b/docs/reference/srckeep.html @@ -1,67 +1,12 @@ - - - - - - - -Keep only the variables from the input listed in selections — srckeep • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Keep only the variables from the input listed in selections — srckeep • disk.frame - + + - - - -
-
- -
- -
+
@@ -162,115 +95,108 @@

Keep only the variables from the input listed in selections

Keep only the variables from the input listed in selections

-
srckeep(diskf, selections, ...)
-
-srckeepchunks(diskf, chunks, ...)
- -

Arguments

- - - - - - - - - - - - - - - - - - -
diskf

a disk.frame

selections

The list of variables to keep from the input source

...

not yet used

chunks

The chunks to load

- +
+
srckeep(diskf, selections, ...)
 
-    

Examples

-
cars.df = as.disk.frame(cars) +srckeepchunks(diskf, chunks, ...)
+
-# when loading cars's chunks into RAM, load only the column speed -collect(srckeep(cars.df, "speed"))
#> speed -#> 1: 4 -#> 2: 4 -#> 3: 7 -#> 4: 7 -#> 5: 8 -#> 6: 9 -#> 7: 10 -#> 8: 10 -#> 9: 10 -#> 10: 11 -#> 11: 11 -#> 12: 12 -#> 13: 12 -#> 14: 12 -#> 15: 12 -#> 16: 13 -#> 17: 13 -#> 18: 13 -#> 19: 13 -#> 20: 14 -#> 21: 14 -#> 22: 14 -#> 23: 14 -#> 24: 15 -#> 25: 15 -#> 26: 15 -#> 27: 16 -#> 28: 16 -#> 29: 17 -#> 30: 17 -#> 31: 17 -#> 32: 18 -#> 33: 18 -#> 34: 18 -#> 35: 18 -#> 36: 19 -#> 37: 19 -#> 38: 19 -#> 39: 20 -#> 40: 20 -#> 41: 20 -#> 42: 20 -#> 43: 20 -#> 44: 22 -#> 45: 23 -#> 46: 24 -#> 47: 24 -#> 48: 24 -#> 49: 24 -#> 50: 25 -#> speed
-# clean up cars.df -delete(cars.df)
+
+

Arguments

+
diskf
+

a disk.frame

+
selections
+

The list of variables to keep from the input source

+
...
+

not yet used

+
chunks
+

The chunks to load

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# when loading cars's chunks into RAM, load only the column speed
+collect(srckeep(cars.df, "speed"))
+#>     speed
+#>  1:     4
+#>  2:     4
+#>  3:     7
+#>  4:     7
+#>  5:     8
+#>  6:     9
+#>  7:    10
+#>  8:    10
+#>  9:    10
+#> 10:    11
+#> 11:    11
+#> 12:    12
+#> 13:    12
+#> 14:    12
+#> 15:    12
+#> 16:    13
+#> 17:    13
+#> 18:    13
+#> 19:    13
+#> 20:    14
+#> 21:    14
+#> 22:    14
+#> 23:    14
+#> 24:    15
+#> 25:    15
+#> 26:    15
+#> 27:    16
+#> 28:    16
+#> 29:    17
+#> 30:    17
+#> 31:    17
+#> 32:    18
+#> 33:    18
+#> 34:    18
+#> 35:    18
+#> 36:    19
+#> 37:    19
+#> 38:    19
+#> 39:    20
+#> 40:    20
+#> 41:    20
+#> 42:    20
+#> 43:    20
+#> 44:    22
+#> 45:    23
+#> 46:    24
+#> 47:    24
+#> 48:    24
+#> 49:    24
+#> 50:    25
+#>     speed
+
+# clean up cars.df
+delete(cars.df)
+
+
+
- - - + + diff --git a/docs/reference/sub-.disk.frame.html b/docs/reference/sub-.disk.frame.html index 961cbbe9..b3ecb1b5 100644 --- a/docs/reference/sub-.disk.frame.html +++ b/docs/reference/sub-.disk.frame.html @@ -1,67 +1,12 @@ - - - - - - - -[ interface for disk.frame using fst backend — [.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -[ interface for disk.frame using fst backend — [.disk.frame • disk.frame + + - - - - -
-
- -
- -
+
@@ -162,7 +95,8 @@

[ interface for disk.frame using fst backend

[ interface for disk.frame using fst backend

-
# S3 method for disk.frame
+    
+
# S3 method for disk.frame
 [(
   df,
   ...,
@@ -171,73 +105,59 @@ 

[ interface for disk.frame using fst backend

use.names = TRUE, fill = FALSE, idcol = NULL -)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

a disk.frame

...

same as data.table

keep

the columns to srckeep

rbind

Whether to rbind the chunks. Defaults to TRUE

use.names

Same as in data.table::rbindlist

fill

Same as in data.table::rbindlist

idcol

Same as in data.table::rbindlist

- - -

Examples

-
cars.df = as.disk.frame(cars) -speed_limit = 50 -cars.df[speed < speed_limit ,.N, cut(dist, pretty(dist))]
#> Error in .checkTypos(e, names_x): Object 'speed_limit' not found amongst speed, dist
-# clean up -delete(cars.df)
+)
+
+ +
+

Arguments

+
df
+

a disk.frame

+
...
+

same as data.table

+
keep
+

the columns to srckeep

+
rbind
+

Whether to rbind the chunks. Defaults to TRUE

+
use.names
+

Same as in data.table::rbindlist

+
fill
+

Same as in data.table::rbindlist

+
idcol
+

Same as in data.table::rbindlist

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+speed_limit = 50
+cars.df[speed < speed_limit ,.N, cut(dist, pretty(dist))]
+#> Error in .checkTypos(e, names_x): Object 'speed_limit' not found amongst speed, dist
+
+# clean up
+delete(cars.df)
+
+
+ - - - + + diff --git a/docs/reference/tbl_vars.disk.frame.html b/docs/reference/tbl_vars.disk.frame.html index f7d0febf..d61fa7a6 100644 --- a/docs/reference/tbl_vars.disk.frame.html +++ b/docs/reference/tbl_vars.disk.frame.html @@ -1,68 +1,13 @@ - - - - - - - -Column names for RStudio auto-complete — tbl_vars.disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Column names for RStudio auto-complete — tbl_vars.disk.frame • disk.frame - - + + - - -
-
- -
- -
+
@@ -164,47 +97,41 @@

Column names for RStudio auto-complete

names

-
# S3 method for disk.frame
-tbl_vars(x)
+    
+
# S3 method for disk.frame
+tbl_vars(x)
 
-# S3 method for disk.frame
-group_vars(x)
- -

Arguments

- - - - - - -
x

a disk.frame

+# S3 method for disk.frame +group_vars(x)
+
+
+

Arguments

+
x
+

a disk.frame

+
+ - - - + + diff --git a/docs/reference/write_disk.frame.html b/docs/reference/write_disk.frame.html index b8e57f50..5f3f9fdb 100644 --- a/docs/reference/write_disk.frame.html +++ b/docs/reference/write_disk.frame.html @@ -1,68 +1,13 @@ - - - - - - - -Write disk.frame to disk — write_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -Write disk.frame to disk — write_disk.frame • disk.frame - + + - - - -
-
- -
- -
+
@@ -164,108 +97,89 @@

Write disk.frame to disk

then using the as.disk.frame function is recommended for most cases

-
write_disk.frame(
-  df,
-  outdir = tempfile(fileext = ".df"),
-  nchunks = ifelse("disk.frame" %in% class(df), nchunks.disk.frame(df),
-    recommend_nchunks(df)),
-  overwrite = FALSE,
-  shardby = NULL,
-  compress = 50,
-  shardby_function = "hash",
-  sort_splits = NULL,
-  desc_vars = NULL,
-  ...
-)
-
-output_disk.frame(...)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
df

a disk.frame

outdir

output directory for the disk.frame

nchunks

number of chunks

overwrite

overwrite output directory

shardby

the columns to shard by

compress

compression ratio for fst files

shardby_function

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

sort_splits

for the "sort" shardby function, a dataframe with the split values.

desc_vars

for the "sort" shardby function, the variables to sort descending.

...

passed to cmap.disk.frame

- - -

Examples

-
cars.df = as.disk.frame(cars) +
+
write_disk.frame(
+  df,
+  outdir = tempfile(fileext = ".df"),
+  nchunks = ifelse("disk.frame" %in% class(df), nchunks.disk.frame(df),
+    recommend_nchunks(df)),
+  overwrite = FALSE,
+  shardby = NULL,
+  compress = 50,
+  shardby_function = "hash",
+  sort_splits = NULL,
+  desc_vars = NULL,
+  ...
+)
+
+output_disk.frame(...)
+
-# write out a lazy disk.frame to disk -cars2.df = write_disk.frame(cmap(cars.df, ~.x[1,]), overwrite = TRUE) -collect(cars2.df)
#> speed dist -#> 1: 4 2 -#> 2: 11 17 -#> 3: 13 46 -#> 4: 16 40 -#> 5: 19 46 -#> 6: 24 70
-# clean up cars.df -delete(cars.df) -delete(cars2.df)
+
+

Arguments

+
df
+

a disk.frame

+
outdir
+

output directory for the disk.frame

+
nchunks
+

number of chunks

+
overwrite
+

overwrite output directory

+
shardby
+

the columns to shard by

+
compress
+

compression ratio for fst files

+
shardby_function
+

splitting of chunks: "hash" for hash function or "sort" for semi-sorted chunks

+
sort_splits
+

for the "sort" shardby function, a dataframe with the split values.

+
desc_vars
+

for the "sort" shardby function, the variables to sort descending.

+
...
+

passed to cmap.disk.frame

+
+ +
+

Examples

+
cars.df = as.disk.frame(cars)
+
+# write out a lazy disk.frame to disk
+cars2.df = write_disk.frame(cmap(cars.df, ~.x[1,]), overwrite = TRUE)
+collect(cars2.df)
+#>    speed dist
+#> 1:     4    2
+#> 2:    11   17
+#> 3:    13   46
+#> 4:    16   40
+#> 5:    19   46
+#> 6:    24   70
+
+# clean up cars.df
+delete(cars.df)
+delete(cars2.df)
+
+
+
- - - + + diff --git a/docs/reference/zip_to_disk.frame.html b/docs/reference/zip_to_disk.frame.html index 862dab16..9188f8ac 100644 --- a/docs/reference/zip_to_disk.frame.html +++ b/docs/reference/zip_to_disk.frame.html @@ -1,70 +1,15 @@ - - - - - - - -`zip_to_disk.frame` is used to read and convert every CSV file within the zip -file to disk.frame format — zip_to_disk.frame • disk.frame - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -`zip_to_disk.frame` is used to read and convert every CSV file within the zip +file to disk.frame format — zip_to_disk.frame • disk.frame - - - - + + -
-
- -
- -
+
@@ -167,93 +100,84 @@

`zip_to_disk.frame` is used to read and convert every CSV file within the zi file to disk.frame format

-
zip_to_disk.frame(
-  zipfile,
-  outdir,
-  ...,
-  validation.check = FALSE,
-  overwrite = TRUE
-)
- -

Arguments

- - - - - - - - - - - - - - - - - - - - - - -
zipfile

The zipfile

outdir

The output directory for disk.frame

...

passed to fread

validation.check

should the function perform a check at the end to check for validity of output. It can detect issues with conversion

overwrite

overwrite output directory

- -

Value

+
+
zip_to_disk.frame(
+  zipfile,
+  outdir,
+  ...,
+  validation.check = FALSE,
+  overwrite = TRUE
+)
+
+
+

Arguments

+
zipfile
+

The zipfile

+
outdir
+

The output directory for disk.frame

+
...
+

passed to fread

+
validation.check
+

should the function perform a check at the end to check for validity of output. It can detect issues with conversion

+
overwrite
+

overwrite output directory

+
+
+

Value

a list of disk.frame

-

See also

- -

Other ingesting data: -csv_to_disk.frame()

- -

Examples

-
# create a zip file containing a csv -csvfile = tempfile(fileext = ".csv") -write.csv(cars, csvfile) -zipfile = tempfile(fileext = ".zip") -zip(zipfile, csvfile) - -# read every file and convert it to a disk.frame -zip.df = zip_to_disk.frame(zipfile, tempfile(fileext = ".df")) +
+
+

See also

+

Other ingesting data: +csv_to_disk.frame()

+
-# there is only one csv file so it return a list of one disk.frame -zip.df[[1]]
#> path: "C:\Users\RTX2080\AppData\Local\Temp\RtmpInritK\file187c1d9666ec.df/Users/RTX2080/AppData/Local/Temp/RtmpInritK/file187c725c4b4.csv" -#> nchunks: 6 -#> nrow (at source): 50 -#> ncol (at source): 3 -#> nrow (post operations): ??? -#> ncol (post operations): ???
-# clean up -unlink(csvfile) -unlink(zipfile) -delete(zip.df[[1]])
+
+

Examples

+
# create a zip file containing a csv
+csvfile = tempfile(fileext = ".csv")
+write.csv(cars, csvfile)
+zipfile = tempfile(fileext = ".zip")
+zip(zipfile, csvfile)
+#> Warning: '"zip"' not found
+
+# read every file and convert it to a disk.frame
+zip.df = zip_to_disk.frame(zipfile, tempfile(fileext = ".df"))
+#> Error in unzip(zipfile, list = TRUE): zip file 'C:\Users\RTX2080\AppData\Local\Temp\Rtmp2rQjw5\file56f44b886b42.zip' cannot be opened
+
+# there is only one csv file so it return a list of one disk.frame
+zip.df[[1]]
+#> Error in eval(expr, envir, enclos): object 'zip.df' not found
+
+# clean up
+unlink(csvfile)
+unlink(zipfile)
+delete(zip.df[[1]])
+#> Error in "disk.frame" %in% class(df): object 'zip.df' not found
+
+
+
- - - + + diff --git a/docs/sitemap.xml b/docs/sitemap.xml new file mode 100644 index 00000000..4aa93c2a --- /dev/null +++ b/docs/sitemap.xml @@ -0,0 +1,294 @@ + + + + /02-intro-disk-frame.html + + + /404.html + + + /articles/01-intro-disk-frame.html + + + /articles/01-intro.html + + + /articles/02-common-questions.html + + + /articles/02-intro-disk-frame.html + + + /articles/03-concepts.html + + + /articles/03_concepts.html + + + /articles/04-ingesting-data.html + + + /articles/04_ingesting-data.html + + + /articles/05-data-table-syntax.html + + + /articles/06-vs-dask-juliadb.html + + + /articles/07-glm.html + + + /articles/08-more-epic.html + + + /articles/09-convenience-features.html + + + /articles/10-group-by.html + + + /articles/11-custom-group-by.html + + + /articles/88-trouble-shooting.html + + + /articles/common-questions.html + + + /articles/concepts.html + + + /articles/convenience-features.html + + + /articles/custom-group-by.html + + + /articles/data-table-syntax.html + + + /articles/glm.html + + + /articles/group-by.html + + + /articles/index.html + + + /articles/ingesting-data.html + + + /articles/intro-disk-frame.html + + + /articles/intro.html + + + /articles/more-epic.html + + + /articles/vs-dask-juliadb-2.html + + + /articles/vs-dask-juliadb.html + + + /authors.html + + + /index.html + + + /LICENSE-text.html + + + /news/index.html + + + /reference/add_chunk.html + + + /reference/as.data.frame.disk.frame.html + + + /reference/as.data.table.disk.frame.html + + + /reference/as.disk.frame.html + + + /reference/bloomfilter.html + + + /reference/chunk_group_by.html + + + /reference/cmap.html + + + /reference/cmap2.html + + + /reference/collect.html + + + /reference/colnames.html + + + /reference/compute.disk.frame.html + + + /reference/create_chunk_mapper.html + + + /reference/create_dplyr_mapper.html + + + /reference/csv_to_disk.frame.html + + + /reference/delete.html + + + /reference/dfglm.html + + + /reference/df_ram_size.html + + + 
/reference/disk.frame.html + + + /reference/dplyr_verbs.html + + + /reference/evalparseglue.html + + + /reference/foverlaps.disk.frame.html + + + /reference/gen_datatable_synthetic.html + + + /reference/get_chunk.html + + + /reference/get_chunk_ids.html + + + /reference/groups.disk.frame.html + + + /reference/group_by.html + + + /reference/hard_arrange.html + + + /reference/hard_group_by.html + + + /reference/head_tail.html + + + /reference/index.html + + + /reference/is_disk.frame.html + + + /reference/join.html + + + /reference/make_glm_streaming_fn.html + + + /reference/map.html + + + /reference/map2.html + + + /reference/mean.chunk_agg.disk.frame.html + + + /reference/mean.collected_agg.disk.frame.html + + + /reference/merge.disk.frame.html + + + /reference/move_to.html + + + /reference/nchunks.html + + + /reference/ncol_nrow.html + + + /reference/one-stage-group-by-verbs.html + + + /reference/overwrite_check.html + + + /reference/print.disk.frame.html + + + /reference/pull.disk.frame.html + + + /reference/rbindlist.disk.frame.html + + + /reference/rechunk.html + + + /reference/recommend_nchunks.html + + + /reference/remove_chunk.html + + + /reference/sample.html + + + /reference/setup_disk.frame.html + + + /reference/shard.html + + + /reference/shardkey.html + + + /reference/shardkey_equal.html + + + /reference/show_ceremony.html + + + /reference/srckeep.html + + + /reference/sub-.disk.frame.html + + + /reference/summarise.grouped_disk.frame.html + + + /reference/tbl_vars.disk.frame.html + + + /reference/write_disk.frame.html + + + /reference/zip_to_disk.frame.html + + diff --git a/man/dplyr_verbs.Rd b/man/dplyr_verbs.Rd index d3930c57..340e6958 100644 --- a/man/dplyr_verbs.Rd +++ b/man/dplyr_verbs.Rd @@ -8,7 +8,6 @@ \alias{transmute.disk.frame} \alias{arrange.disk.frame} \alias{chunk_arrange} -\alias{add_count.disk.frame} \alias{add_tally.disk.frame} \alias{do.disk.frame} \alias{distinct.disk.frame} @@ -30,8 +29,6 @@ chunk_arrange(.data, ...) 
-add_count.disk.frame(.data, ...) - add_tally.disk.frame(.data, ...) \method{do}{disk.frame}(.data, ...) diff --git a/presentation/rstudio conf 2021/1min video script b/presentation/rstudio conf 2021/1min video script new file mode 100644 index 00000000..53337167 --- /dev/null +++ b/presentation/rstudio conf 2021/1min video script @@ -0,0 +1,11 @@ +Hi my name is ZedJ and I am a Data Scientist local to Melbourne. I am a keen contributor to open source data science projects, one of which I want to talk about at rstudio:conf 2021. That project is {disk.frame} - a larger-than-RAM data manipulation package. + +R needs to load the data in its entirety into RAM. However, RAM is a precious resource and often do run out. + +{disk.frame} solves this issue by providing a 100%-R framework to manipulate data on disk. A modern laptop with {disk.frame} can comfortably handle 100GB's of data. + +Also, {disk.frame} uses {dplyr} verbs to manipulate data so useRs will find it very easy to pick up. + +Finally, because {disk.frame} is 100%-R, you can use any R package with it at no extra cost unlike Spark. + +The talk I propose will introduce {disk.frame} to users with the needs to manipulate large amounts of data with minimal setup. They will find {disk.frame} very familiar, as {disk.frame} uses {dplyr} verbs directly;. Some users rely on DBMS (e.g. PostgresSQL), Spark, or SAS to manage their large datasets. They will find lots of benefits in switching to {disk.frame}, which will allow them to keep their workflow in R for as long as possible. Because {disk.frame} can run R functions natively, they will find that {disk.frame} allows them to many R packages directly with {disk.frame}. 
diff --git a/presentation/rstudio conf 2021/Abstract proposal.md b/presentation/rstudio conf 2021/Abstract proposal.md new file mode 100644 index 00000000..e7406d3f --- /dev/null +++ b/presentation/rstudio conf 2021/Abstract proposal.md @@ -0,0 +1,5 @@ +Learn how to handle 100GBs of data with ease using {disk.frame} - the larger-than-RAM-data manipulation package. + +R loads data in its entirety into RAM. However, RAM is a precious resource and often do run out. That's why most R user would have run into the "cannot allocate vector of size xxB." error at some point. + +However, the need to handle larger-than-RAM data doesn't go away just because RAM isn't large enough. So many useRs turn to big data tools like Spark for the task. In this talk, I will make the case that {disk.frame} is sufficient and often preferable for manipulating larger-than-RAM data that fit on disk. I will show how you can apply familiar {dplyr}-verbs to manipulate larger-than-RAM data with {disk.frame}. \ No newline at end of file diff --git a/presentation/twin cities/.gitignore b/presentation/twin cities/.gitignore new file mode 100644 index 00000000..26416673 --- /dev/null +++ b/presentation/twin cities/.gitignore @@ -0,0 +1 @@ +*.mp4 diff --git a/tests/testthat.R b/tests/testthat.R deleted file mode 100644 index 6681ff05..00000000 --- a/tests/testthat.R +++ /dev/null @@ -1,4 +0,0 @@ -library(testthat) -library(disk.frame) - -test_check("disk.frame") diff --git a/tests/testthat/test-Rcpp.R b/tests/testthat/test-Rcpp.R deleted file mode 100644 index d4144ca9..00000000 --- a/tests/testthat/test-Rcpp.R +++ /dev/null @@ -1,6 +0,0 @@ -context("test-RcppExprts") - - -test_that("testing Rccpexports nothing here", { - expect_equal(2L, 2L) -}) \ No newline at end of file diff --git a/tests/testthat/test-add-chunk.r b/tests/testthat/test-add-chunk.r deleted file mode 100644 index 07855ac3..00000000 --- a/tests/testthat/test-add-chunk.r +++ /dev/null @@ -1,41 +0,0 @@ -context("test-add-chunk") - 
-setup({ - setup_disk.frame(workers = 2) -}) - -test_that("testing add chunk without naming chunk_id", { - a = data.frame(a = 1:100, b = 1:100) - - a1 = as.disk.frame(a, overwrite = TRUE) - - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - add_chunk(a1, b) - expect_equal(nrow(a1), 200) - - add_chunk(a1, d) - expect_equal(nrow(a1), 250) - - delete(a1) -}) - -test_that("testing add chunk by naming chunk_id", { - a = data.frame(a = 1:100, b = 1:100) - - a1 = as.disk.frame(a, overwrite = TRUE) - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - add_chunk(a1, b, chunk_id = nchunks(a1)+2) - expect_equal(nrow(a1), 200) - - add_chunk(a1, d, chunk_id = nchunks(a1)+2) - expect_equal(nrow(a1), 250) - - delete(a1) -}) - -teardown({ -}) \ No newline at end of file diff --git a/tests/testthat/test-anti_join.R b/tests/testthat/test-anti_join.R deleted file mode 100644 index 348ebaf2..00000000 --- a/tests/testthat/test-anti_join.R +++ /dev/null @@ -1,75 +0,0 @@ -context("test-anti_join") - -setup({ - setup_disk.frame(workers = 2) - - a = data.frame(a = 1:100, b = 1:100) - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_aj.df"), nchunks = 4, overwrite = TRUE) - as.disk.frame(b, file.path(tempdir(), "tmp_b_aj.df"), nchunks = 5, overwrite = TRUE) - as.disk.frame(d, file.path(tempdir(), "tmp_d_aj.df"), overwrite = TRUE) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_aj2.df"), nchunks = 4, overwrite = TRUE) - as.disk.frame(b, file.path(tempdir(), "tmp_b_aj2.df"), nchunks = 5, overwrite = TRUE) - as.disk.frame(d, file.path(tempdir(), "tmp_d_aj2.df"), overwrite = TRUE) -}) - -test_that("testing anti_join where right is data.frame", { - #skip_on_cran() - a = disk.frame(file.path(tempdir(), "tmp_a_aj.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_aj.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_aj.df")) - bc = collect(b) - dc = collect(d) - - 
abc = anti_join(a, bc, by = "a") %>% collect - expect_equal(nrow(abc), 50) - - abc0 = anti_join(a, bc, by = c("a","b")) %>% collect - expect_equal(nrow(abc0), 100) - - abc100 = anti_join(a, bc, by = "b") %>% collect - expect_equal(nrow(abc100), 0) - - abd50 = anti_join(a, dc, by = "b") %>% collect - expect_equal(nrow(abd50), 50) -}) - -test_that("testing anti_join where right is disk.frame", { - #skip_on_cran() - a = disk.frame(file.path(tempdir(),"tmp_a_aj2.df")) - b = disk.frame(file.path(tempdir(),"tmp_b_aj2.df")) - d = disk.frame(file.path(tempdir(),"tmp_d_aj2.df")) - - expect_warning({ - ab <- anti_join(a, b, by = "a", merge_by_chunk_id = FALSE) %>% collect - }) - expect_equal(nrow(ab), 50) - - expect_warning({ - ab0 = anti_join(a, b, by = c("a","b"), merge_by_chunk_id = FALSE) %>% collect - }) - expect_equal(nrow(ab0), 100) - - expect_warning({ - ab100 = anti_join(a, b, by = "b", merge_by_chunk_id = FALSE) %>% collect - }) - expect_equal(nrow(ab100), 0) - - expect_warning({ - ad50 = anti_join(a, d, by = "b", merge_by_chunk_id = FALSE) %>% collect - }) - expect_equal(nrow(ad50), 50) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(),"tmp_a_aj.df")) - fs::dir_delete(file.path(tempdir(),"tmp_b_aj.df")) - fs::dir_delete(file.path(tempdir(),"tmp_d_aj.df")) - - fs::dir_delete(file.path(tempdir(),"tmp_a_aj2.df")) - fs::dir_delete(file.path(tempdir(),"tmp_b_aj2.df")) - fs::dir_delete(file.path(tempdir(),"tmp_d_aj2.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-as-data-frame.R b/tests/testthat/test-as-data-frame.R deleted file mode 100644 index 0cb853fb..00000000 --- a/tests/testthat/test-as-data-frame.R +++ /dev/null @@ -1,14 +0,0 @@ -context("test-as-data-frame") - -test_that("as.data.frame works", { - tmpdir = tempfile("disk.frame.tmp") - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11, 100), tmpdir, overwrite = T) - dff = as.data.frame(df) - dft = data.table::as.data.table(df) - expect_s3_class(dff, "data.frame") - 
expect_s3_class(dft, "data.table") - expect_equal(nrow(dff), 1e5+11) - - delete(df) -}) - diff --git a/tests/testthat/test-as-disk-frame.R b/tests/testthat/test-as-disk-frame.R deleted file mode 100644 index b1ac42dc..00000000 --- a/tests/testthat/test-as-disk-frame.R +++ /dev/null @@ -1,15 +0,0 @@ -context("test-as-disk-frame") - -test_that("as.disk.frame works", { - ROWS = 1e5+11 - - df = disk.frame:::gen_datatable_synthetic(ROWS) - tf = file.path(tempdir(), "tmp_as_disk_frame_delete") - - dfdf <- as.disk.frame(df, outdir = tf, overwrite=TRUE) - - expect_equal(nrow(dfdf), ROWS) - expect_error(dfdf <- as.disk.frame(df, tf, overwrite=FALSE)) - - delete(dfdf) -}) diff --git a/tests/testthat/test-bloom-filter.r b/tests/testthat/test-bloom-filter.r deleted file mode 100644 index 9fa4ad42..00000000 --- a/tests/testthat/test-bloom-filter.r +++ /dev/null @@ -1,16 +0,0 @@ -# context("test-bloomfilter") -# -# test_that("bloomfilter should fail here", { -# expect_error(make_bloomfilter(df, c("origin", "dest"))) -# }) -# -# test_that("bloomfilter should succeed", { -# df = nycflights13::flights %>% as.disk.frame(shardby = c("carrier")) -# make_bloomfilter(df, "carrier") -# expect_true(length(bf_likely_in_chunks(df, "carrier", "UA")) == 1) -# -# expect_equal(nrow(collect(use_bloom_filter(df, "carrier", "UA"))), nrow(filter(nycflights13::flights, carrier == "UA"))) -# -# # clean up -# delete(df) -# }) diff --git a/tests/testthat/test-collect.R b/tests/testthat/test-collect.R deleted file mode 100644 index b5a174c8..00000000 --- a/tests/testthat/test-collect.R +++ /dev/null @@ -1,57 +0,0 @@ -context("test-collect") - -setup({ - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(),"tmp_col_delete"), overwrite=T) -}) - -test_that("collect works on simple data", { - df = disk.frame(file.path(tempdir(),"tmp_col_delete")) - dff = dplyr::collect(df) - expect_equal(nrow(dff), 1e5+11) - expect_s3_class(dff, "data.frame") - expect_s3_class(dff, 
"data.table") -}) - -test_that("collect works on lazy stream", { - df = disk.frame(file.path(tempdir(),"tmp_col_delete")) - df = cmap(df, lazy = T, ~{ - .x[1:10, ] - }) - dff = dplyr::collect(df) - expect_equal(nrow(dff), nchunks(df)*10) - expect_s3_class(dff, "data.frame") - expect_s3_class(dff, "data.table") -}) - -test_that("collect works on lazy stream followed by dplyr", { - df = disk.frame(file.path(tempdir(),"tmp_col_delete")) - df = cmap(df, lazy = T, ~{ - .x[1:10, ] - }) %>% select(id1, id4) - - dff = dplyr::collect(df) - expect_equal(nrow(dff), nchunks(df)*10) - expect_equal(ncol(dff), 2) - expect_s3_class(dff, "data.frame") - expect_s3_class(dff, "data.table") -}) - - -test_that("collect works on dplyr::select followed by lazy", { - df = disk.frame(file.path(tempdir(),"tmp_col_delete")) - df = df %>% select(id1, id4) %>% - cmap.disk.frame(lazy = T, ~{ - .x[1:10, ] - }) - - dff = dplyr::collect(df) - expect_equal(nrow(dff), nchunks(df)*10) - expect_equal(ncol(dff), 2) - expect_s3_class(dff, "data.frame") - expect_s3_class(dff, "data.table") -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(),"tmp_col_delete")) -}) \ No newline at end of file diff --git a/tests/testthat/test-compute.r b/tests/testthat/test-compute.r deleted file mode 100644 index 3a1bd56e..00000000 --- a/tests/testthat/test-compute.r +++ /dev/null @@ -1,55 +0,0 @@ -context("test-compute") - -setup({ - setup_disk.frame(workers = 2) - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(),"tmp_compute_delete"), overwrite=T) -}) - -test_that("compute works on simple data", { - df = disk.frame(file.path(tempdir(),"tmp_compute_delete")) - dff = compute(df) - - expect_equal(nrow(dff), 1e5+11) - expect_s3_class(dff, "disk.frame") -}) - -test_that("compute works on lazy stream", { - df = disk.frame(file.path(tempdir(),"tmp_compute_delete")) - df = cmap(df, lazy = T, ~{ - .x[1:10, ] - }) - dff = compute(df) - expect_equal(nrow(dff), nchunks(df)*10) - 
expect_s3_class(dff, "disk.frame") -}) - -test_that("compute works on lazy stream followed by dplyr", { - df = disk.frame(file.path(tempdir(),"tmp_compute_delete")) - df = cmap(df, lazy = T, ~{ - .x[1:10, ] - }) %>% select(id1, id4) - - dff = compute(df) - expect_equal(nrow(dff), nchunks(df)*10) - expect_equal(ncol(dff), 2) - expect_s3_class(dff, "disk.frame") -}) - - -test_that("compute works on dplyr::select followed by lazy", { - df = disk.frame(file.path(tempdir(),"tmp_compute_delete")) - df = df %>% select(id1, id4) %>% - cmap(lazy = T, ~{ - .x[1:10, ] - }) - - dff = dplyr::collect(df) - expect_equal(nrow(dff), nchunks(df)*10) - expect_equal(ncol(dff), 2) - expect_s3_class(dff, "data.frame") -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(),"tmp_compute_delete")) -}) \ No newline at end of file diff --git a/tests/testthat/test-csv2disk.frame.r b/tests/testthat/test-csv2disk.frame.r deleted file mode 100644 index dcc73652..00000000 --- a/tests/testthat/test-csv2disk.frame.r +++ /dev/null @@ -1,84 +0,0 @@ -context("test-csv2disk.frame") - -setup({ - df = disk.frame:::gen_datatable_synthetic(1e3+11) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete_csv2df.csv")) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete_csv2df2.csv")) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete_csv2df3.csv")) -}) - -test_that("csv2disk.frame works with no shard", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_csv2df.csv"), - file.path(tempdir(), "tmp_pls_delete_csv2df.df"), - overwrite=TRUE, - nchunks=max(2, recommend_nchunks(file.size(file.path(tempdir(), "tmp_pls_delete_csv2df.csv"))))) - dff1 = dff[,sum(v1), id1] - dff2 = dff1[,sum(V1), id1] - expect_false(nrow(dff1) == nrow(dff2)) - expect_equal(nrow(dff), 1e3+11) - expect_equal(ncol(dff), 10) -}) - -test_that("csv2disk.frame works with shard", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_csv2df2.csv"), - file.path(tempdir(), 
"tmp_pls_delete_csv2df2.df"), - shardby = "id1", overwrite = TRUE) - dff1 = dff[,sum(v1), id1] - dff2 = dff1[,sum(V1), id1] - expect_true(nrow(dff1) == nrow(dff2)) - expect_equal(nrow(dff), 1e3+11) - expect_equal(ncol(dff), 10) - - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_csv2df3.csv"), - file.path(tempdir(), "tmp_pls_delete_csv2df3.df"), - shardby = c("id1","id2")) - - dff1 = dff[,sum(v1), .(id1,id2)] - dff2 = dff1[,sum(V1), .(id1,id2)] - expect_true(nrow(dff1) == nrow(dff2)) - expect_equal(nrow(dff), 1e3+11) - expect_equal(ncol(dff), 10) -}) - -test_that("csv2disk.frame tests readr", { - library(dplyr) - library(disk.frame) - library(data.table) - library(nycflights13) - - expect_equal(1,1) - - # TODO make this test better - # convert from a data frame - # flights <- flights %>% - # dplyr::mutate(date = as.Date(paste(year, month, day, sep = "-"))) - # str(flights) # time_hour is POSIXct - # - # flights.df <- as.disk.frame( - # flights, - # outdir = file.path(tempdir(), "tmp_flights.df"), - # overwrite = TRUE) - # flights.df - # str(collect(flights.df)) - # - # # with sharding - # df_path = file.path(tempdir(), "tmp_flights.df") - # flights.df <- csv_to_disk.frame( - # csv_path, - # outdir = df_path, - # shardby = "minute", - # overwrite = T, - # backend = "readr") -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_pls_delete_csv2df.df")) - fs::dir_delete(file.path(tempdir(), "tmp_pls_delete_csv2df2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_pls_delete_csv2df3.df")) - fs::file_delete(file.path(tempdir(), "tmp_pls_delete_csv2df.csv")) - fs::file_delete(file.path(tempdir(), "tmp_pls_delete_csv2df2.csv")) - fs::file_delete(file.path(tempdir(), "tmp_pls_delete_csv2df3.csv")) -}) \ No newline at end of file diff --git a/tests/testthat/test-data-table.r b/tests/testthat/test-data-table.r deleted file mode 100644 index 0275ee4a..00000000 --- a/tests/testthat/test-data-table.r +++ /dev/null @@ -1,41 +0,0 @@ -context("test-data.table 
[") - -setup({ - library(data.table) - setup_disk.frame(workers = 2) - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(), "tmp_col_delete"), overwrite=TRUE, nchunks = 8) -}) - -test_that("data.table .N", { - library(data.table) - df = disk.frame(file.path(tempdir(), "tmp_col_delete")) - res <- sum(unlist(df[,.N])) - expect_equal(res , 1e5+11) -}) - -test_that("data.table .N+y V1", { - df = disk.frame(file.path(tempdir(), "tmp_col_delete")) - if(interactive()) { - y = 2 - - {y = 3; a <- df[,.(n_plus_y = .N + y), v1]} - b <- df[,.N, v1] - - expect_equal(a$n_plus_y, b$N + y) - } else { - # TODO figure out why the above fails - expect_equal(2L, 2L) - } -}) - -test_that("data.table do not return a data.table", { - library(data.table) - df = disk.frame(file.path(tempdir(), "tmp_col_delete")) - res <- df[,.(.N), rbind=FALSE] - expect_equal(typeof(res), "list") - expect_equal(length(res), 8) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_col_delete")) -}) diff --git a/tests/testthat/test-delete.r b/tests/testthat/test-delete.r deleted file mode 100644 index cc13cce8..00000000 --- a/tests/testthat/test-delete.r +++ /dev/null @@ -1,20 +0,0 @@ -context("test-delete") - -setup({ - setup_disk.frame(workers = 2) - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(), "tmp_del_delete"), overwrite = TRUE) -}) - -test_that("data.table .N", { - df = disk.frame(file.path(tempdir(), "tmp_del_delete")) - p = attr(df, "path", exact=TRUE) - expect_true(fs::dir_exists(p)) - - delete(df) - - expect_false(fs::dir_exists(p)) -}) - -teardown({ - #fs::dir_delete("tmp_del_delete") -}) \ No newline at end of file diff --git a/tests/testthat/test-disk-frame.r b/tests/testthat/test-disk-frame.r deleted file mode 100644 index 236e7a18..00000000 --- a/tests/testthat/test-disk-frame.r +++ /dev/null @@ -1,34 +0,0 @@ -context("test-disk.frame") - -# TODO add in tests here - -test_that("test add_meta", { - # it works so how 
to test this? - expect_equal(2L, 2L) - -}) - -test_that("test head", { - # it works so how to test this? - expect_equal(2L, 2L) - -}) - -test_that("test tail", { - # it works so how to test this? - expect_equal(2L, 2L) - -}) - - -test_that("test nrow", { - # it works so how to test this? - - expect_equal(2L, 2L) -}) - -test_that("test ncol", { - # it works so how to test this? - - expect_equal(2L, 2L) -}) \ No newline at end of file diff --git a/tests/testthat/test-dplyr-verbs.r b/tests/testthat/test-dplyr-verbs.r deleted file mode 100644 index f8f18f35..00000000 --- a/tests/testthat/test-dplyr-verbs.r +++ /dev/null @@ -1,175 +0,0 @@ -context("test-dplyr-verbs") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_b_dv.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing select", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - df = b %>% - select(a) %>% - collect - - expect_equal(ncol(df), 1) -}) - -test_that("testing rename", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - df = b %>% - rename(a_new_name = a) %>% - collect - - expect_setequal(colnames(df), c("a_new_name", "b")) -}) - -test_that("testing filter", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - df = b %>% - filter(a <= 100, b <= 10) %>% - collect - - expect_setequal(nrow(df), 10) -}) - -test_that("testing filter - global vars", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - one_hundred = 100 - - df = b %>% - filter(a <= one_hundred, b <= 10) %>% - collect - - expect_setequal(nrow(df), 10) -}) - -test_that("testing mutate", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - - df = b %>% - mutate(d = a + b) %>% - collect - - expect_setequal(sum(df$d), sum(df$a, df$b)) - - df = b %>% - mutate(e = rank(desc(a))) %>% - collect - - expect_equal(nrow(df), 100) - - # need to test - value <- as.disk.frame(tibble(char = LETTERS, - num = 1:26)) - df2 = value %>% - dplyr::mutate(b = case_when( - char %in% 
c("A", "B", "C") ~ "1", - TRUE ~ char)) %>% - collect - - expect_equal(ncol(df2), 3) - - # testing - fn = function(a, b) { - a+b - } - - df3 = value %>% - dplyr::mutate(b = fn(num, num)) %>% - collect - - expect_equal(ncol(df3), 3) - - - global_var = 100 - - df4 = value %>% - dplyr::mutate(b = fn(num, num), d = global_var*2) %>% - collect - - expect_equal(ncol(df4), 4) - expect_true(all(df4$d == 200)) -}) - -test_that("testing mutate user-defined function", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - - udf = function(a1, b1) { - a1 + b1 - } - - df = b %>% - mutate(d = udf(a,b)) %>% - collect - - expect_setequal(sum(df$d), sum(df$a, df$b)) -}) - -test_that("testing transmute", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - df = b %>% - transmute(d = a + b) %>% - collect - - expect_setequal(names(df), c("d")) -}) - -test_that("testing arrange", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - expect_warning(df <- b %>% - mutate(random_unif = runif(dplyr::n())) %>% - arrange(desc(random_unif))) - - df <- b %>% - mutate(random_unif = runif(dplyr::n())) %>% - chunk_arrange(desc(random_unif)) - - x = purrr::map_lgl(1:nchunks(df), ~{ - is.unsorted(.x) == FALSE - }) - - expect_true(all(x)) -}) - -test_that("testing chunk_summarise", { - b = disk.frame(file.path(tempdir(), "tmp_b_dv.df")) - - df = b %>% - chunk_summarise(suma = sum(a)) %>% - collect %>% - summarise(suma = sum(suma)) - - expect_equal(df$suma, collect(b)$a %>% sum) -}) - -test_that("testing mutate within function works", { - test_f <- function(params, x_df){ - x_df %>% mutate(aha = params[1]*cyl + params[2]*disp) - } - - expect_true("aha" %in% names(test_f(c(1, 2), mtcars))) -}) - -test_that("filter failure: prevent github #191 regression", { - flights_df = as.disk.frame(nycflights13::flights) - - # expect error due to syntax error - expect_warning(expect_error(flights_df %>% - filter(tailnum %in% paste0(unique(nycflights13::flights$tailnum)[1:60]), "") %>% - collect)) 
- - delete(flights_df) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_b_dv.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-dtplyr-support.r b/tests/testthat/test-dtplyr-support.r deleted file mode 100644 index a3499435..00000000 --- a/tests/testthat/test-dtplyr-support.r +++ /dev/null @@ -1,46 +0,0 @@ -context("test-dtplyr-verbs") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - tf = file.path(tempdir(), "test-dtplyr.df") - as.disk.frame(b, outdir = tf, nchunks = 5, overwrite = TRUE) -}) - -test_that("testing dtplyr", { - # TODO add tests when new version of dtplyr on CRAN - # iris_df = as.disk.frame(iris) - # - # iris_df %>% - # filter(Sepal.Length > 7) %>% - # collect() - # - # - # aa = iris_df %>% - # cmap(~{ - # dtplyr::lazy_dt(.x) %>% - # filter(Sepal.Length > 7) %>% - # collect() - # }) %>% - # collect - # - # - # lazy_dt <- function(...) { - # UseMethod("lazy_dt") - # } - # - # lazy_dt.disk.frame <- function(df, ...) { - # cmap(df, ) - # } - # - # lazy_dt.default <- function(...) { - # dtplyr::lazy_dt(...) 
- # } - expect_true(TRUE) -}) - - - -teardown({ - fs::dir_delete(file.path(tempdir(), "test-dtplyr.df")) -}) - diff --git a/tests/testthat/test-foverlaps.r b/tests/testthat/test-foverlaps.r deleted file mode 100644 index a4438aa0..00000000 --- a/tests/testthat/test-foverlaps.r +++ /dev/null @@ -1,42 +0,0 @@ -context("test-foverlaps") - -setup({ - #setup_disk.frame(workers = 1) -}) - -# TODO currently it's not possible to do -test_that("test foverlap with data.frame", { - x = as.disk.frame(data.table(start=c(5,31,22,16), end=c(8,50,25,18), val2 = 7:10)) - y = as.disk.frame(data.table(start=c(10, 20, 30), end=c(15, 35, 45), val1 = 1:3)) - byxy = c("start", "end") - xy.df = foverlaps.disk.frame( - x, y, by.x = byxy, by.y = byxy, - merge_by_chunk_id = TRUE, overwrite = TRUE) - - collect(xy.df) - - testthat::expect_equal(nrow(xy.df), 3) -}) - - -# TODO this is also not a good test case -# test_that("test foverlap with disk.frame", { -# x = data.table(start=c(5,31,22,16), end=c(8,50,25,18), val2 = 7:10) -# y = data.table(start=c(10, 20, 30), end=c(15, 35, 45), val1 = 1:3) -# setkey(y, start, end) -# -# dx = shard(x, "tmp_fo.df", overwrite = T, shardby=c("start","end")) -# dy = shard(y, "tmp_to.df", overwrite = T, shardby=c("start","end")) -# -# xy1 = foverlaps(x,y, type="any", which = T) -# -# dxy1 = foverlaps.disk.frame(dx, dy, type="any", outdir="tmp_fo_out2.df") ## return overlap join -# dxy1c = dxy1 %>% collect -# -# foverlaps.disk.frame(dx, dy, type="any", mult="first", outdir="tmp_fo_out2.df") ## returns only first match -# foverlaps.disk.frame(dx, dy, type="within", outdir="tmp_fo_out3.df") ## matches iff 'x' is within 'y' -# }) - -teardown({ - -}) \ No newline at end of file diff --git a/tests/testthat/test-full_join.R b/tests/testthat/test-full_join.R deleted file mode 100644 index f40e8cb8..00000000 --- a/tests/testthat/test-full_join.R +++ /dev/null @@ -1,58 +0,0 @@ -context("test-full_join") - -setup({ - a = data.frame(a = 1:100, b = 1:100) - b = data.frame(a 
= 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_fj.df"), nchunks = 4, overwrite = T) - as.disk.frame(b, file.path(tempdir(), "tmp_b_fj.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_d_fj.df"), overwrite = T) -}) - -test_that("testing full_join where right is data.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_fj.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_fj.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_fj.df")) - bc = collect(b) - dc = collect(d) - - abc <- full_join(a, bc, by = "a") %>% collect - expect_equal(nrow(abc), 150) - - abc0 <- full_join(a, bc, by = c("a","b")) %>% collect - expect_equal(nrow(abc0), 200) - - abc100 <- full_join(a, bc, by = "b") %>% collect - expect_equal(nrow(abc100), 100) - - abd50 <- full_join(a, dc, by = "b") %>% collect - expect_equal(nrow(abd50), 100) -}) - -test_that("testing full_join where right is disk.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_fj.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_fj.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_fj.df")) - - expect_warning({ - ab <- full_join(a, b, by = "a", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab), 150) - - expect_warning({ab0 = full_join(a, b, by = c("a","b"), merge_by_chunk_id = F) %>% collect}) - expect_equal(nrow(ab0), 200) - - expect_warning({ab100 = full_join(a, b, by = "b", merge_by_chunk_id = F) %>% collect}) - expect_equal(nrow(ab100), 100) - - expect_warning({ad50 = full_join(a, d, by = "b", merge_by_chunk_id = F) %>% collect}) - expect_equal(nrow(ad50), 100) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_a_fj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_fj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_fj.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-get_chunk.r b/tests/testthat/test-get_chunk.r deleted file mode 100644 index d33c336e..00000000 --- 
a/tests/testthat/test-get_chunk.r +++ /dev/null @@ -1,17 +0,0 @@ -context("test-get_chunk") - -setup({ - #setup_disk.frame(workers = 1) - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(), "tmp_del_delete"), overwrite=T) -}) - -test_that("data.table .N", { - df = disk.frame(file.path(tempdir(), "tmp_del_delete")) - expect_s3_class(get_chunk(df, 1), "data.frame") - - expect_s3_class(get_chunk(df, "1.fst"), "data.frame") -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_del_delete")) -}) \ No newline at end of file diff --git a/tests/testthat/test-get_chunk_ids.r b/tests/testthat/test-get_chunk_ids.r deleted file mode 100644 index 5e95c701..00000000 --- a/tests/testthat/test-get_chunk_ids.r +++ /dev/null @@ -1,20 +0,0 @@ -context("test-get_chunk_ids") - -setup({ - #setup_disk.frame(workers = 1) - df = as.disk.frame(disk.frame:::gen_datatable_synthetic(1e5+11), file.path(tempdir(), "tmp_del_delete"), overwrite=T) -}) - -test_that("get_chunk_ids", { - df = disk.frame(file.path(tempdir(), "tmp_del_delete")) - - gci = get_chunk_ids(df) - expect_type(get_chunk_ids(df), "character") - - gcis = get_chunk_ids(df, strip_extension = F) - expect_true("1.fst" %in% gcis) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_del_delete")) -}) \ No newline at end of file diff --git a/tests/testthat/test-glm.r b/tests/testthat/test-glm.r deleted file mode 100644 index efa0122a..00000000 --- a/tests/testthat/test-glm.r +++ /dev/null @@ -1,30 +0,0 @@ -context("test-glm") - -setup({ - #setup_disk.frame(workers = 1) -}) - -test_that("glm", { - cars.df = as.disk.frame(cars, outdir = file.path(tempdir(), "cars.df"), overwrite = TRUE) - - majorv = as.integer(version$major) - minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1]) - - if((majorv == 3) & (minorv < 6)) { - expect_warning({m <- dfglm(dist~speed, cars.df, glm_backend = "biglm")}) - } else { - m <- dfglm(dist~speed, cars.df, glm_backend = "biglm") - } - 
summary(m) - - if((majorv == 3) & (minorv >= 6) ) { - broom::tidy(m) - } - - m <- dfglm(dist~speed, cars.df, glm_backend = "speedglm") - summary(m) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "cars.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-group-by.R b/tests/testthat/test-group-by.R deleted file mode 100644 index d6684114..00000000 --- a/tests/testthat/test-group-by.R +++ /dev/null @@ -1,309 +0,0 @@ -context("test-group_by") - -setup({ - df = disk.frame:::gen_datatable_synthetic(1e3+11) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete_gb.csv")) -}) - - -test_that("new group_by framework", { - if(interactive()) { - iris.df = iris %>% - as.disk.frame - - grpby = iris.df %>% - group_by(Species) %>% - summarize(mean(Petal.Length), sumx = sum(Petal.Length/Sepal.Width), sd(Sepal.Width/ Petal.Length), var(Sepal.Width/ Sepal.Width)) %>% - collect - - grpby2 = iris %>% - group_by(Species) %>% - summarize(mean(Petal.Length), sumx = sum(Petal.Length/Sepal.Width), sd(Sepal.Width/ Petal.Length), var(Sepal.Width/ Sepal.Width)) %>% - arrange() - - for (n in names(grpby)) { - expect_true(all(grpby2[, n] == grpby[, n]) || all(abs(grpby2[, n] - grpby[, n]) < 0.0001)) - } - - delete(iris.df) - } - expect_true(TRUE) -}) - -test_that("new group_by framework - no group-by just summarise", { - if(interactive()) { - iris.df = iris %>% - as.disk.frame - - grpby = iris.df %>% - summarize(mean(Petal.Length), sumx = sum(Petal.Length/Sepal.Width), sd(Sepal.Width/ Petal.Length), var(Sepal.Width/ Sepal.Width)) %>% - collect - - grpby2 = iris %>% - summarize(mean(Petal.Length), sumx = sum(Petal.Length/Sepal.Width), sd(Sepal.Width/ Petal.Length), var(Sepal.Width/ Sepal.Width)) %>% - arrange() - - for (n in names(grpby)) { - expect_true(all(grpby2[, n] == grpby[, n]) || all(abs(grpby2[, n] - grpby[, n]) < 0.0001)) - } - - delete(iris.df) - } - expect_true(TRUE) -}) - -# test_that("new group_by framework - nested-group-by", { - # 
if(interactive()) { - # iris.df = iris %>% - # as.disk.frame - # - # expect_error(grpby <- iris.df %>% - # summarize(mean(Petal.Length + max(Petal.Length))) %>% - # collect) - # - # expect_error(grpby <- iris.df %>% - # summarize(mean(Petal.Length) + max(Petal.Length)) %>% - # collect) - # - # expect_error(grpby <- iris.df %>% - # summarize(mean(Petal.Length) + 1) %>% - # collect) - # - # expect_error(grpby <- iris.df %>% - # summarize(list(mean(Petal.Length))) %>% - # collect) - # - # fn_tmp = function(x) x + 1 - # grpby <- iris.df %>% - # summarize(mean(fn_tmp(Petal.Length))) %>% - # collect - # - # grpby2 <- iris %>% - # summarize(mean(fn_tmp(Petal.Length))) - # - # for (n in names(grpby)) { - # expect_true(all(grpby2[, n] == grpby[, n]) || all(abs(grpby2[, n] - grpby[, n]) < 0.0001)) - # } - # delete(iris.df) - # } - # expect_true(TRUE) -# }) - -test_that("guard against github #241", { - if(interactive()) { - # I suspect there was an issue with number of chunk = 1 - result_from_disk.frame = iris %>% - as.disk.frame(nchunks = 1) %>% - group_by(Species) %>% - summarize( - mean(Petal.Length), - sumx = sum(Petal.Length/Sepal.Width), - sd(Sepal.Width/ Petal.Length), - var(Sepal.Width/ Sepal.Width), - l = length(Sepal.Width/ Sepal.Width + 2), - max(Sepal.Width), - min(Sepal.Width), - median(Sepal.Width) - ) %>% - collect - } else { - expect_true(TRUE) - } -}) - - -test_that("group_by", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - dff_res = dff %>% - collect %>% - group_by(id1) %>% - summarise(mv1 = mean(v1)) - - dff1 <- dff %>% - chunk_group_by(id1, id2) %>% - chunk_summarise(mv1 = mean(v1)) %>% - collect - - expect_false(nrow(dff1) == nrow(dff_res)) -}) - -test_that("test hard_group_by on disk.frame", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - dff_res = dff %>% - collect %>% - group_by(id1, id2) 
%>% - summarise(mv1 = mean(v1)) - - dff1 <- dff %>% - hard_group_by(id1, id2) %>% - chunk_summarise(mv1 = mean(v1)) %>% collect - - expect_equal(nrow(dff1), nrow(dff_res)) -}) - -test_that("test hard_group_by on data.frame", { - df = disk.frame:::gen_datatable_synthetic(1e3+11) - - df1 = df %>% - group_by(id1, id2) %>% - summarise(mv1 = mean(v1)) - - dff1 <- df %>% - hard_group_by(id1,id2) %>% - summarise(mv1 = mean(v1)) - - expect_equal(nrow(dff1), nrow(df1)) -}) - - -test_that("test hard_group_by on disk.frame (sort)", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - dff_res = dff %>% - collect %>% - group_by(id1, id2) %>% - summarise(mv1 = mean(v1)) - - dff1 <- dff %>% - hard_group_by(id1, id2, shardby_function="sort") %>% - chunk_summarise(mv1 = mean(v1)) %>% collect - - expect_equal(nrow(dff1), nrow(dff_res)) -}) - -test_that("test hard_group_by on data.frame (sort)", { - df = disk.frame:::gen_datatable_synthetic(1e3+11) - - df1 = df %>% - group_by(id1, id2) %>% - summarise(mv1 = mean(v1)) - - dff1 <- df %>% - hard_group_by(id1, id2, shardby_function="sort") %>% - summarise(mv1 = mean(v1)) - - expect_equal(nrow(dff1), nrow(df1)) -}) - -test_that("guard against github 256", { - test2 <- tibble::tibble( - date = lubridate::ymd(rep(c("2019-01-02", "2019-02-03", "2019-03-04"), 4)), - uid = as.factor(rep(c(uuid::UUIDgenerate(), uuid::UUIDgenerate()), 6)), - proto = as.factor(rep(c("TCP", "UDP", "ICMP"), 4)), - port = as.double(rep(c(22, 21, 0), 4)) - ) - - correct_result = test2 %>% - group_by(date, uid, proto, port) %>% - summarize(n=n()) %>% - collect - - test_df = as.disk.frame(test2, nchunks = 2, overwrite=TRUE) - - incorrect_result = test_df %>% - group_by(date, uid, proto, port) %>% - summarize(n=n()) %>% - collect - - expect_equal(dim(incorrect_result), dim(correct_result)) -}) - -test_that("guard against github 256 #2", { - test2 <- tibble::tibble( - date = 
lubridate::ymd(rep(c("2019-01-02", "2019-02-03", "2019-03-04"), 4)), - uid = as.factor(rep(c(uuid::UUIDgenerate(), uuid::UUIDgenerate()), 6)), - proto = as.factor(rep(c("TCP", "UDP", "ICMP"), 4)), - port = as.double(rep(c(22, 21, 0), 4)) - ) - - test_df = as.disk.frame(test2, nchunks = 2, overwrite=TRUE) - - - correct_result = test_df %>% - group_by(!!!syms(names(test_df))) %>% - summarize(n=n()) %>% - collect - - incorrect_result = test_df %>% - group_by(date, uid, proto, port) %>% - summarize(n=n()) %>% - collect - - expect_equal(dim(incorrect_result), dim(correct_result)) -}) - -test_that("guard against github 256 #3", { - library(testthat) - library(disk.frame) - setup_disk.frame() - - test2 <- tibble::tibble( - date = sample(1:10, 20, replace = TRUE), - uid = sample(1:10, 20, replace = TRUE) - ) - - test_df = as.disk.frame(test2, nchunks = 2, overwrite=TRUE) - - ntd = names(test_df) - - correct_result = test_df %>% - group_by(!!!syms(ntd)) %>% - summarize(n=n()) %>% - collect - - incorrect_result = test_df %>% - group_by(date, uid) %>% - summarize(n=n()) %>% - collect - - expect_equal(dim(incorrect_result), dim(correct_result)) -}) - -test_that("tests for github #250", { - aggregate_expressions <- list(n = quote(n())) - - result1 = iris %>% - as.disk.frame() %>% - group_by(Species) %>% - summarise(n = n()) %>% - collect - - result2 <- iris %>% - as.disk.frame() %>% - group_by(Species) %>% - summarize(!!!(aggregate_expressions)) %>% - collect - - expect_equal(result1, result2) -}) - -test_that("tests for github #250 2", { - aggregate_expressions <- list(n = quote(n()), quote(n())) - - result1 = iris %>% - as.disk.frame() %>% - group_by(Species) %>% - summarise(n = n(), n()) %>% - collect; result1 - - result2 <- iris %>% - as.disk.frame() %>% - group_by(Species) %>% - summarize(!!!(aggregate_expressions)) %>% - collect - - expect_equal(result1, result2) -}) - -teardown({ - fs::file_delete(file.path(tempdir(), "tmp_pls_delete_gb.csv")) - 
fs::dir_delete(file.path(tempdir(), "tmp_pls_delete_gb.df")) -}) diff --git a/tests/testthat/test-hard-arrange.R b/tests/testthat/test-hard-arrange.R deleted file mode 100644 index 0419cee8..00000000 --- a/tests/testthat/test-hard-arrange.R +++ /dev/null @@ -1,111 +0,0 @@ -context("test-arrange") - -setup({ - - df = disk.frame:::gen_datatable_synthetic(1e3+11) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete_gb.csv")) -}) - -test_that("test hard_arrange on disk.frame, single chunk", { - # Randomise rows since rows are already sorted - iris.df = as.disk.frame(sample_n(iris, nrow(iris)), nchunks = 1) - iris_hard.df = hard_arrange(iris.df, Species) - - # Check sort - expect_true(!is.unsorted(iris_hard.df$Species)) -}) - -test_that("test hard_arrange on disk.frame, single variable", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - # Sort ascending, one level - sorted_dff <- dff %>% hard_arrange(id1) - sorted_df <- sorted_dff %>% collect - - expect_true(!is.unsorted(sorted_df$id1)) -}) - -test_that("test hard_arrange on disk.frame, factor data type", { - iris.df = as.disk.frame(sample_n(iris, nrow(iris)), nchunks = 2) - iris_hard.df = hard_arrange(iris.df, Species) - - expect_true(!is.unsorted(iris_hard.df$Species)) -}) - -test_that("test hard_arrange on disk.frame, date data type", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - sorted_dff <- dff %>% hard_arrange(date1) - - expect_true(!is.unsorted(sorted_dff$date1)) -}) - -test_that("test hard_arrange on disk.frame, two and three variables", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - dfp <- read.csv(file.path(tempdir(), "tmp_pls_delete_gb.csv")) - - # Sort ascending, two levels - sorted_dff <- dff %>% hard_arrange(id1, id4) %>% collect - sorted_dfp <- dff %>% 
collect %>% dplyr::arrange(id1, id4) - - # Compare vs dplyr - expect_true(all(sorted_dff$id1 == sorted_dfp$id1)) - expect_true(all(sorted_dff$id4 == sorted_dfp$id4)) - - # Sort ascending, three levels, from already partially sorted disk frame - sorted_dff2 <- sorted_dff %>% hard_arrange(id1, id4, id6) %>% collect - sorted_dfp2 <- dff %>% collect %>% dplyr::arrange(id1, id4, id6) - - # Compare vs dplyr - expect_true(all(sorted_dff2$id1 == sorted_dfp2$id1)) - expect_true(all(sorted_dff2$id4 == sorted_dfp2$id4)) - expect_true(all(sorted_dff2$id6 == sorted_dfp2$id6)) -}) - -test_that("test hard_arrange on disk.frame, two factors", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete_gb.csv"), - file.path(tempdir(), "tmp_pls_delete_gb.df")) - - # Sort decending, two levels - desc_dff <- dff %>% hard_arrange(desc(id4), id2) - desc_dff <- desc_dff %>% collect - - # Level 1 - expect_true(!is.unsorted(-desc_dff$id4)) - - # Level 2 - desc_dff$id4_id2 <- paste0( - formatC(max(desc_dff$id4) - desc_dff$id4, width=3, format="d", flag= "0"), - desc_dff$id2) - expect_true(!is.unsorted(-desc_dff$id4)) -}) - -test_that("test hard_arrange on data.frame vs dplyr", { - df = disk.frame:::gen_datatable_synthetic(1e3+11) - - # Sort ascending - sorted_dff <- df %>% hard_arrange(id1, id4) %>% collect - sorted_dfp <- df %>% dplyr::arrange(id1, id4) - - expect_true(all(sorted_dff$id1 == sorted_dfp$id1)) - expect_true(all(sorted_dff$id4 == sorted_dfp$id4)) - - # Sort decending - desc_dff <- df %>% hard_arrange(desc(id4), id2) %>% collect - desc_dfp <- df %>% dplyr::arrange(desc(id4), id2) - - expect_true(all(sorted_dff$id4 == sorted_dfp$id4)) - expect_true(all(sorted_dff$id2 == sorted_dfp$dfp)) -}) - -teardown({ - fs::file_delete(file.path(tempdir(), "tmp_pls_delete_gb.csv")) - fs::dir_delete(file.path(tempdir(), "tmp_pls_delete_gb.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-inner_join.R b/tests/testthat/test-inner_join.R deleted file mode 100644 index 
e165a142..00000000 --- a/tests/testthat/test-inner_join.R +++ /dev/null @@ -1,64 +0,0 @@ -context("test-inner_join") - -setup({ - a = data.frame(a = 1:100, b = 1:100) - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_ij.df"), nchunks = 4, overwrite = T) - as.disk.frame(b, file.path(tempdir(), "tmp_b_ij.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_d_ij.df"), overwrite = T) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_ij2.df"), nchunks = 4, overwrite = T) - as.disk.frame(b, file.path(tempdir(), "tmp_b_ij2.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_d_ij2.df"), overwrite = T) -}) - -test_that("testing inner_join where right is data.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_ij.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_ij.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_ij.df")) - bc = collect(b) - dc = collect(d) - - abc = inner_join(a, bc, by = "a") %>% collect - expect_equal(nrow(abc), 50) - - abc0 = inner_join(a, bc, by = c("a","b")) %>% collect - expect_equal(nrow(abc0), 0) - - abc100 = inner_join(a, bc, by = "b") %>% collect - expect_equal(nrow(abc100), 100) - - abd50 = inner_join(a, dc, by = "b") %>% collect - expect_equal(nrow(abd50), 50) -}) - -test_that("testing inner_join where right is disk.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_ij2.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_ij2.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_ij2.df")) - - ab = inner_join(a, b, by = "a", merge_by_chunk_id = F) %>% collect - expect_equal(nrow(ab), 50) - - # expecting a warning for some chunks being 0 rows - expect_warning(ab0 <- inner_join(a, b, by = c("a","b"), merge_by_chunk_id = F) %>% collect) - expect_equal(nrow(ab0), 0) - - ab100 = inner_join(a, b, by = "b", merge_by_chunk_id = F) %>% collect - expect_equal(nrow(ab100), 100) - - ad50 = inner_join(a, d, by = "b", 
merge_by_chunk_id = F) %>% collect - expect_equal(nrow(ad50), 50) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_a_ij.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_ij.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_ij.df")) - fs::dir_delete(file.path(tempdir(), "tmp_a_ij2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_ij2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_ij2.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-is-disk.frame.r b/tests/testthat/test-is-disk.frame.r deleted file mode 100644 index 87d4fde4..00000000 --- a/tests/testthat/test-is-disk.frame.r +++ /dev/null @@ -1,12 +0,0 @@ -context("test-is-disk-frame") - -test_that("testing is_disk.frame", { - fs::dir_create(file.path(tempdir(), "tmp_is_disk_frame")) - fst::write_fst(data.frame(a= 1, b = 1), file.path(tempdir(), "tmp_is_disk_frame/1.fst")) - fst::write_fst(data.frame(a= 1, b = 1), file.path(tempdir(), "tmp_is_disk_frame/2.fst")) - - df = disk.frame(file.path(tempdir(), "tmp_is_disk_frame")) - expect_true(is_disk.frame(df)) - - disk.frame::delete(df) -}) diff --git a/tests/testthat/test-left_join.R b/tests/testthat/test-left_join.R deleted file mode 100644 index 66801085..00000000 --- a/tests/testthat/test-left_join.R +++ /dev/null @@ -1,71 +0,0 @@ -context("test-left_join") - -setup({ - - a = data.frame(a = 1:100, b = 1:100) - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_lj.df"), nchunks = 4, overwrite = T) - as.disk.frame(b, file.path(tempdir(), "tmp_b_lj.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_d_lj.df"), overwrite = T) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_lj2.df"), nchunks = 4, overwrite = T) - as.disk.frame(b, file.path(tempdir(), "tmp_b_lj2.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_d_lj2.df"), overwrite = T) -}) - -test_that("testing left_join where right is data.frame", { 
- a = disk.frame(file.path(tempdir(), "tmp_a_lj.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_lj.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_lj.df")) - bc = collect(b) - dc = collect(d) - - abc = left_join(a, bc, by = "a") %>% collect - expect_equal(nrow(abc), 100) - - abc0 = left_join(a, bc, by = c("a","b")) %>% collect - expect_equal(nrow(abc0), 100) - - abc100 = left_join(a, bc, by = "b") %>% collect - expect_equal(nrow(abc100), 100) - - abd50 = left_join(a, dc, by = "b") %>% collect - expect_equal(nrow(abd50), 100) -}) - -test_that("testing left_join where right is disk.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_lj2.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_lj2.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_lj2.df")) - - expect_warning({ - ab = left_join(a, b, by = "a", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab), 100) - - expect_warning({ - ab0 = left_join(a, b, by = c("a","b"), merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab0), 100) - - expect_warning({ - ab100 = left_join(a, b, by = "b", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab100), 100) - - expect_warning({ - ad50 = left_join(a, d, by = "b", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ad50), 100) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_a_lj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_lj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_lj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_a_lj2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_lj2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_lj2.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-map.r b/tests/testthat/test-map.r deleted file mode 100644 index beec44ba..00000000 --- a/tests/testthat/test-map.r +++ /dev/null @@ -1,76 +0,0 @@ -context("test-cmap") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_map.df"), nchunks = 5, overwrite = T) -}) 
- -test_that("testing cmap lazy", { - b = disk.frame(file.path(tempdir(), "tmp_map.df")) - - # return 1 row from each chunk - df = b %>% cmap(~.x[1]) - - expect_s3_class(df, "disk.frame") - - df2 = df %>% collect - - expect_s3_class(df2, "data.frame") - - expect_equal(nrow(df2), 5L) -}) - -test_that("testing cmap eager", { - b = disk.frame(file.path(tempdir(), "tmp_map.df")) - - # return 1 row from each chunk - df = b %>% cmap(~.x[1], lazy = F) - expect_false("disk.frame" %in% class(df)) - - # return 1 row from each chunk - df = b %>% cmap_dfr(~.x[1]) - expect_false("disk.frame" %in% class(df)) - expect_true("data.frame" %in% class(df)) -}) - -test_that("testing delayed", { - b = disk.frame(file.path(tempdir(), "tmp_map.df")) - - # return 1 row from each chunk - df = b %>% delayed(~.x[1]) - - expect_s3_class(df, "disk.frame") - - df1 = collect(df) - - expect_equal(nrow(df1), 5) -}) - - -test_that("testing map_dfr", { - b = disk.frame(file.path(tempdir(), "tmp_map.df")) - - # return 1 row from each chunk - df = b %>% cmap_dfr(~.x[1,]) - - expect_s3_class(df, "data.frame") -}) - - -test_that("testing imap", { - b = disk.frame(file.path(tempdir(), "tmp_map.df")) - - # return 1 row from each chunk - df = b %>% cimap_dfr(~{ - y = .x[1,] - y[,ok := .y] - y - }) - - expect_s3_class(df, "data.frame") -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_map.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-map2.r b/tests/testthat/test-map2.r deleted file mode 100644 index 926d49ee..00000000 --- a/tests/testthat/test-map2.r +++ /dev/null @@ -1,46 +0,0 @@ -context("test-cmap2") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 151:250, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_map2.df"), nchunks = 5, overwrite = T) - as.disk.frame(d, file.path(tempdir(), "tmp_map2d.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing cmap2 .y is disk.frame", { - b = disk.frame(file.path(tempdir(), "tmp_map2.df")) - d = 
disk.frame(file.path(tempdir(), "tmp_map2d.df")) - - # return 1 row from each chunk - df = cmap2(b, d, ~rbindlist(list(.x[1,],.y[1,])), outdir = file.path(tempdir(), "tmp_map2_out.df")) - - expect_s3_class(df, "disk.frame") - - df2 = df %>% collect - - expect_s3_class(df2, "data.frame") - - expect_equal(nrow(df2), 10L) -}) - -test_that("testing map2 .y is not disk.frame", { - b = disk.frame(file.path(tempdir(), "tmp_map2.df")) - d = 1:nchunks(b) - - # return 1 row from each chunk - expect_warning(df <- cmap2(b, d, ~.x[1,.(y = .y)], outdir = "tmp_map2_out2.df")) - - expect_type(df, "list") - - df2 = df %>% rbindlist - - expect_s3_class(df2, "data.frame") - - expect_equal(nrow(df2), 5L) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_map2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_map2d.df")) - fs::dir_delete(file.path(tempdir(), "tmp_map2_out.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-merge.r b/tests/testthat/test-merge.r deleted file mode 100644 index 41bb37e4..00000000 --- a/tests/testthat/test-merge.r +++ /dev/null @@ -1,59 +0,0 @@ -context("test-merge.disk.frame") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 151:250, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_merge.df"), nchunks = 5, overwrite = TRUE) - as.disk.frame(d, file.path(tempdir(), "tmp_merge2.df"), nchunks = 5, overwrite = TRUE) -}) - -test_that("testing merge of disk.frame", { - b.df = disk.frame(file.path(tempdir(), "tmp_merge.df")) - d.df = disk.frame(file.path(tempdir(), "tmp_merge2.df")) - - bd.df = merge(b.df, d.df, by = "b", outdir = file.path(tempdir(), "tmp_bd_merge.df"), overwrite = TRUE, merge_by_chunk_id = TRUE) - - expect_s3_class(bd.df, "disk.frame") - expect_equal(nrow(bd.df), 100) -}) - -test_that("testing merge of data.frame", { - b.df = disk.frame(file.path(tempdir(), "tmp_merge.df")) - d = data.frame(a = 151:250, b = 1:100) - - bd.df = merge(b.df, d, by = "b", outdir = file.path(tempdir(), 
"tmp_bd_merge2.df"), overwrite = TRUE) - - expect_s3_class(bd.df, "disk.frame") - expect_equal(nrow(bd.df), 100) - - tmp = collect(bd.df) - - expect_s3_class(tmp, "data.frame") - expect_equal(nrow(tmp), 100) -}) - -test_that("testing error when merge_by_chunk = FALSE", { - b.df = disk.frame(file.path(tempdir(), "tmp_merge.df")) - d.df = disk.frame(file.path(tempdir(), "tmp_merge2.df")) - - testthat::expect_error() - expect_error( - merge( - b.df, - d.df, - by = "b", - outdir = file.path(tempdir(), "tmp_bd_merge.df"), - overwrite = TRUE, - merge_by_chunkd_id = FALSE - ) - ) -}) - - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_merge.df")) - fs::dir_delete(file.path(tempdir(), "tmp_merge2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_bd_merge.df")) - fs::dir_delete(file.path(tempdir(), "tmp_bd_merge2.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-names.r b/tests/testthat/test-names.r deleted file mode 100644 index 0441136b..00000000 --- a/tests/testthat/test-names.r +++ /dev/null @@ -1,18 +0,0 @@ -context("test-names") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_names.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing names", { - b = disk.frame(file.path(tempdir(), "tmp_names.df")) - - expect_setequal(colnames(b), c("a","b")) - expect_setequal(names(b), c("a","b")) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_names.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-nchunks.r b/tests/testthat/test-nchunks.r deleted file mode 100644 index bf716810..00000000 --- a/tests/testthat/test-nchunks.r +++ /dev/null @@ -1,18 +0,0 @@ -context("test-nchunks") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_chunks.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing nchunks", { - b = disk.frame(file.path(tempdir(), "tmp_chunks.df")) - - expect_equal(nchunks(b), 5) - expect_equal(nchunk(b), 5) 
-}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_chunks.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-nrow-ncol.R b/tests/testthat/test-nrow-ncol.R deleted file mode 100644 index 05b33601..00000000 --- a/tests/testthat/test-nrow-ncol.R +++ /dev/null @@ -1,20 +0,0 @@ -context("test-nrow-ncol") - -setup({ - df = disk.frame:::gen_datatable_synthetic(1e3+11) - data.table::fwrite(df, file.path(tempdir(), "tmp_pls_delete.csv")) -}) - -test_that("nrow ncol", { - dff = csv_to_disk.frame( - file.path(tempdir(), "tmp_pls_delete.csv"), - file.path(tempdir(), "tmp_pls_delete.df")) - - expect_equal(nrow(dff), 1e3+11) - expect_equal(ncol(dff), 10) -}) - -teardown({ - fs::file_delete(file.path(tempdir(), "tmp_pls_delete.csv")) - fs::dir_delete(file.path(tempdir(), "tmp_pls_delete.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-overwrite_check.r b/tests/testthat/test-overwrite_check.r deleted file mode 100644 index 59f6548e..00000000 --- a/tests/testthat/test-overwrite_check.r +++ /dev/null @@ -1,21 +0,0 @@ -context("test-overwrite_check") - -setup({ -}) - -test_that("testing overwrite_check", { - b = data.frame(a = 51:150, b = 1:100) - - fs::dir_create(file.path(tempdir(), "tmp_overwrite-check")) - fs::file_create(file.path(tempdir(), "tmp_overwrite-check/tmp")) - - - expect_error(disk.frame::overwrite_check(file.path(tempdir(), "tmp_overwrite-check"), overwrite = TRUE)) - - expect_error(disk.frame::overwrite_check(file.path(tempdir(), "tmp_overwrite-check"), overwrite = FALSE)) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_overwrite-check")) -}) \ No newline at end of file diff --git a/tests/testthat/test-pls-add.r b/tests/testthat/test-pls-add.r deleted file mode 100644 index 29f0e78b..00000000 --- a/tests/testthat/test-pls-add.r +++ /dev/null @@ -1,44 +0,0 @@ -context("test-pls-add") - -setup({ - #setup_disk.frame(workers = 1) -}) - -test_that("pls-add", { - - if (interactive()) { - 
library(disk.frame) - library(tidyverse) - - setup_disk.frame(2) - example <- as.disk.frame( - data.frame( - purchase_date=c("2020-03-20","2020-04-20"), - a = 1:2, - b = 3:4 - ) - ) - example %>% - mutate(Panel_Month = str_sub(purchase_date, 6, 7)) %>% - collect - - str_sub2 = function(xx, yy) xx + yy - - example %>% - mutate(Panel_Month = str_sub2(a, b)) %>% - collect - - example %>% - mutate(Panel_Month = str_sub2(a, 7)) %>% - collect - - example %>% - mutate(Panel_Month = str_sub2(6, 7)) %>% - collect - - - example %>% - mutate(Panel_Month = str_subs(purchase_date, 7)) %>% - collect - } -}) \ No newline at end of file diff --git a/tests/testthat/test-print.r b/tests/testthat/test-print.r deleted file mode 100644 index 9d1053cc..00000000 --- a/tests/testthat/test-print.r +++ /dev/null @@ -1,14 +0,0 @@ -context("test-print") - -setup({ -}) - -test_that("testing print", { - # TODO proper tests - expect_equal(2L, 2L) -}) - - -teardown({ - -}) \ No newline at end of file diff --git a/tests/testthat/test-pull.r b/tests/testthat/test-pull.r deleted file mode 100644 index 4acfa8d4..00000000 --- a/tests/testthat/test-pull.r +++ /dev/null @@ -1,50 +0,0 @@ -context("test-pull") - - -test_that("pull with", { - flights_df = as.disk.frame(nycflights13::flights) - - a = flights_df %>% - pull(carrier, carrier) - - b = flights_df %>% collect() %>% pull(carrier, carrier) - - expect_equal(a, b) - - a = flights_df %>% - pull(2, 2) - b = flights_df %>% collect() %>% pull(2, 2) - - expect_equal(a, b) - - a = flights_df %>% - pull(-1, -1) - b = flights_df %>% collect() %>% pull(-1, -1) - expect_equal(a, b) - - delete(flights_df) -}) - - -test_that("pull", { - flights_df = as.disk.frame(nycflights13::flights) - - a = flights_df %>% - pull(carrier) - b = flights_df %>% collect() %>% pull(carrier) - - expect_setequal(a, b) - - a = flights_df %>% - pull(2) - b = flights_df %>% collect() %>% pull(2) - - expect_setequal(a, b) - - a = flights_df %>% - pull(-1) - b = flights_df %>% collect() 
%>% pull(-1) - expect_setequal(a, b) - - delete(flights_df) -}) diff --git a/tests/testthat/test-rbindlist.r b/tests/testthat/test-rbindlist.r deleted file mode 100644 index d30cada0..00000000 --- a/tests/testthat/test-rbindlist.r +++ /dev/null @@ -1,31 +0,0 @@ -context("test-rbindlist") - -setup({ - as.disk.frame(disk.frame:::gen_datatable_synthetic(1e3+11), file.path(tempdir(), "tmp_rbindlist1.df"), overwrite=TRUE) - as.disk.frame(disk.frame:::gen_datatable_synthetic(1e3+11), file.path(tempdir(), "tmp_rbindlist2.df"), overwrite=TRUE) - as.disk.frame(disk.frame:::gen_datatable_synthetic(1e3+11), file.path(tempdir(), "tmp_rbindlist4.df"), overwrite=TRUE) -}) - -test_that("test rbindlist", { - df1 = disk.frame(file.path(tempdir(), "tmp_rbindlist1.df")) - df2 = disk.frame(file.path(tempdir(), "tmp_rbindlist2.df")) - - df3 = rbindlist.disk.frame(list(df1, df2), outdir = file.path(tempdir(), "tmp_rbindlist3.df"), overwrite=TRUE) - - expect_equal(nrow(df3), 2*(1e3+11)) -}) - -test_that("test rbindlist accepts only list", { - df1 = disk.frame(file.path(tempdir(), "tmp_rbindlist4.df")) - - expect_error(rbindlist.disk.frame(df1, outdir = file.path(tempdir(), "tmp_rbindlist5.df"))) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_rbindlist1.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rbindlist2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rbindlist3.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rbindlist4.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rbindlist5.df")) -}) diff --git a/tests/testthat/test-rechunk.r b/tests/testthat/test-rechunk.r deleted file mode 100644 index 68f59938..00000000 --- a/tests/testthat/test-rechunk.r +++ /dev/null @@ -1,82 +0,0 @@ -context("test-rechunk") - -setup({ -}) - -test_that("testing rechunk 5 to 4", { - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_rechunks.df"), nchunks = 5, overwrite = T) - - b = disk.frame(file.path(tempdir(), "tmp_rechunks.df")) - - b = rechunk(b, 4) 
- expect_equal(nrow(b), 100) - expect_equal(ncol(b), 2) - expect_equal(nchunk(b), 4) - - res = collect(b)[order(b)] - - expect_equal(res$b, 1:100) - expect_equal(res$a, 51:150) -}) - -test_that("testing rechunk 5 to 3", { - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_rechunks2.df"), nchunks = 5, overwrite = T) - - b = disk.frame(file.path(tempdir(), "tmp_rechunks2.df")) - - b = rechunk(b, 3) - expect_equal(nrow(b), 100) - expect_equal(ncol(b), 2) - expect_equal(nchunk(b), 3) - - res = collect(b)[order(b)] - - expect_equal(res$b, 1:100) - expect_equal(res$a, 51:150) -}) - -test_that("testing rechunk 5 to 6", { - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_rechunks3.df"), nchunks = 5, overwrite = T) - - b = disk.frame(file.path(tempdir(), "tmp_rechunks3.df")) - - b = rechunk(b, 6) - expect_equal(nrow(b), 100) - expect_equal(ncol(b), 2) - expect_equal(nchunk(b), 6) - - res = collect(b)[order(b)] - - expect_equal(res$b, 1:100) - expect_equal(res$a, 51:150) -}) - -test_that("testing rechunk 5 to 7", { - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_rechunks4.df"), nchunks = 5, overwrite = T) - - b = disk.frame(file.path(tempdir(), "tmp_rechunks4.df")) - - b = rechunk(b, 7) - expect_equal(nrow(b), 100) - expect_equal(ncol(b), 2) - expect_equal(nchunk(b), 7) - - res = collect(b)[order(b)] - - expect_equal(res$b, 1:100) - expect_equal(res$a, 51:150) -}) - -# TODO do shardby; it's kinda of mitigated by thorough testing on Fannie Mae - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_rechunks.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rechunks2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rechunks3.df")) - fs::dir_delete(file.path(tempdir(), "tmp_rechunks4.df")) -}) diff --git a/tests/testthat/test-recommend_nchunk.R b/tests/testthat/test-recommend_nchunk.R deleted file mode 100644 index c5fbb109..00000000 --- 
a/tests/testthat/test-recommend_nchunk.R +++ /dev/null @@ -1,16 +0,0 @@ -context("test-recommend_nchunk") - -test_that("testing df_ram_size", { - expect_true(is.numeric(df_ram_size())) - - expect_true(!is.na(df_ram_size())) - expect_true(!is.null(df_ram_size())) - expect_true(!is.nan(df_ram_size())) - expect_true(is.finite(df_ram_size())) -}) - -test_that("testing df_ram_size; guards #213", { - # TODO tests - expect_true(df_ram_size() >= 1) -}) - diff --git a/tests/testthat/test-remove_chunk.r b/tests/testthat/test-remove_chunk.r deleted file mode 100644 index 8aec02ae..00000000 --- a/tests/testthat/test-remove_chunk.r +++ /dev/null @@ -1,18 +0,0 @@ -context("test-remove") - -test_that("testing remove chunk 3 of 5", { - b = data.frame(a = 51:150, b = 1:100) - tmp = file.path(tempdir(), "tmp_remove.df") - b = as.disk.frame(b, tmp, nchunks = 5, overwrite = T) - - b = remove_chunk(b, 3) - expect_equal(nrow(b), 80) - expect_equal(ncol(b), 2) - expect_equal(nchunk(b), 4) - - res <- collect(b)[order(b)] - - expect_equal(nrow(res), 80) - - delete(b) -}) diff --git a/tests/testthat/test-right_join.r b/tests/testthat/test-right_join.r deleted file mode 100644 index 27e532b4..00000000 --- a/tests/testthat/test-right_join.r +++ /dev/null @@ -1,7 +0,0 @@ -context("test-right_join") - -test_that("testing right_join", { - # TODO tests - expect_equal(2L, 2L) -}) - diff --git a/tests/testthat/test-sample_frac.r b/tests/testthat/test-sample_frac.r deleted file mode 100644 index 8c45f8f7..00000000 --- a/tests/testthat/test-sample_frac.r +++ /dev/null @@ -1,20 +0,0 @@ -context("test-sampe_frac") - -setup({ - a = data.frame(a = 1:100, b = 1:100) - - as.disk.frame(a, file.path(tempdir(), "tmp_sample_frac.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing sample_frac", { - a = disk.frame(file.path(tempdir(), "tmp_sample_frac.df")) - a40 <- sample_frac(a, 0.4) %>% collect - - expect_equal(nrow(a40), 40) - - expect_error(a40 <- sample_frac(a, 0.4, weight = 1) %>% collect) -}) - 
-teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_sample_frac.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-sample_n.r b/tests/testthat/test-sample_n.r deleted file mode 100644 index faf76259..00000000 --- a/tests/testthat/test-sample_n.r +++ /dev/null @@ -1,16 +0,0 @@ -context("test-sample_n") - -setup({ - a = data.frame(a = 1:100, b = 1:100) - - as.disk.frame(a, file.path(tempdir(), "tmp_sample_n.df"), nchunks = 5, overwrite = T) -}) - -test_that("testing semi_join where right is data.frame", { - a = disk.frame(file.path(tempdir(), "tmp_sample_n.df")) - expect_error(a40 <- sample_n(a, 40) %>% collect) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_sample_n.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-sas_to_csv.r b/tests/testthat/test-sas_to_csv.r deleted file mode 100644 index 0bdd6fa4..00000000 --- a/tests/testthat/test-sas_to_csv.r +++ /dev/null @@ -1,8 +0,0 @@ -# TODO everything - -context("test-sas_to_csv") - -test_that("testing sas_to_csv", { - # TODO tests - expect_equal(2L, 2L) -}) diff --git a/tests/testthat/test-sas_to_disk.frame.r b/tests/testthat/test-sas_to_disk.frame.r deleted file mode 100644 index dbd64e3e..00000000 --- a/tests/testthat/test-sas_to_disk.frame.r +++ /dev/null @@ -1,10 +0,0 @@ -# TODO everything - -context("test-sas_to_disk.frame") - - -test_that("testing sas_to_disk.frame", { - # TODO tests - expect_equal(2L, 2L) -}) - diff --git a/tests/testthat/test-semi_join.R b/tests/testthat/test-semi_join.R deleted file mode 100644 index 7b96c3ac..00000000 --- a/tests/testthat/test-semi_join.R +++ /dev/null @@ -1,72 +0,0 @@ -context("test-semi_join") - -setup({ - - a = data.frame(a = 1:100, b = 1:100) - b = data.frame(a = 51:150, b = 1:100) - d = data.frame(a = 1:50, b = 1:50) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_sj.df"), nchunks = 4, overwrite = TRUE) - as.disk.frame(b, file.path(tempdir(), "tmp_b_sj.df"), nchunks = 5, overwrite = TRUE) - as.disk.frame(d, 
file.path(tempdir(), "tmp_d_sj.df"), overwrite = TRUE) - - as.disk.frame(a, file.path(tempdir(), "tmp_a_sj2.df"), nchunks = 4, overwrite = TRUE) - as.disk.frame(b, file.path(tempdir(), "tmp_b_sj2.df"), nchunks = 5, overwrite = TRUE) - as.disk.frame(d, file.path(tempdir(), "tmp_d_sj2.df"), overwrite = TRUE) -}) - -test_that("testing semi_join where right is data.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_sj.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_sj.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_sj.df")) - bc = collect(b) - dc = collect(d) - - abc = semi_join(a, bc, by = "a") %>% collect - expect_equal(nrow(abc), 50) - - abc0 = semi_join(a, bc, by = c("a","b")) %>% collect - expect_equal(nrow(abc0), 0) - - abc100 = semi_join(a, bc, by = "b") %>% collect - expect_equal(nrow(abc100), 100) - - abd50 = semi_join(a, dc, by = "b") %>% collect - expect_equal(nrow(abd50), 50) -}) - -test_that("testing semi_join where right is disk.frame", { - a = disk.frame(file.path(tempdir(), "tmp_a_sj2.df")) - b = disk.frame(file.path(tempdir(), "tmp_b_sj2.df")) - d = disk.frame(file.path(tempdir(), "tmp_d_sj2.df")) - - expect_warning({ - ab = semi_join(a, b, by = "a", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab), 50) - - expect_warning({ - ab0 = semi_join(a, b, by = c("a","b"), merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab0), 0) - - expect_warning({ - ab100 = semi_join(a, b, by = "b", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ab100), 100) - - expect_warning({ - ad50 = semi_join(a, d, by = "b", merge_by_chunk_id = F) %>% collect - }) - expect_equal(nrow(ad50), 50) -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_a_sj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_sj.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_sj.df")) - - fs::dir_delete(file.path(tempdir(), "tmp_a_sj2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_b_sj2.df")) - fs::dir_delete(file.path(tempdir(), "tmp_d_sj2.df")) -}) 
\ No newline at end of file diff --git a/tests/testthat/test-setup.r b/tests/testthat/test-setup.r deleted file mode 100644 index 4d3473d1..00000000 --- a/tests/testthat/test-setup.r +++ /dev/null @@ -1,7 +0,0 @@ -context("test-setup") - -test_that("testing sas_to_disk.frame", { - setup_disk.frame(workers = 2) - a = future::nbrOfWorkers() - expect_equal(a, 2) -}) \ No newline at end of file diff --git a/tests/testthat/test-shard.r b/tests/testthat/test-shard.r deleted file mode 100644 index 0a2e28e5..00000000 --- a/tests/testthat/test-shard.r +++ /dev/null @@ -1,28 +0,0 @@ -context("test-shard") - -setup({ -}) - -test_that("testing shard data.frame", { - set.seed(1) - a = data.table(a = rep(1:10, 10), b = 1:100) - a = shard(a, "a", nchunks = 2, overwrite = TRUE, outdir=file.path(tempdir(), "tmp_shard.df")) - - expect_equal(nchunks(a), 2) - expect_equal(nrow(a), 100) - expect_equal(ncol(a), 2) - - a1 = unique(get_chunk(a,1)$a) - a2 = unique(get_chunk(a,2)$a) - expect_equal(length(intersect(a1, a2)), 0) - - a3 = shard(a, "a", nchunks = 4, overwrite = TRUE) - - expect_equal(nchunks(a3), 4) - expect_equal(nrow(a3), 100) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_shard.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-shardkey.r b/tests/testthat/test-shardkey.r deleted file mode 100644 index 846b81bb..00000000 --- a/tests/testthat/test-shardkey.r +++ /dev/null @@ -1,17 +0,0 @@ -context("test-shardkey") - -setup({ -}) - -test_that("testing shardkey", { - set.seed(1) - a = data.table(a = rep(1:10, 10), b = 1:100) - a = shard(a, "a", nchunks = 2, overwrite = TRUE, outdir=file.path(tempdir(), "tmp_shardkey.df")) - - expect_equal(shardkey(a), list(shardkey="a", shardchunks=2)) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_shardkey.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-srckeep.r b/tests/testthat/test-srckeep.r deleted file mode 100644 index 5b6fa370..00000000 --- 
a/tests/testthat/test-srckeep.r +++ /dev/null @@ -1,17 +0,0 @@ -context("test-keep") - -setup({ - b = data.frame(a = 51:150, b = 1:100) - as.disk.frame(b, file.path(tempdir(), "tmp_srckeep.df"), nchunks = 5, overwrite = TRUE) -}) - -test_that("testing srckeep", { - b = disk.frame(file.path(tempdir(), "tmp_srckeep.df")) - b1 = b %>% srckeep("a") - expect_equal(ncol(b1 %>% collect), 1) - expect_equal(colnames(b1 %>% collect), "a") -}) - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_srckeep.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-tbl_vars.r b/tests/testthat/test-tbl_vars.r deleted file mode 100644 index 5cd00ffa..00000000 --- a/tests/testthat/test-tbl_vars.r +++ /dev/null @@ -1,16 +0,0 @@ -context("test-tbl_vars") - -setup({ -}) - -test_that("testing tbl_vars", { - a = data.table(a = rep(1:10, 10), b = 1:100) - a = shard(a, "a", nchunks = 2, overwrite = TRUE, outdir=file.path(tempdir(), "tmp_tbl_vars.df")) - - expect_setequal(tbl_vars(a), c("a","b")) -}) - - -teardown({ - fs::dir_delete(file.path(tempdir(), "tmp_tbl_vars.df")) -}) \ No newline at end of file diff --git a/tests/testthat/test-util.r b/tests/testthat/test-util.r deleted file mode 100644 index a9db9f37..00000000 --- a/tests/testthat/test-util.r +++ /dev/null @@ -1,8 +0,0 @@ -context("test-util") - -test_that("testing evalparseglue", { - x = 2 - y = 3 - expect_equal(evalparseglue("{x}+{y}"), 5) -}) - diff --git a/tests/testthat/test-write_disk.frame.R b/tests/testthat/test-write_disk.frame.R deleted file mode 100644 index c5650c81..00000000 --- a/tests/testthat/test-write_disk.frame.R +++ /dev/null @@ -1,39 +0,0 @@ -context("test-write_disk.frame") - -test_that("as.disk.frame works", { - ROWS = 1e3+11 - - tmp_write_disk.frame = tempfile() - tmp_write_disk.frame2 = tempfile() - - df = disk.frame:::gen_datatable_synthetic(ROWS) - dfdf <- as.disk.frame(df, tmp_write_disk.frame, overwrite = TRUE, nchunks = 5) - - a = dfdf %>% cmap(~{ - .x[1,] - }) %>% 
write_disk.frame(outdir = tmp_write_disk.frame2, overwrite = T) - - expect_equal(nrow(a), 5) - - fs::dir_delete(tmp_write_disk.frame) - fs::dir_delete(tmp_write_disk.frame2) -}) - -test_that("as.disk.frame fails if data frame has list-columns", { - df <- tibble::tibble("a" = c(1,2,3), "b" = list("a", "b", "c")) - expect_error(as.disk.frame(df, file.path(tempdir(), "tmp_write_disk.frame"), overwrite = TRUE, nchunks = 6)) -}) - -test_that("write_disk.frame shard works", { - mtcars_df = as.disk.frame( - mtcars, - outdir = file.path(tempdir(), "mt_shard_by_cyl"), - shardby = c("cyl","vs"), - nchunks = 3, - overwrite = TRUE) - - res = mtcars_df %>% collect_list - expect_equal(length(res), 3) - testthat::expect_type(res, "list") - -}) diff --git a/tests/testthat/test-zip_to_disk.frame.r b/tests/testthat/test-zip_to_disk.frame.r deleted file mode 100644 index b2e4c31e..00000000 --- a/tests/testthat/test-zip_to_disk.frame.r +++ /dev/null @@ -1,7 +0,0 @@ -context("test-zip_to_disk.frame") - -# TODO do some testing -test_that("testing zip_to_disk.frame", { - expect_true(TRUE) -}) - diff --git a/utils/build_utils.R b/utils/build_utils.R index b158a0bf..33103cf0 100644 --- a/utils/build_utils.R +++ b/utils/build_utils.R @@ -73,19 +73,19 @@ df_setup_vignette <- function(excl = "", strip_number = FALSE) { df_test <- function() { # rename tests - if(fs::dir_exists("tests_manual")) { - fs::dir_copy("tests_manual", "tests") - Sys.sleep(3) # allow enough time for it to happen - fs::dir_delete("tests_manual") - } + # if(fs::dir_exists("tests_manual")) { + # fs::dir_copy("tests_manual", "tests") + # Sys.sleep(3) # allow enough time for it to happen + # fs::dir_delete("tests_manual") + # } devtools::test() - if(fs::dir_exists("tests")) { - fs::dir_copy("tests", "tests_manual") - Sys.sleep(8) # allow enough time for it to happen - fs::dir_delete("tests") - } + # if(fs::dir_exists("tests")) { + # fs::dir_copy("tests", "tests_manual") + # Sys.sleep(8) # allow enough time for it to happen 
+ # fs::dir_delete("tests") + # } } df_build_vignettes_for_cran <- function() { diff --git a/vignettes/concepts.Rmd b/vignettes/concepts.Rmd deleted file mode 100644 index d320fd90..00000000 --- a/vignettes/concepts.Rmd +++ /dev/null @@ -1,69 +0,0 @@ ---- -title: "Key `{disk.frame}` concepts" -author: "ZJ" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Key disk.frame concepts} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r, include = FALSE} -knitr::opts_chunk$set( - collapse = TRUE, - comment = "#>" -) -``` - -# Key `{disk.frame}` concepts -There are a number of concepts and terminologies that are useful to understand in order to use `disk.frame` effectively. - -## What is a `disk.frame` and what are chunks? - -A `disk.frame` is a folder containing [`fst`](https://www.fstpackage.org/) files named "1.fst", "2.fst", "3.fst" etc. Each of the ".fst" file is called a _chunk_. - -## Workers and parallelism - -Parallelism in `disk.frame` is achieved using the [`future` package](https://cran.r-project.org/package=future). When performing many tasks, `disk.frame` uses multiple workers, where each _worker_ is an R session, to perform the tasks in parallel. - -It is recommended that you should run the following immediately after `library(disk.frame)` to set-up multiple workers. For example: - -```r -library(disk.frame) -setup_disk.frame() - -# this will allow unlimited amount of data to be passed from worker to worker -options(future.globals.maxSize = Inf) -``` - -For example, suppose we wish to compute the number of rows for each chunk, we can clearly perform this simultaneously in parallel. The code to do that is - -```r -# use only one column is fastest -df[,.N, keep = "first_col"] -``` - -or equivalent using the `srckeep` function - -```r -# use only one column is fastest -srckeep(df, "first_col")[,.N, keep = "first_col"] -``` - -Say there are `n` chunks in `df`, and there are `m` workers. 
Then the first `m` chunks will run `chunk[,.N]` simultaneously. - -To see how many workers are at work, use -```r -# see how many workers are available for work -future::nbrOfWorkers() -``` - -## How `{disk.frame}` works - -When `df %>% some_fn %>% collect` is called. The `some_fn` is applied to each chunk of `df`. The collect will row-bind the results from `some_fn(chunk)`together if the returned value of `some_fn` is a data.frame, or it will return a `list` containing the results of `some_fn`. - -The session that receives these results is called the **main session**. In general, we should try to minimize the amount of data passed from the worker sessions back to the main session, because passing data around can be slow. - -Also, please note that there is no communication between the workers, except for workers passing data back to the main session. - - diff --git a/vignettes/convenience-features.Rmd b/vignettes/convenience-features.Rmd deleted file mode 100644 index 6269a97b..00000000 --- a/vignettes/convenience-features.Rmd +++ /dev/null @@ -1,54 +0,0 @@ ---- -title: "Convenience features" -author: "ZJ" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Convenience features} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r, include = FALSE} -knitr::opts_chunk$set( - collapse = TRUE, - comment = "#>" -) -``` - -## Convenience Features - -### GUI for setting options - -I wanted to make `{disk.frame}` as easy to use as possible. I often forget what options are available to me. So I've made a GUI - -```r -setup_disk.frame(gui = TRUE) -``` -which opens up a Shiny app where the user can choose the options. 
- -### RStudio column name completion - -```r -library(disk.frame) -mtcars.df = as.disk.frame(mtcars) - -mtcars.df %>% - filter() -``` - -you can press tab in RStudio and it will show all column available - -### Insert ceremony/boilerplate into code in RStudio - -The below will insert the recommended ceremony code into your editor -```r -disk.frame::insert_ceremony() -``` -should insert - -```r -# this willl set disk.frame with multiple workers -setup_disk.frame() -# this will allow unlimited amount of data to be passed from worker to worker -options(future.globals.maxSize = Inf) -``` diff --git a/vignettes/data-table-syntax.Rmd b/vignettes/data-table-syntax.Rmd deleted file mode 100644 index e87ca88b..00000000 --- a/vignettes/data-table-syntax.Rmd +++ /dev/null @@ -1,78 +0,0 @@ ---- -title: "Using data.table syntax with disk.frame" -author: "ZJ" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Using data.table syntax} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r, include = FALSE} -knitr::opts_chunk$set( - collapse = TRUE, - comment = "#>" -) -``` - -## `disk.frame` supports `data.table` syntax - - -```{r setup_data_table, cache=TRUE} -library(disk.frame) - -# set-up disk.frame to use multiple workers -if(interactive()) { - setup_disk.frame() - # highly recommended, however it is pun into interactive() for CRAN because - # change user options are not allowed on CRAN - options(future.globals.maxSize = Inf) -} else { - setup_disk.frame(2) -} - - -library(nycflights13) - -# create a disk.frame -flights.df = as.disk.frame(nycflights13::flights, outdir = file.path(tempdir(),"flights13"), overwrite = TRUE) -``` - -In the following example, I will use the `.N` from the `data.table` package to count the unique combinations `year` and `month` within each chunk. 
- -```{r ok, dependson='setup_data_table'} -library(data.table) -library(disk.frame) - -flights.df = disk.frame(file.path(tempdir(),"flights13")) - -names(flights.df) - -flights.df[,.N, .(year, month), keep = c("year", "month")] -``` - -All `data.table` syntax are supported. However, `disk.frame` adds the ability to load only those columns required for the analysis using the `keep =` option. In the above analysis, only the `year` and `month` variables are required and hence `keep = c("year", "month")` was used. - -Alternatively, we can use the `srckeep` function to achieve the same, e.g. - -```r -srckeep(flights.df, c("year", "month"))[,.N, .(year, month)] -``` - -### External variables are captured - -`disk.frame` sends the computation to background workers which are essentially distinct and separate R sessions. Typically, the variables that you have available in your current R session aren't visible in the other R sessions, but `disk.frame` uses the `future` package's variable detection abilities to figure out which variables are in use and then send them to the background workers so they have access to the variables as well. E.g. - -```{r var_detect, dependson='setup_data_table'} -y = 42 -some_fn <- function(x) x - - -flights.df[,some_fn(y)] -``` - -In the above example, neither `some_fn` nor `y` are defined in the background workers' environments, but `disk.frame` still manages to evaluate this code `flights.df[,some_fn(y)]`. 
- -```{r clean_up, include=FALSE} -fs::dir_delete(file.path(tempdir(),"flights13")) -``` \ No newline at end of file diff --git a/vignettes/glm.Rmd b/vignettes/glm.Rmd deleted file mode 100644 index 1d5fb418..00000000 --- a/vignettes/glm.Rmd +++ /dev/null @@ -1,111 +0,0 @@ ---- -title: "Generalized Linear Models (GLM) including logistic regression with disk.frame" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Generalized Linear Models (logistic regression etc) with disk.frame} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r, include = FALSE} -knitr::opts_chunk$set( - collapse = TRUE, - comment = "#>" -) -``` - -```{r setup, cache=TRUE} -suppressPackageStartupMessages(library(disk.frame)) - -if(interactive()) { - setup_disk.frame() -} else { - # only use 1 work to pass CRAN check - setup_disk.frame(1) -} - -``` - -# GLMs - -### Prerequisites -In this article, we will assume you are familiar with Generalized Linear Models (GLMs). You are also expected to have basic working knowledge of {`disk.frame`}, see this [{`disk.frame`} Quick Start](http://diskframe.com/articles/intro-disk-frame.html). - -## Introduction -One can fit a GLM using the `glm` function. For example, - -```{r glm, cache=TRUE} -m = glm(dist ~ speed, data = cars) -``` - -would fit a linear model on the data `cars` with `dist` as the target and `speed` as the explanatory variable. You can inspect the results of the model fit using - -```{r, depeondson='glm'} -summary(m) -``` - -or if you have `{broom}` installed - -```{r, depeondson='glm'} -broom::tidy(m) -``` - -With {`disk.frame`}, you can run GLM `dfglm` function, where the `df` stands for `disk.frame` of course! 
-```{r dependson='setup'} -cars.df = as.disk.frame(cars) - -m = dfglm(dist ~ speed, cars.df) - -summary(m) - - -majorv = as.integer(version$major) -minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1]) - -if((majorv == 3) & (minorv >= 6)) { - broom::tidy(m) -} else { - # broom doesn't work in version < R3.6 because biglm does not work -} - -``` - -The syntax didn't change at all! You are able to enjoy the benefits of `disk.frame` when dealing with larger-than-RAM data. - -## Logistic regression -Logistic regression is one of the most commonly deployed machine learning (ML) models. It is often used to build binary classification models - -```{r dependson='setup'} -iris.df = as.disk.frame(iris) - -# fit a logistic regression model to predict Speciess == "setosa" using all variables -all_terms_except_species = setdiff(names(iris.df), "Species") -formula_rhs = paste0(all_terms_except_species, collapse = "+") - -formula = as.formula(paste("Species == 'versicolor' ~ ", formula_rhs)) - -iris_model = dfglm(formula , data = iris.df, family=binomial()) - -# iris_model = dfglm(Species == "setosa" ~ , data = iris.df, family=binomial()) - -summary(iris_model) - -majorv = as.integer(version$major) -minorv = as.integer(strsplit(version$minor, ".", fixed=TRUE)[[1]][1]) - -if((majorv == 3) & (minorv >= 6)) { - broom::tidy(iris_model) -} else { - # broom doesn't work in version < R3.6 because biglm does not work -} - -``` - -The arguments to the `dfglm` function are the same as the arguments to `biglm::bigglm` which are based on the `glm` function. Please check their documentations for other argument options. - -## Notes -`{disk.frame}` uses `{biglm}` and `{speedglm}` as the backend for GLMs. Unfortunately, neither package is managed on open-source platforms, so it's more difficult to contribute to them by making bug fixes and submitting bug reports. So bugs are likely to persists. There is an active effort on `disk.frame` to look for alternatives. 
Example of avenues to explore include tighter integration with `{keras}`, h2o, or Julia's OnlineStats.jl for model fit purposes. - -Another package for larger-than-RAM glm fitting, `{bigFastlm}`, has been taken off CRAN, it is managed on Github. - -Currently, parallel processing of GLM fit are not possible with {`disk.frame`}. diff --git a/vignettes/ingesting-data.Rmd b/vignettes/ingesting-data.Rmd deleted file mode 100644 index 541d870a..00000000 --- a/vignettes/ingesting-data.Rmd +++ /dev/null @@ -1,174 +0,0 @@ ---- -title: "Ingesting Data" -author: "ZJ" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Ingesting data including CSVs} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r, include = FALSE} -knitr::opts_chunk$set( - collapse = TRUE, - comment = "#>" -) -``` - -# Ingesting Data - -One of the most important tasks to perform before using the `{disk.frame}` package is to make some `disk.frame`s! There are a few functions to help you do that. Before we do that, we set up the `{disk.frame}` as usual - -**Setting up** - -```r -library(disk.frame) - -# set-up disk.frame to use multiple workers -if(interactive()) { - setup_disk.frame() - # highly recommended, however it is pun into interactive() for CRAN because - # change user options are not allowed on CRAN - options(future.globals.maxSize = Inf) -} else { - setup_disk.frame(2) -} - -``` - -## Convert a `data.frame` to `disk.frame` -Firstly, there is `as.disk.frame()` which allows you to make a `disk.frame` from a `data.frame`, e.g. - -```r -flights.df = as.disk.frame(nycflights13::flights) -``` - -will convert the `nycflights13::flights` `data.frame` to a `disk.frame` somewhere in `tempdir()`. 
To find out the location of the `disk.frame` use: - -```r -attr(flights.df, "path") -``` - -You can also specify a location to output the `disk.frame` to using `outdir` - -```r -flights.df = as.disk.frame(nycflights13::flights, outdir = "some/path.df") -``` - -it is recommended that you use `.df` as the extension for a `disk.frame`, however this is not an enforced requirement. - -However, one of the reasons for `disk.frame` to exist is to handle larger-than-RAM files, hence `as.disk.frame` is not all that useful because it can only convert data that can fit into RAM. `disk.frame` comes with a couple more ways to create `disk.frame`. - -## Creating `disk.frame` from CSVs -The function `csv_to_disk.frame` can convert CSV files to `disk.frame`. The most basic usage is - -```r -some.df = csv_to_disk.frame("some/path.csv", outdir = "some.df") -``` - -this will convert the CSV file `"some/path.csv"` to a `disk.frame`. - -## Multiple CSV files - -However, sometimes we have multiple CSV files that you want to read in and row-bind into one large `disk.frame`. You can do so by supplying a vector of file paths e.g. from the result of `list.files` - -```r -some.df = csv_to_disk.frame(c("some/path/file1.csv", "some/path/file2.csv")) - -# or -some.df = csv_to_disk.frame(list.files("some/path")) -``` - -## Ingesting CSV files chunk-wise -The `csv_to_disk.frame(path, ...)` function reads the file located at `path` in full into RAM but sometimes the CSV file may be too large to read in one go, as that would require loading the whole file into RAM. In that case, you can read the files chunk-by-chunk by using the `in_chunk_size` argument which controls how many rows you read in per chunk - -```r -# to read in 1 million (=1e6) rows per chunk -csv_to_disk.frame(path, in_chunk_size = 1e6) -``` - -When `in_chunk_size` is specified, the input file is split into many smaller files using `bigreadr`'s split file functions. 
This is generally the fastest way to ingest large CSVs, as the split files can be processed in parallel using all CPU cores. But the disk space requirement is doubled because the split files are as large as the original file. If you run out of disk space, then you must clean R's temporary folder at `tempdir()` and choose another `chunk_reader` e.g. `csv_to_disk.frame(..., chunk_reader = "LaF")`. - -## Sharding -One of the most important aspects of `disk.frame` is sharding. One can shard a `disk.frame` at read time by using the `shardby` - -```r -csv_to_disk.frame(path, shardby = "id") -``` - -In the above case, all rows with the same `id` values will end up in the same chunk. - - -## Just-in-time transformation -Sometimes, one may wish to perform some transformation on the CSV before writing out to disk. One can use the `inmapfn` argument to do that. The `inmapfn` name comes from INput MAPping FuNction. The general usage pattern is as follows: - -```r -csv_to_disk.frame(file.path(tempdir(), "df.csv"), inmapfn = function(chunk) { - some_transformation(chunk) -}) -``` - -As a contrived example, suppose you wish to convert a string into date at read time: - -```r -df = data.frame(date_str = c("2019-01-02", "2019-01-02")) - -# write the data.frame -write.csv(df, file.path(tempdir(), "df.csv")) - - -# this would show that date_str is a string -str(collect(csv_to_disk.frame(file.path(tempdir(), "df.csv")))$date_str) -## chr [1:2] "2019-01-02" "2019-01-02" - -# this would show that date_str is a string -df = csv_to_disk.frame(file.path(tempdir(), "df.csv"), inmapfn = function(chunk) { - # convert to date_str to date format and store as "date" - chunk[, date := as.Date(date_str, "%Y-%m-%d")] - chunk[, date_str:=NULL] -}) - -str(collect(df)$date) -## Date[1:2], format: "2019-01-02" "2019-01-02" -``` - -## Reading CSVs from zip files -Often, CSV comes zipped in a zip files. 
You can use the `zip_to_disk.frame` to convert all CSVs within a zip file - -```r -zip_to_disk.frame(path_to_zip_file) -``` - -The arguments for `zip_to_disk.frame` are the same as `csv_to_disk.frame`'s. - - -## Using `add_chunk` - -What if the method of converting to a `disk.frame` isn't implemented in `disk.frame` yet? One can use some lower level constructs provided by `disk.frame` to create `disk.frame`s. For example, the `add_chunk` function can be used to add more chunks to a `disk.frame`, e.g. - -```r -a.df = disk.frame() # create an empty disk.frame -add_chunk(a.df, cars) # adds cars as chunk 1 -add_chunk(a.df, cars) # adds cars as chunk 2 -``` - -Another example of using `add_chunk` is via `readr`'s chunked read functions to create a delimited file reader - -```r -delimited_to_disk.frame <- function(file, outdir, ...) { - res.df = disk.frame(outdir, ...) - readr::read_delim_chunked(file, callback = function(chunk) { - add_chunk(res.df, chunk) - }, ...) - - res.df -} - -delimited_to_disk.frame(path, outdir = "some.df") -``` - -The above code uses `readr`'s `read_delim_chunked` function to read `file` and call `add_chunk`. The problem with this approach is that it is sequential in nature and hence is not able to take advantage of parallelism. - -## Exploiting the structure of a disk.frame - -Of course, a `disk.frame` is just a folder with many `fst` files named as `1.fst`, `2.fst` etc. So one can simply create these `fst` files and ensure they have the same variable names and put them in a folder. 
\ No newline at end of file diff --git a/vignettes/intro-disk-frame.Rmd b/vignettes/intro-disk-frame.Rmd deleted file mode 100644 index c3d364fb..00000000 --- a/vignettes/intro-disk-frame.Rmd +++ /dev/null @@ -1,378 +0,0 @@ ---- -title: "Quick Start: Basic Operations with nycflights13" -author: "ZJ" -output: rmarkdown::html_vignette -vignette: > - %\VignetteIndexEntry{Quick Start} - %\VignetteEngine{knitr::rmarkdown} - %\VignetteEncoding{UTF-8} ---- - -```{r setup, include = FALSE} -suppressPackageStartupMessages(library(disk.frame)) -library(fst) -library(magrittr) -library(nycflights13) -library(dplyr) -library(data.table) - -# you need to run this for multi-worker support -# limit to 2 cores if not running interactively; most likely on CRAN -# set-up disk.frame to use multiple workers -if(interactive()) { - setup_disk.frame() - # highly recommended, however it is put inside interactive() for CRAN because - # changing user options is not allowed on CRAN - options(future.globals.maxSize = Inf) -} else { - setup_disk.frame(2) -} - - -knitr::opts_chunk$set( - eval = FALSE, - collapse = TRUE, - comment = "#>", - include = TRUE -) -``` - -# Quick Start - replicating dplyr's tutorial on nycflights13 - -The [`disk.frame` package](https://github.com/xiaodaigh/disk.frame) aims to be the answer to the question: how do I manipulate structured tabular data that doesn't fit into Random Access Memory (RAM)? - -In a nutshell, `disk.frame` makes use of two simple ideas: - -1) split up a larger-than-RAM dataset into chunks and store each chunk in a separate file inside a folder and -2) provide a convenient API to manipulate these chunks - -`disk.frame` performs a similar role to distributed systems such as Apache Spark, Python's Dask, and Julia's JuliaDB.jl for *medium data* which are datasets that are too large for RAM but not quite large enough to qualify as *big data*. 
- -In this tutorial, we introduce `disk.frame`, address some common questions, and replicate the [sparklyr data manipulation tutorial](https://spark.rstudio.com/dplyr/) using `disk.frame` constructs. - -## Installation -Simply run - -```r -install.packages("disk.frame") # when CRAN ready -``` -or - -```r -devtools::install_github("xiaodaigh/disk.frame") -``` - -## Set-up `disk.frame` -`disk.frame` works best if it can process multiple data chunks in parallel. The best way to set-up `disk.frame` so that each CPU core runs a background worker is by using - -```r -setup_disk.frame() - -# this will allow an unlimited amount of data to be passed from worker to worker -options(future.globals.maxSize = Inf) -``` - -The `setup_disk.frame()` function sets up background workers equal to the number of CPU cores available on your machine; please note that, by default, hyper-threaded cores are counted as one not two. - -Alternatively, one may specify the number of workers using `setup_disk.frame(workers = n)`. - -## Basic Data Operations with `disk.frame` - -The `disk.frame` package provides convenient functions to convert `data.frame`s and CSVs to `disk.frame`s. - -### Creating a `disk.frame` from `data.frame` -We convert a `data.frame` to `disk.frame` using the `as.disk.frame` function. - -```{r asdiskframe, cache=TRUE} -library(nycflights13) -library(dplyr) -library(disk.frame) -library(data.table) - -# convert the flights data to a disk.frame and store the disk.frame in the folder -# "tmp_flights.df" and overwrite any content if needed -flights.df <- as.disk.frame( - flights, - outdir = file.path(tempdir(), "tmp_flights.df"), - overwrite = TRUE) -flights.df -``` -You should now see a folder called `tmp_flights.df` with some files in it, namely `1.fst`, `2.fst`... where each `fst` file is one chunk of the `disk.frame`. 
- - -### Creating a `disk.frame` from CSV -```{r} -library(nycflights13) -# write a csv -csv_path = file.path(tempdir(), "tmp_flights.csv") -data.table::fwrite(flights, csv_path) - -# load the csv into a disk.frame -df_path = file.path(tempdir(), "tmp_flights.df") -flights.df <- csv_to_disk.frame( - csv_path, - outdir = df_path, - overwrite = T) - -flights.df -``` - -If the CSV is too large to read in, then we can also use the `in_chunk_size` option to control how many rows to read in at once. For example, to read in the data 100,000 rows at a time: - -```{r} -library(nycflights13) -library(disk.frame) - -# write a csv -csv_path = file.path(tempdir(), "tmp_flights.csv") - -data.table::fwrite(flights, csv_path) - -df_path = file.path(tempdir(), "tmp_flights.df") - -flights.df <- csv_to_disk.frame( - csv_path, - outdir = df_path, - in_chunk_size = 100000) - -flights.df -``` - -`disk.frame` also has a function `zip_to_disk.frame` that can convert every CSV in a zip file to a `disk.frame`. - -### Simple `dplyr` verbs and lazy evaluation -```{r dfselect, dependson='asdiskframe', cache=TRUE} -flights.df1 <- select(flights.df, year:day, arr_delay, dep_delay) -flights.df1 -``` - -```{r dependson='dfselect'} -class(flights.df1) -``` - -The class of `flights.df1` is also a `disk.frame` after the `dplyr::select` transformation. Also, `disk.frame` operations are by default (and where possible) **lazy**, meaning they don't perform the operations right away. Instead, these functions wait until you call `collect`. Exceptions to this rule are the `*_join` operations, which evaluate *eagerly* under certain conditions--see **Joins for disk.frame in-depth** for details. - -For lazily constructed `disk.frame`s (e.g. `flights.df1`), the function `collect` can be used to bring the results from disk into R, e.g. 
-```{r, dependson='dfselect'} -collect(flights.df1) %>% head(2) -``` - -Of course, for larger-than-RAM datasets, one wouldn't call `collect` on the whole `disk.frame` (because why would you need `disk.frame` otherwise). More likely, one would call `collect` on a `filter`ed dataset or one summarized with `group_by`. - -Some examples of other dplyr verbs applied: - -```{r, dependson='asdiskframe'} -filter(flights.df, dep_delay > 1000) %>% collect %>% head(2) -``` - -```{r, dependson='asdiskframe'} -mutate(flights.df, speed = distance / air_time * 60) %>% collect %>% head(2) -``` - -### Examples of NOT fully supported `dplyr` verbs - -The `chunk_arrange` function arranges (sorts) each chunk but not the whole dataset. So use with caution. Similarly, `chunk_summarise` creates summary variables within each chunk and hence also needs to be used with caution. In the **Group-by** section, we demonstrate how to use `summarise` in the `disk.frame` context correctly with `hard_group_by`s. - -```{r, dependson='asdiskframe'} -# this only sorts within each chunk -chunk_arrange(flights.df, dplyr::desc(dep_delay)) %>% collect %>% head(2) -``` - - -```{r, dependson='asdiskframe'} -chunk_summarize(flights.df, mean_dep_delay = mean(dep_delay, na.rm =T)) %>% collect -``` - -### Piping - -One can chain `dplyr` verbs together like with a `data.frame` - -```{r, dependson='asdiskframe'} -c4 <- flights %>% - filter(month == 5, day == 17, carrier %in% c('UA', 'WN', 'AA', 'DL')) %>% - select(carrier, dep_delay, air_time, distance) %>% - mutate(air_time_hours = air_time / 60) %>% - collect %>% - arrange(carrier)# arrange should occur after `collect` - -c4 %>% head -``` - -### List of supported `dplyr` verbs - -```r -select -rename -filter -chunk_arrange # within each chunk -chunk_group_by # within each chunk -chunk_summarize # within each chunk -group_by # limited functions -summarize # limited functions -mutate -transmute -left_join -inner_join -full_join # careful. Performance! 
-semi_join -anti_join -``` - -## Sharding and distribution of chunks - -Like other distributed data manipulation frameworks, `disk.frame` utilizes the *sharding* concept to distribute the data into chunks. For example, "to shard by `cust_id`" means that all rows with the same `cust_id` will be stored in the same chunk. This enables `chunk_group_by` by `cust_id` to produce the same results as non-chunked data. - -The `by` variables that were used to shard the dataset are called the `shardkey`s. The *sharding* is performed by computing a deterministic hash on the shard keys (the `by` variables) for each row. The hash function produces an integer between `1` and `n`, where `n` is the number of chunks. - -## Group-by - -`{disk.frame}` implements the `group_by` operation with some caveats. In the `{disk.frame}` framework, only a subset of functions are supported in `summarize`. However, the user can create more custom `group-by` functions on the fly. - -```{r, dependson='asdiskframe'} -flights.df %>% - group_by(carrier) %>% # notice that hard_group_by needs to be set - summarize(count = n(), mean_dep_delay = mean(dep_delay, na.rm=T)) %>% # mean follows normal R rules - collect %>% - arrange(carrier) -``` - -## Restrict input columns for faster processing - -One can restrict which input columns to load into memory for each chunk; this can significantly increase the speed of data processing. To restrict the input columns, use the `srckeep` function which only accepts column names as a string vector. - -```{r, dependson='asdiskframe'} -flights.df %>% - srckeep(c("carrier","dep_delay")) %>% - group_by(carrier) %>% - summarize(count = n(), mean_dep_delay = mean(dep_delay, na.rm=T)) %>% # mean follows normal R rules - collect -``` - -Input column restriction is one of the most critical efficiencies provided by `disk.frame`. Because the underlying format allows random access to columns (i.e. 
retrieve only the columns used for processing), hence one can drastically reduce the amount of data loaded into RAM for processing by keeping only those columns that are directly used to produce the results. - -## Joins - -`disk.frame` supports many dplyr joins including: - -```r -left_join -inner_join -semi_join -inner_join -full_join # requires hard_group_by on both left and right -``` -In all cases, the left dataset (`x`) must be a `disk.frame`, and the right dataset (`y`) can be either a `disk.frame` or a `data.frame`. If the right dataset is a `disk.frame` and the `shardkey`s are different between the two `disk.frame`s then two expensive `hard` `group_by` operations are performed *eagerly*, one on the left `disk.frame` and one on the right `disk.frame` to perform the joins correctly. - -However, if the right dataset is a `data.frame` then `hard_group_by`s are only performed in the case of `full_join`. - -Note `disk.frame` does not support `right_join`. The user should use `left_join` instead. - -The below joins are performed *lazily* because `airlines.dt` is a `data.table` not a `disk.frame`: - -```{r airlines_dt, dependson='asdiskframe', cache=TRUE} -# make airlines a data.table -airlines.dt <- data.table(airlines) -# flights %>% left_join(airlines, by = "carrier") # -flights.df %>% - left_join(airlines.dt, by ="carrier") %>% - collect %>% - head -``` - -```{r, dependson='airlines_dt'} -flights.df %>% - left_join(airlines.dt, by = c("carrier", "carrier")) %>% - collect %>% - tail -``` - -## Window functions and arbitrary functions - -`{disk.frame}` supports all `data.frame` operations, unlike Spark which can only perform those operations that Spark has implemented. Hence windowing functions like `min_rank` and `rank` are supported out of the box. - -For the following example, we will use the `hard_group_by` which performs a group-by and also reorganises the chunks so that all records with the same `year`, `month`, and `day` end up in the same chunk. 
This is typically not advised, as `hard_group_by` can be slow for large datasets. - -```{r, dependson='asdiskframe'} -# Find the most and least delayed flight each day -bestworst <- flights.df %>% - srckeep(c("year","month","day", "dep_delay")) %>% - hard_group_by(c("year", "month", "day")) %>% - filter(dep_delay == min(dep_delay, na.rm = T) || dep_delay == max(dep_delay, na.rm = T)) %>% - collect - -bestworst %>% head -``` - -Another example: - -```{r, dependson='asdiskframe'} -ranked <- flights.df %>% - srckeep(c("year","month","day", "dep_delay")) %>% - hard_group_by(c("year", "month", "day")) %>% - filter(min_rank(desc(dep_delay)) <= 2 & dep_delay > 0) %>% - collect - -ranked %>% head -``` - -One more example: - -```{r, dependson='asdiskframe'} -# Rank each flight within a daily window -ranked <- flights.df %>% - srckeep(c("year","month","day", "dep_delay")) %>% - chunk_group_by(year, month, day) %>% - select(dep_delay) %>% - mutate(rank = rank(desc(dep_delay))) %>% - collect - -ranked %>% head -``` - - -## Arbitrary by-chunk processing - -One can apply arbitrary transformations to each chunk of the `disk.frame` by using the `delayed` function which evaluates lazily or the `map.disk.frame(lazy = F)` function which evaluates eagerly. For example to return the number of rows in each chunk: - -```{r, dependson='asdiskframe'} -flights.df1 <- delayed(flights.df, ~nrow(.x)) -collect_list(flights.df1) %>% head # returns number of rows for each data.frame in a list -``` -and to do the same with `map.disk.frame`: - -```{r, dependson='asdiskframe'} -map(flights.df, ~nrow(.x), lazy = F) %>% head -``` -The `map` function can also output the results to another disk.frame folder, e.g. 
- -```{r, dependson='asdiskframe'} -# return the first 10 rows of each chunk -flights.df2 <- map(flights.df, ~.x[1:10,], lazy = F, outdir = file.path(tempdir(), "tmp2"), overwrite = T) - -flights.df2 %>% head -``` - -Notice `{disk.frame}` supports the `purrr` syntax for defining a function using `~`. - -## Sampling - -In the `disk.frame` framework, sampling a proportion of rows within each chunk can be performed using `sample_frac`. - -```{r, dependson='asdiskframe'} -flights.df %>% sample_frac(0.01) %>% collect %>% head -``` - -## Writing Data - -One can output a `disk.frame` by using the `write_disk.frame` function. E.g. - -```r -write_disk.frame(flights.df, outdir="out") -``` -this will output a disk.frame to the folder "out" - -```{r cleanup} -fs::dir_delete(file.path(tempdir(), "tmp_flights.df")) -fs::dir_delete(file.path(tempdir(), "tmp2")) -fs::file_delete(file.path(tempdir(), "tmp_flights.csv")) -```