Merge function for disk.frames

# S3 method for disk.frame
merge(
  x,
  y,
  by,
  outdir = tempfile(fileext = ".df"),
  ...,
  merge_by_chunk_id = FALSE,
  overwrite = FALSE
)

Arguments

x

a disk.frame

y

a disk.frame or data.frame

by

The name(s) of the key column(s) to merge on

outdir

The output directory for the disk.frame

...

passed to merge and cmap.disk.frame

merge_by_chunk_id

If TRUE, only chunks of x and y that have the same chunk id are merged with each other

overwrite

Whether to overwrite the output directory (outdir)

Examples

b = as.disk.frame(data.frame(a = 51:150, b = 1:100))
d = as.disk.frame(data.frame(a = 151:250, b = 1:100))
bd.df = merge(b, d, by = "b", merge_by_chunk_id = TRUE)

# clean up the disk.frames created in this example
delete(b)
delete(d)
delete(bd.df)