if (FALSE) { # interactive()
  # Nothing inside this guard is evaluated; the trailing note on the guard
  # line records `interactive()` as the condition it stands in for.

  # Example 1: remote Parquet files laid out in hive-style partitions
  # (x=1, x=2). The three file URLs are built in one vectorised paste0() call.
  base_url <- paste0(
    "https://github.com/duckdb/duckdb/raw/main/",
    "data/parquet-testing/hive-partitioning/union_by_name/"
  )
  partition_files <- c("x=1/f1.parquet", "x=1/f2.parquet", "x=2/f2.parquet")
  urls <- paste0(base_url, partition_files)
  open_dataset(urls, unify_schemas = TRUE)

  # Example 2: an S3 bucket served from an independently-hosted (MINIO)
  # endpoint rather than AWS.
  # NOTE(review): the empty access key presumably requests anonymous access;
  # confirm against the open_dataset() documentation.
  efi <- open_dataset(
    "s3://neon4cast-scores/parquet/aquatics",
    s3_access_key_id = "",
    s3_endpoint = "data.ecoforecast.org"
  )

  # Example 3: parser options for a non-standard csv.
  # write.table() separates fields with a single space by default, so the
  # temporary file below is space-delimited dummy data.
  csv_path <- tempfile()
  write.table(mtcars, csv_path, row.names = FALSE)

  # Note the nested quotes: the delimiter value itself carries single quotes
  # inside the R string.
  csv_options <- c(delim = "' '", header = TRUE)
  cars_ds <- open_dataset(
    csv_path,
    format = "csv",
    parser_options = csv_options
  )
}
# Run the code above in your browser using DataLab