# NOT RUN {
# Example: load the sample WARC file bundled with the sparkwarc package
# through a Spark connection, then close the connection.
library(sparklyr)

# "spark://HOST:PORT" is a placeholder; substitute a reachable Spark master.
sc <- spark_connect(master = "spark://HOST:PORT")

# spark_read_warc() is namespace-qualified because only sparklyr is attached
# above; an unqualified call fails when sparkwarc has not been loaded.
# NOTE(review): arguments after `sc` are passed positionally -- confirm the
# expected order (e.g. whether a table name precedes the path) against the
# installed sparkwarc version.
df <- sparkwarc::spark_read_warc(
  sc,
  system.file("samples/sample.warc", package = "sparkwarc"),
  repartition = FALSE,
  memory = FALSE,
  overwrite = FALSE
)

# Release the Spark connection once the read has been issued.
spark_disconnect(sc)
# }
# Run the code above in your browser using DataCamp Workspace