library(sparklyr)
library(apache.sedona)
# Open a Spark connection; "spark://HOST:PORT" is a placeholder master URL.
sc <- spark_connect(master = "spark://HOST:PORT")

# Run the example only when `sc` is not a "test_connection" object.
if (!inherits(sc, "test_connection")) {
  # Placeholder locations: replace each with the path to your input file.
  input_location <- "/dev/null"
  query_rdd_input_location <- "/dev/null"

  # Comma-delimited input read as a typed RDD of points.
  rdd <- sedona_read_dsv_to_typed_rdd(
    sc,
    location = input_location,
    delimiter = ",",
    type = "point",
    first_spatial_col_index = 1L
  )

  # Shapefile input read as a typed RDD of polygons.
  query_rdd <- sedona_read_shapefile_to_typed_rdd(
    sc,
    location = query_rdd_input_location,
    type = "polygon"
  )

  # Spatial join of the point RDD against the polygon RDD, using the
  # "intersect" join type and the "quadtree" partitioner.
  join_result_rdd <- sedona_spatial_join(
    rdd,
    query_rdd,
    join_type = "intersect",
    partitioner = "quadtree"
  )
}
# Run the code above in your browser using DataLab