Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

move POINT geometries out of a list column, into a matrix #2059

Open
wants to merge 38 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
38 commits
Select commit Hold shift + click to select a range
ec68f40
first shot at implementing sfc_POINT with matrix
edzer Dec 13, 2022
d9c5de0
pass check with points in matrix attribute
edzer Dec 13, 2022
7210201
speed up st_combine
edzer Dec 13, 2022
b16648e
fix as(x, "Spatial") for points in matrix attr
edzer Dec 14, 2022
1bfb7ea
update st_as_sfc.SpatialPoints; see also #2060
edzer Dec 14, 2022
ea0e62a
Merge branch 'main' into pointx
edzer Dec 19, 2022
d0dab0f
Merge branch 'main' into pointx
edzer Dec 23, 2022
fc83931
merge main
edzer Dec 23, 2022
5275389
Merge branch 'main' into pointx
edzer Jan 6, 2023
54a5835
Merge branch 'main' into pointx
edzer Feb 5, 2023
3401d0d
Merge branch 'main' into pointx
edzer Feb 8, 2023
f30aa65
Merge branch 'main' into pointx
edzer Mar 13, 2023
d81f8ca
remove min/max warnings on empty point sets
edzer Mar 13, 2023
f96e0fa
Merge branch 'main' into pointx
edzer Mar 27, 2023
dcda1fd
Merge branch 'main' into pointx
edzer Apr 11, 2023
4713008
Merge branch 'main' into pointx
edzer Apr 27, 2023
250cc44
Merge branch 'main' into pointx
edzer Jun 14, 2023
c0e56b4
Merge branch 'main' into pointx
edzer Jun 14, 2023
86059e2
Merge branch 'main' into pointx
edzer Jun 27, 2023
e3def06
Merge branch 'pointx' of github.com:r-spatial/sf into pointx
edzer Jun 27, 2023
3f03184
Merge branch 'main' into pointx
edzer Jun 29, 2023
3ec76b8
modifications handling c() and st_distance
edzer Jun 29, 2023
b8dc2b3
address comment from @bart1
edzer Jun 30, 2023
203187d
filter empty point; #2059
edzer Jun 30, 2023
1bcce69
Merge branch 'main' into pointx
edzer Aug 21, 2023
4ecabf0
keep crs in dplyr::filter
edzer Aug 30, 2023
d38b3dc
Merge branch 'main' into pointx
edzer Aug 30, 2023
230cde6
Merge branch 'main' into pointx
edzer Jan 23, 2024
4ce501e
update for this branch
edzer Jan 23, 2024
5126cd6
Fix value replacement for sfc_POINT
Feb 16, 2024
c818629
Merge pull request #2345 from bart1/pointx
edzer Feb 22, 2024
4722081
Merge branch 'main' into pointx
edzer Feb 23, 2024
f687956
ensure vctrs operations work
Feb 28, 2024
b90139f
Merge pull request #2350 from bart1/pointx
edzer Feb 28, 2024
d2800ea
Merge branch 'main' into pointx
edzer Mar 17, 2024
4a40825
Merge branch 'pointx' of github.com:r-spatial/sf into pointx
edzer Mar 17, 2024
7fd0ab1
Merge branch 'main' into pointx
edzer Oct 10, 2024
82fe210
align with main
edzer Oct 10, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions NAMESPACE
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@ S3method("[",sf)
S3method("[",sfc)
S3method("[<-",sf)
S3method("[<-",sfc)
S3method("[[",sfc)
S3method("[[<-",sf)
S3method("st_agr<-",sf)
S3method("st_crs<-",bbox)
Expand Down
5 changes: 5 additions & 0 deletions R/arith.R
Original file line number Diff line number Diff line change
Expand Up @@ -133,6 +133,11 @@ Ops.sfc <- function(e1, e2) {
if (length(e1) == 0) # empty set
return(e1)

if (inherits(e1, "sfc")) # realize
e1 = e1[]
if (inherits(e2, "sfc"))
e2 = e2[]

if (is.numeric(e2) && !is.matrix(e2) && length(e2) <= 2 && .Generic %in% c("+", "-")) {
if (.Generic == "-")
e2 <- -e2
Expand Down
11 changes: 10 additions & 1 deletion R/bbox.R
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,13 @@ bb_wrap = function(bb) {
structure(as.double(bb), names = c("xmin", "ymin", "xmax", "ymax"), class = "bbox")
}

bbox.pointmatrix = function(obj, ...) {
if (nrow(obj) == 0 || all(is.na(obj)))
bb_wrap(rep(NA_real_, 4))
else
bb_wrap(as.vector(t(apply(obj[,1:2,drop=FALSE], 2, range, na.rm = TRUE))))
}

bbox.Set = function(obj, ...) {
sel = !sfc_is_empty(obj)
if (! any(sel))
Expand Down Expand Up @@ -134,7 +141,9 @@ print.bbox = function(x, ...) {
}

compute_bbox = function(obj) {
switch(class(obj)[1],
if (!is.null(pts <- attr(obj, "points")))
bbox.pointmatrix(pts)
else switch(class(obj)[1],
sfc_POINT = bb_wrap(bbox.Set(obj)),
sfc_MULTIPOINT = bb_wrap(bbox.MtrxSet(obj)),
sfc_LINESTRING = bb_wrap(bbox.MtrxSet(obj)),
Expand Down
7 changes: 6 additions & 1 deletion R/bind.R
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,12 @@ rbind.sf = function(..., deparse.level = 1) {
else
NULL
chk_equal_crs(dots)
ret = st_sf(rbind.data.frame(...), crs = st_crs(dots[[1]]), sf_column_name = sf_column)
crs0 = st_crs(dots[[1]])
for (i in seq_along(dots)) {
if (all(sapply(unclass(st_geometry(dots[[i]])), is.null)))
st_geometry(dots[[i]]) = st_geometry(dots[[i]])[] # realize
}
ret = st_sf(do.call(rbind.data.frame, dots), crs = crs0, sf_column_name = sf_column)
st_geometry(ret) = st_sfc(st_geometry(ret)) # might need to reclass to GEOMETRY
bb = do.call(rbind, lapply(dots, st_bbox))
bb = bb_wrap(c(min(bb[,1L], na.rm = TRUE), min(bb[,2L], na.rm = TRUE),
Expand Down
3 changes: 2 additions & 1 deletion R/geom-measures.R
Original file line number Diff line number Diff line change
Expand Up @@ -206,6 +206,7 @@ st_distance = function(x, y, ..., dist_fun, by_element = FALSE,
else
CPL_geos_dist(x, y, which, par)
}
d[is.nan(d)] = NA_real_
if (!is.null(u <- st_crs(x)$ud_unit))
units(d) = u
d
Expand Down Expand Up @@ -254,7 +255,7 @@ st_line_project = function(line, point, normalized = FALSE) {
is.logical(normalized), length(normalized) == 1,
st_crs(line) == st_crs(point))
line = st_cast(line, "LINESTRING")
point = st_cast(point, "POINT")
point = st_cast(point[], "POINT")
if (isTRUE(st_is_longlat(line)))
message_longlat("st_project_point")
recycled = recycle_common(list(line, point))
Expand Down
12 changes: 9 additions & 3 deletions R/geom-transformers.R
Original file line number Diff line number Diff line change
Expand Up @@ -473,7 +473,7 @@ st_minimum_rotated_rectangle.sf = function(x, dTolerance, ...) {
#' n = 100
#' pts = st_as_sf(data.frame(matrix(runif(n), , 2), id = 1:(n/2)), coords = c("X1", "X2"))
#' # compute Voronoi polygons:
#' pols = st_collection_extract(st_voronoi(do.call(c, st_geometry(pts))))
#' pols = st_collection_extract(st_voronoi(st_combine(pts)))
#' # match them to points:
#' pts$pols = pols[unlist(st_intersects(pts, pols))]
#' plot(pts["id"], pch = 16) # ID is color
Expand Down Expand Up @@ -744,8 +744,14 @@ st_segmentize.sf = function(x, dfMaxLength, ...) {
#' @examples
#' nc = st_read(system.file("shape/nc.shp", package="sf"))
#' st_combine(nc)
st_combine = function(x)
st_sfc(do.call(c, st_geometry(x)), crs = st_crs(x)) # flatten/merge
st_combine = function(x) {
x = st_geometry(x)
if (inherits(x, "sfc_POINT") && !is.null(pts <- attr(x, "points"))) {
mp = structure(list(st_multipoint(pts, attr(x, "point_dim"))), bbox = st_bbox(x))
st_sfc(mp, crs = st_crs(x))
} else
st_sfc(do.call(c, x), crs = st_crs(x)) # flatten/merge
}

# x: object of class sf
# y: object of class sf or sfc
Expand Down
8 changes: 7 additions & 1 deletion R/m_range.R
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,10 @@ mb_wrap = function(mb) {
structure(mb, names = c("mmin", "mmax"), class = "m_range")
}

m_range.pointmatrix = function(obj, ...) {
mb_wrap(range(obj[,ncol(obj)]))
}

m_range.Set = function(obj, ...) {
sel = vapply(obj, function(x) { length(x) && !all(is.na(x)) }, TRUE)
if (! any(sel))
Expand Down Expand Up @@ -130,7 +134,9 @@ print.m_range = function(x, ...) {
}

compute_m_range = function(obj) {
switch(class(obj)[1],
if (!is.null(pts <- attr(obj, "points")))
m_range.pointmatrix(pts)
else switch(class(obj)[1],
sfc_POINT = mb_wrap(m_range.Set(obj)),
sfc_MULTIPOINT = mb_wrap(m_range.MtrxSet(obj)),
sfc_LINESTRING = mb_wrap(m_range.MtrxSet(obj)),
Expand Down
3 changes: 2 additions & 1 deletion R/plot.R
Original file line number Diff line number Diff line change
Expand Up @@ -345,7 +345,8 @@ plot.sfc_POINT = function(x, y, ..., pch = 1, cex = 1, col = 1, bg = 0, lwd = 1,
col = rep(col, length.out = npts)
bg = rep(bg, length.out = npts)
cex = rep(cex, length.out = npts)
mat = t(matrix(unlist(x, use.names = FALSE), ncol = length(x))) #933
#mat = t(matrix(unlist(x, use.names = FALSE), ncol = length(x))) #933
mat = st_coordinates(x)
if (!is.null(mat)) {
ne = !is.na(rowMeans(mat)) ## faster than apply; #933
points(mat[ne,, drop = FALSE], pch = pch[ne], col = col[ne], bg = bg[ne],
Expand Down
34 changes: 21 additions & 13 deletions R/sf.R
Original file line number Diff line number Diff line change
Expand Up @@ -46,24 +46,31 @@ st_as_sf.data.frame = function(x, ..., agr = NA_agr_, coords, wkt,
else
x$geometry = st_as_sfc(as.character(x[[wkt]]))
} else if (! missing(coords)) {
cc = as.data.frame(lapply(x[coords], as.numeric))
if (na.fail && anyNA(cc))
stop("missing values in coordinates not allowed")
# classdim = getClassDim(rep(0, length(coords)), length(coords), dim, "POINT")
if (length(coords) == 1) {
stopifnot(is.matrix(x[[coords]]), is.numeric(x[[coords]]))
cc = x[[coords]]
} else {
if (length(coords) == 2)
dim = "XY"
stopifnot(length(coords) == nchar(dim), dim %in% c("XY", "XYZ", "XYZM", "XYM"))
cc = do.call(cbind, lapply(x[coords], as.numeric))
if (na.fail && anyNA(cc))
stop("missing values in coordinates not allowed")
}
dimnames(cc) = NULL
if (is.null(sf_column_name))
sf_column_name = "geometry"

x[[sf_column_name]] = if (nchar(dim) < 4 && ncol(cc) == 4) { # create POLYGONs:
fn = function(x) st_as_sfc(st_bbox(c(xmin = x[[1]], ymin = x[[2]], xmax = x[[3]], ymax = x[[4]])))
do.call(c, apply(as.matrix(cc), 1, fn))
} else { # points:
structure( points_rcpp(as.matrix(cc), dim),
structure(vector("list", length = nrow(cc)),
points = cc,
points_dim = dim,
n_empty = 0L, precision = 0, crs = NA_crs_,
bbox = structure(
c(xmin = min(cc[[1]], na.rm = TRUE),
ymin = min(cc[[2]], na.rm = TRUE),
xmax = max(cc[[1]], na.rm = TRUE),
ymax = max(cc[[2]], na.rm = TRUE)), class = "bbox"),
class = c("sfc_POINT", "sfc" ), names = NULL)
bbox = bbox.pointmatrix(cc),
class = c("sfc_POINT", "sfc"), names = NULL)
}

if (remove) {
Expand Down Expand Up @@ -430,9 +437,10 @@ print.sf = function(x, ..., n = getOption("sf_max_print", default = 10)) {
app = paste0(app, "\n", "Active geometry column: ", attr(x, "sf_column"))
print(st_geometry(x), n = 0, what = "Simple feature collection with", append = app)
if (n > 0) {
if (inherits(x, c("tbl_df", "tbl")))
if (inherits(x, c("tbl_df", "tbl"))) {
st_geometry(x) = x[[attr(x, "sf_column")]][] # note the extra []: this reloads points
NextMethod()
else {
} else {
y <- x
if (nrow(y) > n) {
cat(paste("First", n, "features:\n"))
Expand Down
103 changes: 87 additions & 16 deletions R/sfc.R
Original file line number Diff line number Diff line change
Expand Up @@ -54,14 +54,24 @@ st_sfc = function(..., crs = NA_crs_, precision = 0.0, check_ring_dir = FALSE, d
lst = lst[[1]]
stopifnot(is.numeric(crs) || is.character(crs) || inherits(crs, "crs"))

points_in_attr <- !is.null(attr(lst, "points"))

# check for NULLs:
a = attributes(lst)
is_null = sfc_is_null(lst)
is_null = if (points_in_attr)
rep(FALSE, length(lst))
else
sfc_is_null(lst)
lst = unclass(lst)
lst = lst[! is_null]
if (!points_in_attr)
lst = lst[! is_null]

attributes(lst) = a

dims_and_types = sfc_unique_sfg_dims_and_types(lst)
dims_and_types = if (points_in_attr)
list(class_dim = attr(lst, "points_dim"), class_type = "POINT")
else
sfc_unique_sfg_dims_and_types(lst)

cls = if (length(lst) == 0) # empty set: no geometries read
c("sfc_GEOMETRY", "sfc")
Expand Down Expand Up @@ -155,21 +165,46 @@ st_sfc = function(..., crs = NA_crs_, precision = 0.0, check_ring_dir = FALSE, d
#' @details if `x` has a `dim` attribute (i.e. is an `array` or `matrix`) then `op` cannot be used.
#' @export
"[.sfc" = function(x, i, j, ..., op = st_intersects) {
precision = st_precision(x)
crs = st_crs(x)
dim = if (length(x)) class(x[[1]])[1] else "XY"
if (!missing(i) && (inherits(i, c("sf", "sfc", "sfg"))))

if (!missing(i) && (inherits(i, "sf") || inherits(i, "sfc") || inherits(i, "sfg")))
i = lengths(op(x, i, ...)) != 0
if (!is.null(dim(x))) # x is an array with geometries
st_sfc(NextMethod(), crs = crs, precision = precision, dim = dim)
else # x is a list but avoid NextMethod() to allow j, ... to be specified & ignored:
st_sfc(unclass(x)[i], crs = crs, precision = precision, dim = dim)
if (inherits(x, "sfc_POINT") && !is.null(attr(x, "points")))
st_sfc(restore_points(x, i), crs = st_crs(x), precision = st_precision(x),
dim = if(length(x)) class(x[[1]])[1] else "XY")
else {
precision = st_precision(x)
crs = st_crs(x)
dim = if (length(x)) class(x[[1]])[1] else "XY"
if (!is.null(dim(x))) # x is an array with geometries
st_sfc(NextMethod(), crs = crs, precision = precision, dim = dim)
else # x is a list but avoid NextMethod() to allow j, ... to be specified & ignored:
st_sfc(unclass(x)[i], crs = crs, precision = precision, dim = dim)
}
}

#' @export
"[<-.sfc" = function (x, i, j, ..., value) {
if (is.null(value) || inherits(value, "sfg"))
"[<-.sfc" = function (x, i, value) {
if (is.null(value) || inherits(value, "sfg")) {
is_points = inherits(value, "POINT")
value = list(value)
} else
is_points = inherits(value, "sfc_POINT")
if (inherits(x, "sfc_POINT") && !is.null(attr(x, "points"))) {
if (is_points) {
repl = if (!is.null(pts <- attr(value, "points")))
pts
else
do.call(rbind, value)
attr(x, "points")[i, ] = repl
return(structure(x,
n_empty = sum(is.na(attr(x, "points")[,1])),
bbox = bbox.pointmatrix(attr(x, "points"))
)) # RETURNS
} else
x = x[] # realize
}
value = value[] # realize in case sfc_POINT while x is not
x = unclass(x) # becomes a list, but keeps attributes
ret = st_sfc(NextMethod(), recompute_bbox = TRUE)
structure(ret, n_empty = sum(sfc_is_empty(ret)))
}
Expand All @@ -188,8 +223,17 @@ c.sfc = function(..., recursive = FALSE) {
else
c(ucls, "sfc")

points_attr = sapply(lst, function(x) !is.null(attr(x, "points")))
if (any(points_attr) && !all(points_attr)) {
for (i in seq_along(lst))
lst[[i]] = lst[[i]][] # realize
points_attr = FALSE
}

ret = unlist(lapply(lst, unclass), recursive = FALSE)
attributes(ret) = attributes(lst[[1]]) # crs
if (all(points_attr))
attr(ret, "points") = do.call(rbind, lapply(lst, attr, "points"))
class(ret) = cls
attr(ret, "bbox") = compute_bbox(ret) # dispatch on class
attr(ret, "n_empty") = sum(sapply(lst, attr, which = "n_empty"))
Expand Down Expand Up @@ -518,16 +562,22 @@ st_coordinates.sfc = function(x, ...) {
return(matrix(nrow = 0, ncol = 2))

ret = switch(class(x)[1],
sfc_POINT = matrix(unlist(x, use.names = FALSE), nrow = length(x), byrow = TRUE,
dimnames = NULL),
sfc_POINT = if (is.null(attr(x, "points"))) {
matrix(unlist(x, use.names = FALSE), nrow = length(x), byrow = TRUE, dimnames = NULL)
} else {
attr(x, "points")
},
sfc_MULTIPOINT = ,
sfc_LINESTRING = coord_2(x),
sfc_MULTILINESTRING = ,
sfc_POLYGON = coord_3(x),
sfc_MULTIPOLYGON = coord_4(x),
stop(paste("not implemented for objects of class", class(x)[1]))
)
Dims = class(x[[1]])[1]
Dims = if (!is.null(attr(x, "points_dim")))
attr(x, "points_dim")
else
class(x[[1]])[1]
ncd = nchar(Dims)
colnames(ret)[1:ncd] = vapply(seq_len(ncd), function(i) substr(Dims, i, i), "")
ret
Expand Down Expand Up @@ -663,3 +713,24 @@ st_is_full.sf = function(x, ...) {
st_is_full.bbox = function(x, ...) {
sf_use_s2() && st_is_longlat(x) && all(x == c(-180,-90,180,90))
}

#' @export
`[[.sfc` = function(x, i, j, ..., exaxt = TRUE) {
if (inherits(x, "sfc_POINT") && !is.null(attr(x, "points")))
restore_point(x, i)
else
NextMethod()
}

restore_point = function(x, i = TRUE) {
restore_points(x, i)[[1]]
}

restore_points = function(x, i = TRUE) {
a = attributes(x)
points = a$points[i, , drop=FALSE]
structure(points_rcpp(points, a$points_dim),
n_empty = 0L, precision = a$precision, crs = a$crs,
bbox = bbox.pointmatrix(points), class = a$class,
points = NULL, points_dim = NULL)
}
2 changes: 2 additions & 0 deletions R/sfg.R
Original file line number Diff line number Diff line change
Expand Up @@ -258,6 +258,8 @@ c.sfg = function(..., recursive = FALSE, flatten = TRUE) {
Paste0 = function(lst) lapply(lst, unclass)
Paste1 = function(lst) do.call(c, lapply(lst, unclass))
lst = list(...)
if (length(lst) && is.null(lst[[1]]))
stop("to combine POINTs into MULTIPOINT, use st_combine(), or realize them first using x[]")
if (flatten) {
cls = vapply(lst, function(x) class(x)[2], "")
ucls = unique(cls)
Expand Down
13 changes: 9 additions & 4 deletions R/sp.R
Original file line number Diff line number Diff line change
Expand Up @@ -93,9 +93,10 @@ handle_bbox = function(sfc, sp) {
st_as_sfc.SpatialPoints = function(x, ..., precision = 0.0) {
cc = x@coords
dimnames(cc) = NULL
lst = lapply(seq_len(nrow(cc)), function(x) st_point(cc[x,]))
handle_bbox(do.call(st_sfc, append(lst, list(crs = st_crs(x@proj4string),
precision = precision))), x)
lst = vector("list", length = nrow(cc))
attr(lst, "points") = cc
attr(lst, "points_dim") = "XY"
handle_bbox(structure(st_sfc(lst, crs = st_crs(x@proj4string), precision = precision), n_empty = 0), x)
}

#' @rdname st_as_sfc
Expand Down Expand Up @@ -341,7 +342,11 @@ as_Spatial = function(from, cast = TRUE, IDs = paste0("ID", seq_along(from))) {
sfc2SpatialPoints = function(from, IDs) {
if (!requireNamespace("sp", quietly = TRUE))
stop("package sp required, please install it first")
sp::SpatialPoints(do.call(rbind, from), proj4string = as(st_crs(from), "CRS"))
m = if (!is.null(pts <- attr(from, "points")))
pts
else
do.call(rbind, from)
sp::SpatialPoints(m, proj4string = as(st_crs(from), "CRS"))
}

sfc2SpatialMultiPoints = function(from) {
Expand Down
3 changes: 1 addition & 2 deletions R/tidyverse-vctrs.R
Original file line number Diff line number Diff line change
Expand Up @@ -3,14 +3,13 @@
# time, this declares `sfc` lists as vectors which is necessary
# because vctrs generally treats S3 lists as scalars.
vec_proxy.sfc = function(x, ...) {
x
x[]
}
# This restores `sfc` attributes after manipulation of the proxy
# (e.g. slicing or combination)
vec_restore.sfc = function(x, to, ...) {
# Ensure restoration of `n_empty` by `st_sfc()`
attr(x, "n_empty") = NULL

st_sfc(x, crs = st_crs(to), precision = st_precision(to))
}

Expand Down
Loading
Loading