From a71793007c6824fd608c9fdbac2b8c79e9093bb3 Mon Sep 17 00:00:00 2001 From: tidwall Date: Sat, 7 Dec 2024 06:00:16 -0700 Subject: [PATCH] Change memory ordering for reference counting This commit changes the way the reference counting behavior, going from add/sub with SEQ_CST/SEQ_CST to add/sub with RELAXED/COMSUME+fence(ACQUIRE). This should make for more efficent clones and frees. This method is inspired by the reference counter implementation in the boost library. https://www.boost.org/doc/libs/1_57_0/doc/html/atomic/usage_examples.html --- tg.c | 35 ++++++++++++++++++++++------------- 1 file changed, 22 insertions(+), 13 deletions(-) diff --git a/tg.c b/tg.c index c40aaf9..27f3788 100644 --- a/tg.c +++ b/tg.c @@ -50,27 +50,36 @@ enum flags { IS_UNLOCATED = 1<<7, // GeoJSON. 'Feature' with 'geometry'=null }; +// Reference counting in TG defaults to zero. This means that a zero value for +// an object with an rc_t field holds a single reference. Only when the rc_t +// falls below zero will the owning object be freed. +// +// rc_add adds a new reference +// rc_sub removes a reference. Returns false if the owning object can be freed. +// // Optionally use non-atomic reference counting when TG_NOATOMICS is defined. #ifdef TG_NOATOMICS typedef int rc_t; -static int rc_sub(rc_t *rc) { +static bool rc_sub(rc_t *rc) { int fetch = *rc; (*rc)--; - return fetch; + return fetch > 0; } -static int rc_add(rc_t *rc) { - int fetch = *rc; +static void rc_add(rc_t *rc) { (*rc)++; - return fetch; } #else #include typedef atomic_int rc_t; -static int rc_sub(rc_t *rc) { - return atomic_fetch_sub(rc, 1); +static bool rc_sub(rc_t *rc) { + if (atomic_fetch_sub_explicit(rc, 1, __ATOMIC_CONSUME) > 0) { + return true; + } + atomic_thread_fence(__ATOMIC_ACQUIRE); + return false; } -static int rc_add(rc_t *rc) { - return atomic_fetch_add(rc, 1); +static void rc_add(rc_t *rc) { + atomic_fetch_add_explicit(rc, 1, __ATOMIC_RELAXED); } #endif @@ -1827,7 +1836,7 @@ struct tg_ring *tg_ring_new_ix(const struct tg_point *points, int npoints, /// @see RingFuncs void tg_ring_free(struct tg_ring *ring) { if (!ring) return; - if (rc_sub(&ring->head.rc) > 0) return; + if (rc_sub(&ring->head.rc)) return; if (ring->ystripes) tg_free(ring->ystripes); tg_free(ring); } @@ -3343,7 +3352,7 @@ void tg_poly_free(struct tg_poly *poly) { tg_ring_free((struct tg_ring*)poly); return; } - if (rc_sub(&poly->head.rc) > 0) return; + if (rc_sub(&poly->head.rc)) return; if (poly->exterior) tg_ring_free(poly->exterior); if (poly->holes) { for (int i = 0; i < poly->nholes; i++) { @@ -3859,7 +3868,7 @@ struct tg_geom *tg_geom_new_point(struct tg_point point) { } static void boxed_point_free(struct boxed_point *point) { - if (rc_sub(&point->head.rc) > 0) return; + if (rc_sub(&point->head.rc)) return; tg_free(point); } @@ -4616,7 +4625,7 @@ struct tg_geom *tg_geom_clone(const struct tg_geom *geom) { } static void geom_free(struct tg_geom *geom) { - if (rc_sub(&geom->head.rc) > 0) return; + if (rc_sub(&geom->head.rc)) return; switch (geom->head.type) { case TG_POINT: break;