Actually rewrite the dsf implementation.

This rewrite improves the core data structure implementation in two ways. Firstly, when merging two equivalence classes, we check their relative sizes, and choose the larger class's canonical element to be the overall root of the new class tree. This minimises the number of overlong paths to the root after the merge. Secondly, we defer path compression until _after_ the two classes are merged, rather than do it beforehand (via using edsf_canonify as a subroutine) and then have to do it wastefully again afterwards. The size-based root selection was what we _used_ to do, and delivers the better asymptotic performance. I reverted it so that Keen could track the min of each equivalence class. But since then I've realised you can have the asymptotic goodness _and_ min-tracking if you store the minima separately from the main data structure. So now Keen does that, and other clients don't have to pay the cost. Similarly, the flip tracking is now a cost that only users of flip dsfs have to pay, because a normal one doesn't store that information at all.
2025-04-20 15:41:30 -07:00 · 2023-04-20 17:13:47 +01:00
parent c5e253a9f9
commit 68d242c587
1 changed files with 261 additions and 117 deletions
--- a/dsf.c
+++ b/dsf.c
@ -5,157 +5,301 @@
 */
 #include <assert.h>
 #include <limits.h>
 #include <string.h>
 #include "puzzles.h"
 #define DSF_INDEX_MASK (UINT_MAX >> 1)
 #define DSF_FLAG_CANONICAL (UINT_MAX & ~(UINT_MAX >> 1))
 #define DSF_MAX (DSF_INDEX_MASK + 1)
 struct DSF {
-    int size;
+    /*
-    int *p;
+     * Size of the dsf.
     */
    size_t size;
    /*
     * Main array storing the data structure.
     *
     * If n is the canonical element of an equivalence class,
     * parent_or_size[n] holds the number of elements in that class,
     * bitwise-ORed with DSF_FLAG_CANONICAL.
     *
     * If n is not the canonical element, parent_or_size[n] holds the
     * index of another element nearer to the root of the tree for
     * that class.
     */
    unsigned *parent_or_size;
    /*
     * Extra storage for flip tracking.
     *
     * If n is not a canonical element, flip[n] indicates whether the
     * sense of this element is flipped relative to parent_or_size[n].
     *
     * If n is a canonical element, flip[n] is unused.
     */
    unsigned char *flip;
    /*
     * Extra storage for minimal-element tracking.
     *
     * If n is a canonical element, min[n] holds the index of the
     * smallest value in n's equivalence class.
     *
     * If n is not a canonical element, min[n] is unused.
     */
    unsigned *min;
 };
 static DSF *dsf_new_internal(int size, bool flip, bool min)
 {
    DSF *dsf;
    assert(0 < size && size <= DSF_MAX && "Bad dsf size");
    dsf = snew(DSF);
    dsf->size = size;
    dsf->parent_or_size = snewn(size, unsigned);
    dsf->flip = flip ? snewn(size, unsigned char) : NULL;
    dsf->min = min ? snewn(size, unsigned) : NULL;
    dsf_reinit(dsf);
    return dsf;
 }
 DSF *dsf_new(int size)
 {
    return dsf_new_internal(size, false, false);
 }
 DSF *dsf_new_flip(int size)
 {
    return dsf_new_internal(size, true, false);
 }
 DSF *dsf_new_min(int size)
 {
    return dsf_new_internal(size, false, true);
 }
 void dsf_reinit(DSF *dsf)
 {
-    int i;
+    size_t i;
    /* Every element starts as the root of an equivalence class of size 1 */
    for (i = 0; i < dsf->size; i++)
-        dsf->p[i] = 6;
+        dsf->parent_or_size[i] = DSF_FLAG_CANONICAL | 1;
-    /* Bottom bit of each element of this array stores whether that
+
-     * element is opposite to its parent, which starts off as
+    /* If we're tracking minima then every element is also its own min */
-     * false. Second bit of each element stores whether that element
+    if (dsf->min)
-     * is the root of its tree or not.  If it's not the root, the
+        for (i = 0; i < dsf->size; i++)
-     * remaining 30 bits are the parent, otherwise the remaining 30
+            dsf->min[i] = i;
-     * bits are the number of elements in the tree.  */
+
    /* No need to initialise dsf->flip, even if it exists, because
     * only the entries for non-root elements are meaningful, and
     * currently there are none. */
 }
 void dsf_copy(DSF *to, DSF *from)
 {
    assert(to->size == from->size && "Mismatch in dsf_copy");
-    memcpy(to->p, from->p, to->size * sizeof(int));
+    memcpy(to->parent_or_size, from->parent_or_size,
           to->size * sizeof(*to->parent_or_size));
    if (to->flip) {
        assert(from->flip && "Copying a non-flip dsf to a flip one");
        memcpy(to->flip, from->flip, to->size * sizeof(*to->flip));
    }
    if (to->min) {
        assert(from->min && "Copying a non-min dsf to a min one");
        memcpy(to->min, from->min, to->size * sizeof(*to->min));
    }
 }
 DSF *dsf_new(int size)
 {
    DSF *ret = snew(DSF);
    ret->size = size;
    ret->p = snewn(size, int);
    dsf_reinit(ret);
    return ret;
 }
 DSF *dsf_new_min(int size) { return dsf_new(size); }
 DSF *dsf_new_flip(int size) { return dsf_new(size); }
 void dsf_free(DSF *dsf)
 {
    if (dsf) {
-        sfree(dsf->p);
+        sfree(dsf->parent_or_size);
        sfree(dsf->flip);
        sfree(dsf->min);
        sfree(dsf);
    }
 }
-int dsf_canonify(DSF *dsf, int index)
+static inline size_t dsf_find_root(DSF *dsf, size_t n)
 {
-    return dsf_canonify_flip(dsf, index, NULL);
+    while (!(dsf->parent_or_size[n] & DSF_FLAG_CANONICAL))
        n = dsf->parent_or_size[n];
    return n;
 }
-int dsf_minimal(DSF *dsf, int index)
+static inline void dsf_path_compress(DSF *dsf, size_t n, size_t root)
 {
-    return dsf_canonify_flip(dsf, index, NULL);
+    while (!(dsf->parent_or_size[n] & DSF_FLAG_CANONICAL)) {
-}
+        size_t prev = n;
-
+        n = dsf->parent_or_size[n];
-bool dsf_equivalent(DSF *dsf, int i1, int i2)
+        dsf->parent_or_size[prev] = root;
 {
    return dsf_canonify(dsf, i1) == dsf_canonify(dsf, i2);
 }
 void dsf_merge(DSF *dsf, int v1, int v2)
 {
    dsf_merge_flip(dsf, v1, v2, false);
 }
 int dsf_size(DSF *dsf, int index) {
    return dsf->p[dsf_canonify(dsf, index)] >> 2;
 }
 int dsf_canonify_flip(DSF *dsf, int index, bool *inverse_return)
 {
    int start_index = index, canonical_index;
    bool inverse = false;
    assert(0 <= index && index < dsf->size && "Overrun in edsf_canonify");
    /* Find the index of the canonical element of the 'equivalence class' of
     * which start_index is a member, and figure out whether start_index is the
     * same as or inverse to that. */
    while ((dsf->p[index] & 2) == 0) {
        inverse ^= (dsf->p[index] & 1);
 	index = dsf->p[index] >> 2;
    }
-    canonical_index = index;
+    assert(n == root);
 }
-    if (inverse_return)
+int dsf_canonify(DSF *dsf, int n)
-        *inverse_return = inverse;
+{
    size_t root;
-    /* Update every member of this 'equivalence class' to point directly at the
+    assert(0 <= n && n < dsf->size && "Overrun in dsf_canonify");
-     * canonical member. */
+
-    index = start_index;
+    root = dsf_find_root(dsf, n);
-    while (index != canonical_index) {
+    dsf_path_compress(dsf, n, root);
-	int nextindex = dsf->p[index] >> 2;
+    return root;
-        bool nextinverse = inverse ^ (dsf->p[index] & 1);
+}
-	dsf->p[index] = (canonical_index << 2) | inverse;
+
-        inverse = nextinverse;
+void dsf_merge(DSF *dsf, int n1, int n2)
-	index = nextindex;
+{
    size_t r1, r2, s1, s2, root;
    assert(0 <= n1 && n1 < dsf->size && "Overrun in dsf_merge");
    assert(0 <= n2 && n2 < dsf->size && "Overrun in dsf_merge");
    assert(!dsf->flip && "dsf_merge on a flip dsf");
    /* Find the root elements */
    r1 = dsf_find_root(dsf, n1);
    r2 = dsf_find_root(dsf, n2);
    if (r1 == r2) {
        /* Classes are already the same, so we have a common root */
        root = r1;
    } else {
        /* Classes must be merged */
        /* Decide which one to use as the overall root, based on size */
        s1 = dsf->parent_or_size[r1] & DSF_INDEX_MASK;
        s2 = dsf->parent_or_size[r2] & DSF_INDEX_MASK;
        if (s1 > s2) {
            dsf->parent_or_size[r2] = root = r1;
        } else {
            dsf->parent_or_size[r1] = root = r2;
        }
        dsf->parent_or_size[root] = (s1 + s2) | DSF_FLAG_CANONICAL;
        if (dsf->min) {
            /* Update the min of the merged class */
            unsigned m1 = dsf->min[r1], m2 = dsf->min[r2];
            dsf->min[root] = m1 < m2 ? m1 : m2;
        }
    }
-    assert(!inverse);
+    /* Path-compress both paths from n1 and n2 so they point at the new root */
-
+    dsf_path_compress(dsf, n1, root);
-    return index;
+    dsf_path_compress(dsf, n2, root);
 }
-void dsf_merge_flip(DSF *dsf, int v1, int v2, bool inverse)
+bool dsf_equivalent(DSF *dsf, int n1, int n2)
 {
-    bool i1, i2;
+    return dsf_canonify(dsf, n1) == dsf_canonify(dsf, n2);
-
+}
-    assert(0 <= v1 && v1 < dsf->size && "Overrun in edsf_merge");
+
-    assert(0 <= v2 && v2 < dsf->size && "Overrun in edsf_merge");
+int dsf_size(DSF *dsf, int n)
-
+{
-    v1 = dsf_canonify_flip(dsf, v1, &i1);
+    size_t root = dsf_canonify(dsf, n);
-    assert(dsf->p[v1] & 2);
+    return dsf->parent_or_size[root] & DSF_INDEX_MASK;
-    inverse ^= i1;
+}
-    v2 = dsf_canonify_flip(dsf, v2, &i2);
+
-    assert(dsf->p[v2] & 2);
+static inline size_t dsf_find_root_flip(DSF *dsf, size_t n, unsigned *flip)
-    inverse ^= i2;
+{
-
+    *flip = 0;
-    if (v1 == v2)
+    while (!(dsf->parent_or_size[n] & DSF_FLAG_CANONICAL)) {
-        assert(!inverse);
+        *flip ^= dsf->flip[n];
-    else {
+        n = dsf->parent_or_size[n];
-	/*
+    }
-	 * We always make the smaller of v1 and v2 the new canonical
+    return n;
-	 * element. This ensures that the canonical element of any
+}
-	 * class in this structure is always the first element in
+
-	 * it. 'Keen' depends critically on this property.
+static inline void dsf_path_compress_flip(DSF *dsf, size_t n, size_t root,
-	 *
+                                          unsigned flip)
-	 * (Jonas Koelker previously had this code choosing which
+{
-	 * way round to connect the trees by examining the sizes of
+    while (!(dsf->parent_or_size[n] & DSF_FLAG_CANONICAL)) {
-	 * the classes being merged, so that the root of the
+        size_t prev = n;
-	 * larger-sized class became the new root. This gives better
+        unsigned flip_prev = flip;
-	 * asymptotic performance, but I've changed it to do it this
+        n = dsf->parent_or_size[n];
-	 * way because I like having a deterministic canonical
+        flip ^= dsf->flip[prev];
-	 * element.)
+        dsf->flip[prev] = flip_prev;
-	 */
+        dsf->parent_or_size[prev] = root;
-	if (v1 > v2) {
+    }
-	    int v3 = v1;
+    assert(n == root);
-	    v1 = v2;
+}
-	    v2 = v3;
+
-	}
+int dsf_canonify_flip(DSF *dsf, int n, bool *inverse)
-	dsf->p[v1] += (dsf->p[v2] >> 2) << 2;
+{
-	dsf->p[v2] = (v1 << 2) | inverse;
+    size_t root;
-    }
+    unsigned flip;
-    
+
-    v2 = dsf_canonify_flip(dsf, v2, &i2);
+    assert(0 <= n && n < dsf->size && "Overrun in dsf_canonify_flip");
-    assert(v2 == v1);
+    assert(dsf->flip && "dsf_canonify_flip on a non-flip dsf");
-    assert(i2 == inverse);
+
    root = dsf_find_root_flip(dsf, n, &flip);
    dsf_path_compress_flip(dsf, n, root, flip);
    *inverse = flip;
    return root;
 }
 void dsf_merge_flip(DSF *dsf, int n1, int n2, bool inverse)
 {
    size_t r1, r2, s1, s2, root;
    unsigned f1, f2;
    assert(0 <= n1 && n1 < dsf->size && "Overrun in dsf_merge_flip");
    assert(0 <= n2 && n2 < dsf->size && "Overrun in dsf_merge_flip");
    assert(dsf->flip && "dsf_merge_flip on a non-flip dsf");
    /* Find the root elements */
    r1 = dsf_find_root_flip(dsf, n1, &f1);
    r2 = dsf_find_root_flip(dsf, n2, &f2);
    if (r1 == r2) {
        /* Classes are already the same, so we have a common root */
        assert((f1 ^ f2 ^ inverse) == 0 && "Inconsistency in dsf_merge_flip");
        root = r1;
    } else {
        /* Classes must be merged */
        /* Decide which one to use as the overall root, based on size */
        s1 = dsf->parent_or_size[r1] & DSF_INDEX_MASK;
        s2 = dsf->parent_or_size[r2] & DSF_INDEX_MASK;
        if (s1 > s2) {
            dsf->parent_or_size[r2] = root = r1;
            dsf->flip[r2] = f1 ^ f2 ^ inverse;
            f2 ^= dsf->flip[r2];
        } else {
            root = r2;
            dsf->parent_or_size[r1] = root = r2;
            dsf->flip[r1] = f1 ^ f2 ^ inverse;
            f1 ^= dsf->flip[r1];
        }
        dsf->parent_or_size[root] = (s1 + s2) | DSF_FLAG_CANONICAL;
        if (dsf->min) {
            /* Update the min of the merged class */
            unsigned m1 = dsf->min[r1], m2 = dsf->min[r2];
            dsf->min[root] = m1 < m2 ? m1 : m2;
        }
    }
    /* Path-compress both paths from n1 and n2 so they point at the new root */
    dsf_path_compress_flip(dsf, n1, root, f1);
    dsf_path_compress_flip(dsf, n2, root, f2);
 }
 int dsf_minimal(DSF *dsf, int n)
 {
    size_t root;
    assert(dsf->min && "dsf_minimal on a non-min dsf");
    root = dsf_canonify(dsf, n);
    return dsf->min[root];
 }