c - 提高union-find的效率-6ren

c - 提高union-find的效率

转载作者：塔克拉玛干更新时间：2023-11-03 04:39:52

24

4

我正在尝试优化 union-find(并查集)算法，用于查找图像中的连通分量。我的图像可以是 2D 或 3D 文件，由 0 和 1 组成。我在这个帖子中找到了一个实现: Connected Component Labelling，即用户 Dukering 的回答。

我根据自己的需要调整了该代码。该代码可以正常工作，但执行时间很快就变得过长。我不明白问题出在哪里。

我的代码如下所示。我用来测试它的文件链接在这里:https://utexas.box.com/s/k12m17rg24fw1yh1p21hytxwq5q8959u这是一个 2223x2223 大小的文件(在下面的程序中定义)。

正如原回答者提到的，这只是 union-find 的基本实现，还可以提高效率，但我不知道该如何做。另外，我在 Matlab 中测试了这张图片，Matlab 的速度要快得多。例如，上面链接的图像在我的电脑上需要大约 1.5 分钟，而 Matlab 使用 bwlabel 只需一秒钟。我查看了 bwlabel 使用的算法，它似乎是 union-find 的某种变体，这也是我最初开始这项工作的原因。我如何才能让我的代码运行得同样快？我还应该提到，我希望在更大的图像(大到 1000^3)上运行我的代码，而我当前的版本无法做到这一点。

    #include <time.h>
    #include <stdlib.h>
    #include <stdio.h>

    #define w 2223
    #define h 2223

    /*
     * Write a grid to `filename` as raw binary: first the 3 ints of `dims`,
     * then w*h ints taken from `data`.
     *
     * The stream is opened in binary mode so that platforms which translate
     * line endings in text mode do not corrupt the integer payload.
     * Failures are reported on stderr; the function then returns without
     * touching `data` or `dims`.
     */
    void writeArrayInt(int *data, int dims[], char *filename)
    {
        const size_t count = (size_t)w * h;
        FILE *fp = fopen(filename, "wb");

        if (fp == NULL) {
            perror(filename);
            return;
        }

        /* header (grid dimensions) followed by the data array */
        if (fwrite(dims, sizeof(int), 3, fp) != 3 ||
            fwrite(data, sizeof(int), count, fp) != count) {
            fprintf(stderr, "%s: short write\n", filename);
        }

        /* fclose flushes buffered output, so its result matters for writes */
        if (fclose(fp) != 0) {
            perror(filename);
        }
    }

      /*
       * Read a grid from `filename` (raw binary): 3 ints into `dims`, then
       * w*h ints into `data`.
       *
       * The stream is opened in binary mode so the integer payload is not
       * altered by text-mode translation. If the file cannot be opened or
       * holds fewer items than expected, an error is printed and the program
       * exits, because continuing would process an uninitialised buffer.
       */
      void readArrayInt(int *data, int dims[], char *filename)
      {
          const size_t count = (size_t)w * h;
          FILE *fp = fopen(filename, "rb");

          if (fp == NULL) {
              perror(filename);
              exit(EXIT_FAILURE);
          }

          /* header (grid dimensions) followed by the data array */
          if (fread(dims, sizeof(int), 3, fp) != 3 ||
              fread(data, sizeof(int), count, fp) != count) {
              fprintf(stderr, "%s: file is shorter than expected\n", filename);
              fclose(fp);
              exit(EXIT_FAILURE);
          }

          fclose(fp);
      }

       /*
        * Merge the sets containing `a` and `b`.
        *
        * `component[i]` holds the parent of element i; a root is its own
        * parent. After the call the root of b's set points at the root of
        * a's set (a no-op when both already share a root).
        *
        * While climbing to each root the walk applies path halving: every
        * visited node is re-pointed at its grandparent. This never changes
        * which element is the root, but it keeps the chains short so that
        * repeated unions/finds do not degrade to linear walks.
        */
       void doUnion(int a, int b, int *component)
       {
           while (component[a] != a) {
               component[a] = component[component[a]];
               a = component[a];
           }
           while (component[b] != b) {
               component[b] = component[component[b]];
               b = component[b];
           }
           component[b] = a;
       }

       /*
        * Union pixel (x, y) with its neighbour (x2, y2) when the neighbour
        * lies inside the w-by-h grid and both pixels are non-zero in `input`.
        *
        * Pixels are addressed as x*h + y. The bounds test is done before any
        * array access: a neighbour with a negative or too-large coordinate
        * would otherwise yield an index outside `input`.
        */
       void unionCoords(int x, int y, int x2, int y2, int *component, int *input)
       {
           if (x2 < 0 || x2 >= w || y2 < 0 || y2 >= h) {
               return;
           }

           int ind1 = x*h + y;
           int ind2 = x2*h + y2;
           if (input[ind1] && input[ind2]) {
               doUnion(ind1, ind2, component);
           }
       }

       /*
        * Label the 8-connected components of the binary image stored in
        * "phi_w_bin" and write the label image to "outputImage2d".
        *
        * Every non-zero pixel receives the index of its component's root
        * element as label; zero pixels stay 0.
        * NOTE(review): a component whose root is element 0 is therefore
        * labelled 0 as well, the same value as background - confirm whether
        * consumers of the output need labels shifted by one.
        */
       int main()
       {
           const int total = w*h;
           int dims[3];
           char fname[256];

           int *input = malloc((size_t)total * sizeof *input);
           int *output = malloc((size_t)total * sizeof *output);
           int *component = malloc((size_t)total * sizeof *component);
           if (input == NULL || output == NULL || component == NULL) {
               fprintf(stderr, "out of memory\n");
               free(input);
               free(output);
               free(component);
               return EXIT_FAILURE;
           }

           snprintf(fname, sizeof fname, "phi_w_bin");
           readArrayInt(input, dims, fname);

           /* every element starts as the root of its own singleton set */
           for (int i = 0; i < total; i++) {
               component[i] = i;
           }

           /* neighbour offsets, visited in a fixed order so the resulting
            * roots (and hence the labels) are deterministic */
           static const int offsets[8][2] = {
               { 1,  0}, { 0,  1}, {-1,  0}, { 0, -1},
               { 1,  1}, {-1,  1}, { 1, -1}, {-1, -1}
           };

           for (int x = 0; x < w; x++) {
               for (int y = 0; y < h; y++) {
                   for (int k = 0; k < 8; k++) {
                       unionCoords(x, y, x + offsets[k][0], y + offsets[k][1],
                                   component, input);
                   }
               }
           }

           /* resolve each foreground pixel to the root of its set */
           for (int i = 0; i < total; i++) {
               if (input[i] == 0) {
                   output[i] = 0;
                   continue;
               }
               int root = i;
               while (component[root] != root) {
                   root = component[root];
               }
               output[i] = root;
           }

           snprintf(fname, sizeof fname, "outputImage2d");
           writeArrayInt(output, dims, fname);

           free(input);
           free(output);
           free(component);
           return 0;
       }

最佳答案

我建议对您的 union-find(并查集)结构进行两项改进:

真正实现 union 和 find 这两个操作! 如果您有一个可用的 find 方法，实现 union 会变得简单得多，因为您不再需要 while (component[c] != c) 这类代码行。可参考 Wikipedia 上关于 union-find 数据结构的条目。
实现一些常见的加速启发式方法，如路径压缩(将 find(x) 返回的值存储在 component[x] 中，从而减少再次调用 find(x) 时的开销)和 union-by-rank 或 union-by-size(使较大的集合成为较小集合的父集合)。

编辑:由于似乎需要对另一个答案进行一些澄清，我将自己添加一个最小的实现:

/*
 * Disjoint-set forest over the elements 0 .. size-1.
 *
 * parent[i] < size  : i is a child and parent[i] is the index of its parent.
 * parent[i] >= size : i is a root (make_sets starts every entry at `size`).
 *                     The amount above `size` appears to be intended as the
 *                     root's rank - see do_union.
 */
typedef struct union_find {
    int *parent;   /* one entry per element, encoded as described above */
    int size;      /* number of elements; also the root marker threshold */
} union_find;

union_find make_sets(int size) {
    union_find result;
    result.parent = malloc(sizeof(int) * size);
    result.size = size;
    for (int i = 0; i < size; ++i) {
        result.parent[i] = size;
    }

    return result;
}

/*
 * Return the root of the set containing element i, compressing the path:
 * every element visited on the way up ends up pointing directly at the root.
 *
 * An entry below uf.size is a parent index; anything else marks a root.
 */
int find(union_find uf, int i) {
    /* first pass: locate the root */
    int root = i;
    while (uf.parent[root] < uf.size) {
        root = uf.parent[root];
    }

    /* second pass: re-point each node on the path at the root */
    int node = i;
    while (uf.parent[node] < uf.size) {
        int next = uf.parent[node];
        uf.parent[node] = root;
        node = next;
    }

    return root;
}

/*
 * Merge the sets containing i and j using union by rank.
 *
 * A root r stores uf.size + rank in uf.parent[r] (make_sets starts every
 * root at uf.size, i.e. rank 0), so comparing the stored values of two
 * roots compares their ranks. The decision must be based on those stored
 * values, not on the root indices themselves: comparing indices never
 * reaches the equal-rank case and so never maintains the rank at all.
 */
void do_union(union_find uf, int i, int j) {
    int pi = find(uf, i);
    int pj = find(uf, j);
    if (pi == pj) {
        return;   /* already in the same set */
    }

    int rank_i = uf.parent[pi];
    int rank_j = uf.parent[pj];

    if (rank_i < rank_j) {
        /* hang the lower-rank tree under the higher-rank root */
        uf.parent[pi] = pj;
    } else if (rank_i > rank_j) {
        /* hang the lower-rank tree under the higher-rank root */
        uf.parent[pj] = pi;
    } else {
        /* equal rank: link arbitrarily and increase the new root's rank */
        uf.parent[pj] = pi;
        ++uf.parent[pi];
    }
}

关于c - 提高union-find的效率，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/44877830/

24

4

0

文章推荐： c++ - 理解 vector 乘法

文章推荐： java - 动态添加 JTable 到 JScrollPane

c - 为 union 分配内存以及 union 指针和指针 union 之间的区别
自从我的问题here无法自信地回答，我在这里再次询问，希望有人确切知道: 指向 union 的指针和包含指向其元素的指针的 union 之间有什么区别(除了语法之外)吗？ this中生成的程序集示例是
c - union 内的 union
在 C 语言中，是否可以在另一个 union 体中定义一个 union 体？如果不是，为什么不可能？或者如果可以，可以在哪里使用？最佳答案假设您要定义: union myun { int x;
c - union 中的 union
在 C 中，是否可以在另一个 union 中定义一个 union ？如果不是，为什么不可能？或者如果是，它可以在哪里使用？最佳答案假设你想定义: union myun { int x; s
c - union 内的无名 union
我正在阅读一些代码并发现如下内容: typedef union { int int32; int boolean; time_t date; char *string;
lua - 为什么不能使用Set:union()代替Set.union？
我正在学习Lua，我更愿意使用冒号（:）作为方法。不幸的是，它并非在所有地方都有效。看我的代码：设置= {} 本地mt = {} 函数Set：new（m）本地集= {} setmetatable（
sql - 在同一查询中使用 UNION 和 UNION ALL
我遇到了一些性能问题，我有如下查询: SELECT * FROM Foo UNION SELECT * FROM Boo UNION SELECT * FROM Koo 我确信 Koo 不会返回任何重
c++ - 将C union 转换为C++ union
This question already has answers here: C++ Structure Initialization (16个答案) 上个月关闭。我正在尝试将一些用于嵌入式目标的
sql - UNION 和 UNION ALL 有什么区别？
UNION 和 UNION ALL 有什么区别？最佳答案 UNION 删除重复记录(结果中的所有列都相同)，UNION ALL 则不会。使用 UNION 而不是 UNION ALL 时会影响性能，
sql - Union - 仅删除由 Union 创建的重复项
我想在两个表上使用联合运算符。我希望结果集消除由联合创建的重复值，但不消除表中预先存在的重复值。考虑这段代码... select b from (values (1), (2), (2
Tsql，union 改变结果顺序，union all 不
我知道 UNION 会删除重复项，但即使没有重复项也会更改结果顺序。我有两个 select 语句，任何地方都没有 order by 语句我想将它们合并或不合并(全部) 即 SELECT A UNI
我可以为一个 union 成员分配一个值并从另一个 union 成员那里读取相同的值吗？
基本上，我有一个 struct foo { /* variable denoting active member of union */ enum whichmembe
mysql - 组合多个选择而不使用 Union 或 Union All
我有一个大规模查询，用于对许多表(每个表有数千行)执行 UNION ALL，然后在返回之前输出到临时表。旧形式: SELECT * FROM (SELECT `a` AS `Human rea
sql - UNION 和 UNION ALL 有什么区别？
UNION 和 UNION ALL 有什么区别？最佳答案 UNION 删除重复记录(结果中的所有列都相同)，UNION ALL 则不会。使用 UNION 而不是 UNION ALL 时会影响性能，
c++ - 对象 union 与指针 union
如果我有两个 union 行结构: struct A { A() {} ~A() {} union { vector vi; vector db
关于另一个 union 中 union 字段的编译错误
考虑下面的代码，我已经写了: #include #include union myAccess { uint16_t access16; struct { uint
可以将 union 内的对齐结构强制转换为 union 以访问对齐字段吗？
我想弄清楚你从 C99 中对齐变量的地役权中得到了什么: Exception to strict aliasing rule in C from 6.5.2.3 Structure and union
php - UNION 与 UNION ALL 的性能对比
我正在通过 UNION 或 UNION ALL 从多个表中选择一列外键。当重复无关紧要时，通常建议使用 UNION ALL 而不是 UNION 来解决性能问题。但是，在我的调用 PHP 脚本中，循环
c++ - 为什么 union 静态成员不存储为 union ？
在 C++ 中，union 可以包含静态成员，在类的情况下，这些成员属于一个类，因此对所有对象都是通用的。 union U { long l; int i; static long
c++ - 匿名 union 和普通 union
任何人都可以提及普通和匿名 union (或结构)之间的区别吗？我刚找到一个: 不能在匿名 union 中定义函数。最佳答案您不需要点运算符“.”访问匿名 union 元素。 #include
c - union 成员如何拥有指向 union 实例的指针？
我可能把这个复杂化了.. 我正在尝试在 Arduino 上用 C 语言为嵌入式应用程序制作一个相当可重用的分层菜单系统。我有结构来表示不同类型的菜单项，包括那些子菜单，以及这些菜单项的 union 是

首页

博学

6Ren·AI

商城

c - 提高union-find的效率