algorithm - Etiquetado de componentes conectados

multidimensional-array area (5)

Hace algunos días hice una pregunta similar, pero aún tengo que encontrar una manera eficiente de resolver mi problema. Estoy desarrollando un juego de consola simple, y tengo una matriz 2D como esta:

1,0,0,0,1 1,1,0,1,1 0,1,0,0,1 1,1,1,1,0 0,0,0,1,0

Estoy tratando de encontrar todas las áreas que constan de 1 adyacente (conectividad de 4 vías). Entonces, en este ejemplo las 2 áreas son las siguientes:

1 1,1 1 1,1,1,1 1

1 1,1 1

El algoritmo, en el que he estado trabajando, encuentra a todos los vecinos de los vecinos de una celda y funciona perfectamente bien en este tipo de matrices. Sin embargo, cuando uso matrices más grandes (como 90 * 90), el programa es muy lento y, a veces, las matrices enormes que se usan causan desbordamientos de pila.

Un tipo en mi otra pregunta me habló sobre el etiquetado de componentes conectados como una solución eficiente para mi problema.

¿Alguien me puede mostrar cualquier código C ++ que use este algoritmo, porque estoy un poco confundido acerca de cómo funciona realmente junto con esta cosa de la estructura de datos de conjunto disjunto ...

Muchas gracias por su ayuda y tiempo.

A continuación encontrará el código de ejemplo para el etiquetado de componentes conectados. El código está escrito en Java.

package addressextraction; public class ConnectedComponentLabelling { int[] dx={+1, 0, -1, 0}; int[] dy={0, +1, 0, -1}; int row_count=0; int col_count=0; int[][] m; int[][] label; public ConnectedComponentLabelling(int row_count,int col_count) { this.row_count=row_count; this.col_count=col_count; m=new int[row_count][col_count]; label=new int[row_count][col_count]; } void dfs(int x, int y, int current_label) { if (x < 0 || x == row_count) return; // out of bounds if (y < 0 || y == col_count) return; // out of bounds if (label[x][y]!=0 || m[x][y]!=1) return; // already labeled or not marked with 1 in m // mark the current cell label[x][y] = current_label; // System.out.println("****************************"); // recursively mark the neighbors int direction = 0; for (direction = 0; direction < 4; ++direction) dfs(x + dx[direction], y + dy[direction], current_label); } void find_components() { int component = 0; for (int i = 0; i < row_count; ++i) for (int j = 0; j < col_count; ++j) if (label[i][j]==0 && m[i][j]==1) dfs(i, j, ++component); } public static void main(String[] args) { ConnectedComponentLabelling l=new ConnectedComponentLabelling(4,4); l.m[0][0]=0; l.m[0][1]=0; l.m[0][2]=0; l.m[0][3]=0; l.m[1][0]=0; l.m[1][1]=1; l.m[1][2]=0; l.m[1][3]=0; l.m[2][0]=0; l.m[2][1]=0; l.m[2][2]=0; l.m[2][3]=0; l.m[3][0]=0; l.m[3][1]=1; l.m[3][2]=0; l.m[3][3]=0; l.find_components(); for (int i = 0; i < 4; i++) { for (int j = 0; j < 4; j++) { System.out.print(l.label[i][j]); } System.out.println(""); } } }

Documento muy útil => https://docs.google.com/file/d/0B8gQ5d6E54ZDM204VFVxMkNtYjg/edit

Aplicación java - código abierto - extraer objetos de la imagen - etiquetado de componentes conectados => https://drive.google.com/file/d/0B8gQ5d6E54ZDTVdsWE1ic2lpaHM/edit?usp=sharing

import java.util.ArrayList; public class cclabeling { int neighbourindex;ArrayList<Integer> Temp; ArrayList<ArrayList<Integer>> cc=new ArrayList<>(); public int[][][] cclabel(boolean[] Main,int w){ /* this method return array of arrays "xycc" each array contains the x,y coordinates of pixels of one connected component – Main => binary array of image – w => width of image */ long start=System.nanoTime(); int len=Main.length;int id=0; int[] dir={-w-1,-w,-w+1,-1,+1,+w-1,+w,+w+1}; for(int i=0;i<len;i+=1){ if(Main[i]){ Temp=new ArrayList<>(); Temp.add(i); for(int x=0;x<Temp.size();x+=1){ id=Temp.get(x); for(int u=0;u<8;u+=1){ neighbourindex=id+dir[u]; if(Main[neighbourindex]){ Temp.add(neighbourindex); Main[neighbourindex]=false; } } Main[id]=false; } cc.add(Temp); } } int[][][] xycc=new int[cc.size()][][]; int x;int y; for(int i=0;i<cc.size();i+=1){ xycc[i]=new int[cc.get(i).size()][2]; for(int v=0;v<cc.get(i).size();v+=1){ y=Math.round(cc.get(i).get(v)/w); x=cc.get(i).get(v)-y*w; xycc[i][v][0]=x; xycc[i][v][1]=y; } } long end=System.nanoTime(); long time=end-start; System.out.println("Connected Component Labeling Time =>"+time/1000000+" milliseconds"); System.out.println("Number Of Shapes => "+xycc.length); return xycc; } }

Esto se puede resolver con la búsqueda de unión (aunque DFS, como se muestra en la otra respuesta, es probablemente un poco más simple).

La idea básica detrás de esta estructura de datos es fusionar repetidamente elementos en el mismo componente. Esto se hace representando cada componente como un árbol (con los nodos manteniendo un seguimiento de su propio padre, en lugar de al revés), puede verificar si hay 2 elementos en el mismo componente atravesando el nodo raíz y puede fusionar los nodos. simplemente haciendo que una raíz sea la principal de la otra raíz.

Un ejemplo de código corto que demuestra esto:

const int w = 5, h = 5; int input[w][h] = {{1,0,0,0,1}, {1,1,0,1,1}, {0,1,0,0,1}, {1,1,1,1,0}, {0,0,0,1,0}}; int component[w*h]; void doUnion(int a, int b) { // get the root component of a and b, and set the one''s parent to the other while (component[a] != a) a = component[a]; while (component[b] != b) b = component[b]; component[b] = a; } void unionCoords(int x, int y, int x2, int y2) { if (y2 < h && x2 < w && input[x][y] && input[x2][y2]) doUnion(x*h + y, x2*h + y2); } int main() { for (int i = 0; i < w*h; i++) component[i] = i; for (int x = 0; x < w; x++) for (int y = 0; y < h; y++) { unionCoords(x, y, x+1, y); unionCoords(x, y, x, y+1); } // print the array for (int x = 0; x < w; x++) { for (int y = 0; y < h; y++) { if (input[x][y] == 0) { cout << '' ''; continue; } int c = x*h + y; while (component[c] != c) c = component[c]; cout << (char)(''a''+c); } cout << "/n"; } }

Demo en vivo .

Lo anterior mostrará cada grupo de unos usando una letra diferente del alfabeto.

p i pp ii p i pppp p

Debería ser fácil modificar esto para obtener los componentes por separado u obtener una lista de los elementos correspondientes a cada componente. Una idea es reemplazar cout << (char)(''a''+c); arriba con componentMap[c].add(Point(x,y)) con componentMap como un map<int, list<Point>> - cada entrada en este mapa corresponderá a un componente y dará una lista de puntos.

Hay varias optimizaciones para mejorar la eficiencia de la búsqueda de sindicatos, lo anterior es solo una implementación básica.

Primero te daré el código y luego te lo explicaré un poco:

// direction vectors const int dx[] = {+1, 0, -1, 0}; const int dy[] = {0, +1, 0, -1}; // matrix dimensions int row_count; int col_count; // the input matrix int m[MAX][MAX]; // the labels, 0 means unlabeled int label[MAX][MAX]; void dfs(int x, int y, int current_label) { if (x < 0 || x == row_count) return; // out of bounds if (y < 0 || y == col_count) return; // out of bounds if (label[x][y] || !m[x][y]) return; // already labeled or not marked with 1 in m // mark the current cell label[x][y] = current_label; // recursively mark the neighbors for (int direction = 0; direction < 4; ++direction) dfs(x + dx[direction], y + dy[direction], current_label); } void find_components() { int component = 0; for (int i = 0; i < row_count; ++i) for (int j = 0; j < col_count; ++j) if (!label[i][j] && m[i][j]) dfs(i, j, ++component); }

Esta es una forma común de resolver este problema.

Los vectores de dirección son solo una buena forma de encontrar las celdas vecinas (en cada una de las cuatro direcciones).

La función dfs realiza una búsqueda en profundidad de la cuadrícula. Eso simplemente significa que visitará todas las celdas accesibles desde la celda inicial. Cada celda se marcará con current_label

La función find_components recorre todas las celdas de la cuadrícula e inicia el etiquetado de un componente si encuentra una celda sin etiqueta (marcada con 1).

Esto también se puede hacer iterativamente usando una pila. Si reemplaza la pila con una cola, obtiene los bfs o la búsqueda en primer lugar .

También puede probar este enfoque de cierre transitivo, sin embargo, el triple bucle para el cierre transitivo ralentiza las cosas cuando hay muchos objetos separados en la imagen, los cambios de código sugeridos son bienvenidos

Aclamaciones

Dave

void CC(unsigned char* pBinImage, unsigned char* pOutImage, int width, int height, int CON8) { int i, j, x, y, k, maxIndX, maxIndY, sum, ct, newLabel=1, count, maxVal=0, sumVal=0, maxEQ=10000; int *eq=NULL, list[4]; int bAdd; memcpy(pOutImage, pBinImage, width*height*sizeof(unsigned char)); unsigned char* equivalences=(unsigned char*) calloc(sizeof(unsigned char), maxEQ*maxEQ); // modify labels this should be done with iterators to modify elements // current column for(j=0; j<height; j++) { // current row for(i=0; i<width; i++) { if(pOutImage[i+j*width]>0) { count=0; // go through blocks list[0]=0; list[1]=0; list[2]=0; list[3]=0; if(j>0) { if((i>0)) { if((pOutImage[(i-1)+(j-1)*width]>0) && (CON8 > 0)) list[count++]=pOutImage[(i-1)+(j-1)*width]; } if(pOutImage[i+(j-1)*width]>0) { for(x=0, bAdd=true; x<count; x++) { if(pOutImage[i+(j-1)*width]==list[x]) bAdd=false; } if(bAdd) list[count++]=pOutImage[i+(j-1)*width]; } if(i<width-1) { if((pOutImage[(i+1)+(j-1)*width]>0) && (CON8 > 0)) { for(x=0, bAdd=true; x<count; x++) { if(pOutImage[(i+1)+(j-1)*width]==list[x]) bAdd=false; } if(bAdd) list[count++]=pOutImage[(i+1)+(j-1)*width]; } } } if(i>0) { if(pOutImage[(i-1)+j*width]>0) { for(x=0, bAdd=true; x<count; x++) { if(pOutImage[(i-1)+j*width]==list[x]) bAdd=false; } if(bAdd) list[count++]=pOutImage[(i-1)+j*width]; } } // has a neighbour label if(count==0) pOutImage[i+j*width]=newLabel++; else { pOutImage[i+j*width]=list[0]; if(count>1) { // store equivalences in table for(x=0; x<count; x++) for(y=0; y<count; y++) equivalences[list[x]+list[y]*maxEQ]=1; } } } } } // floyd-Warshall algorithm - transitive closure - slow though :-( for(i=0; i<newLabel; i++) for(j=0; j<newLabel; j++) { if(equivalences[i+j*maxEQ]>0) { for(k=0; k<newLabel; k++) { equivalences[k+j*maxEQ]= equivalences[k+j*maxEQ] || equivalences[k+i*maxEQ]; } } } eq=(int*) calloc(sizeof(int), newLabel); for(i=0; i<newLabel; i++) for(j=0; j<newLabel; j++) { if(equivalences[i+j*maxEQ]>0) { eq[i]=j; break; } } free(equivalences); // label image with equivalents for(i=0; i<width*height; i++) { if(pOutImage[i]>0&&eq[pOutImage[i]]>0) pOutImage[i]=eq[pOutImage[i]]; } free(eq); }