Zhu-Takaoka Two-dimensional Pattern Matching

Two-dimensional pattern matching.

Details may be added later....

 

More details can be found in "Pattern Matching and Text Compression Algorithms" by Maxime Crochemore and Thierry Lecroq.

Let's enjoy the code first:

/*
 * Rolling update of a hash value h: subtract the outgoing element a weighted
 * by d, shift the remainder left by one bit, then add the incoming element b.
 *
 * Relies on a variable named `d` being in scope at the expansion site.
 * Every argument is parenthesized so that expression arguments (e.g. `x + 1`)
 * are not torn apart by operator precedence; each argument is evaluated once.
 */
#define REHASH(a, b, h)    ((((h) - (a) * (d)) << 1) + (b))

/*
 * Build the failure ("next") table used by the KMP-style scan.
 *
 * pattern : the n symbols of the pattern. They are ints because the caller
 *           passes an array of per-column hash values, not characters.
 * n       : number of symbols in pattern.
 * next    : output table; must have room for n + 1 entries, because
 *           next[n] is written on the final iteration.
 *
 * On return next[0] == -1 and, for 1 <= k <= n, next[k] is the length of the
 * longest proper border of pattern[0..k-1].
 */
void getNext(const int *pattern, int n, int next[]){
	int i = 0, j = -1;
	next[i] = j;
	
	while(i < n){
		// Fall back along shorter borders until one can be extended (or none is left).
		while(j >= 0 && pattern[i] != pattern[j])
			j = next[j];
		
		++i; ++j;
		next[i] = j;
	}
}

/*
 * Element-by-element verification of a candidate match.
 *
 * (lastRow, lastCol) is the bottom-right cell of the candidate window inside
 * bigImg; the window is smallRow x smallCol. If every cell of the window
 * equals the corresponding cell of smallImg, the window's top-left coordinate
 * is reported through OUTPUT; otherwise the function returns silently at the
 * first mismatch. bigRow and bigCol are accepted but not used here.
 */
void bitsCompare(BIG_IMAGE bigImg, SMALL_IMAGE smallImg, int bigRow, int bigCol, int smallRow, int smallCol, int lastRow, int lastCol){
	// Top-left corner of the candidate window in the big image.
	int top = lastRow - smallRow + 1;
	int left = lastCol - smallCol + 1;
	int r = 0;
	
	while(r < smallRow){
		int c = 0;
		while(c < smallCol){
			if(bigImg[top + r][left + c] != smallImg[r][c])
				return;
			++c;
		}
		++r;
	}
	
	// Every cell agreed: report where the match starts.
	OUTPUT(top, left);
}

/*
 * KMP-style scan of one row of column hashes.
 *
 * bigImgHashArr   : bigCol hash values being scanned.
 * smallImgHashArr : smallCol hash values forming the pattern.
 * next            : failure table for smallImgHashArr; entries 0..smallCol
 *                   are read, with next[0] expected to be negative so the
 *                   inner loop can terminate on a total mismatch.
 * lastRow         : forwarded to bitsCompare as the bottom row of the window.
 *
 * Whenever smallCol consecutive hashes agree, the candidate ending at column
 * i - 1 is handed to bitsCompare for an exact check, and the scan resumes
 * from next[smallCol] so overlapping occurrences are still found.
 */
void KMP_Inline(BIG_IMAGE bigImg, SMALL_IMAGE smallImg, int bigRow, int bigCol, int smallRow, int smallCol, int bigImgHashArr[], int smallImgHashArr[], int next[], int lastRow){
	int i = 0, j = 0;
	
	while(i < bigCol){
		while(j >= 0 && bigImgHashArr[i] != smallImgHashArr[j])
			j = next[j];
		
		++i; ++j;
		
		// All smallCol hashes matched once j reaches smallCol.
		if(j >= smallCol){
			bitsCompare(bigImg, smallImg, bigRow, bigCol, smallRow, smallCol, lastRow, i-1);
			j = next[smallCol];
		}
		
	}
}

/*
 * Zhu-Takaoka two-dimensional matching: find occurrences of smallImg
 * (smallRow x smallCol) inside bigImg (bigRow x bigCol).
 *
 * Each column of the current smallRow-high band of bigImg is reduced to one
 * hash value; the resulting row of hashes is scanned with KMP_Inline against
 * the row of column hashes of smallImg. The band then slides down one row and
 * every column hash is updated with REHASH.
 *
 * Returns without searching when the pattern is empty, does not fit inside
 * the text, or when a column count exceeds the fixed scratch arrays
 * (BIG_COL / SMALL_COL).
 *
 * NOTE(review): the hashes are plain int and are built with left shifts; once
 * smallRow reaches the bit width of int those shifts overflow, which is
 * undefined for signed types. The rolling update also presumes each cell is
 * 0 or 1 - confirm against the image types.
 */
void ZT_TwoDimMatch(BIG_IMAGE bigImg, SMALL_IMAGE smallImg, int bigRow, int bigCol, int smallRow, int smallCol){
	// next needs one slot more than the pattern length: next[smallCol] is
	// written by getNext and read by KMP_Inline.
	int bigImgHashArr[BIG_COL], smallImgHashArr[SMALL_COL], next[SMALL_COL + 1];
	int lastRow;
	int d;
	
	// Nothing to find, or the pattern cannot fit: avoid reading outside bigImg.
	if(smallRow <= 0 || smallCol <= 0 || smallRow > bigRow || smallCol > bigCol)
		return;
	// The scratch arrays above have fixed capacity.
	if(bigCol > BIG_COL || smallCol > SMALL_COL)
		return;
	
	// Preprocessing
	// Compute first bigImg hash array
	for(int j = 0; j < bigCol; ++j){
		bigImgHashArr[j] = 0;
		for(int i = 0; i < smallRow; ++ i)
			bigImgHashArr[j] = (bigImgHashArr[j] << 1) + bigImg[i][j];
	}
	
	// Compute the smallImg hash array
	for(int j = 0; j < smallCol; ++j){
		smallImgHashArr[j] = 0;
		for(int i = 0; i < smallRow; ++i)
			smallImgHashArr[j] = (smallImgHashArr[j] << 1) + smallImg[i][j];
	}
	
	// Last row of one checking window
	lastRow = smallRow - 1;
	// Weight of the top cell in a column hash: 2^(smallRow - 1). REHASH reads it as `d`.
	d = 1;
	for(int j = 1; j < smallRow; ++j)
		d <<= 1;
	
	getNext(smallImgHashArr, smallCol, next);
	
	// Searching
	while(lastRow < bigRow){
		KMP_Inline(bigImg, smallImg, bigRow, bigCol, smallRow, smallCol, bigImgHashArr, smallImgHashArr, next, lastRow);
		
		// Slide the band down one row: drop its top cell, append the cell below it.
		if(lastRow < bigRow - 1)
			for(int j = 0; j < bigCol; ++j)
				bigImgHashArr[j] = REHASH(bigImg[lastRow - smallRow + 1][j], bigImg[lastRow + 1][j], bigImgHashArr[j]);
		
		++lastRow;
	}
	
}

 

posted @ 2015-03-27 16:44  kid551  阅读(194)  评论(0编辑  收藏  举报