'Image Recognition/Fundamental' 카테고리의 글 목록 (5 Page)

Statistical Region Merging

Image Recognition/Fundamental 2022. 6. 11. 16:29

Statistical region merging은 이미지의 픽셀을 일정한 기준에 따라 더 큰 영역으로 합병하는 bottom-up 방식의 과정이다. 두 영역 $R_{1}$ 과 $R_{2}$ 가 하나의 영역으로 합병이 되기 위해서는 두 영역의 평균 픽셀 값의 차이가

$g \sqrt{\frac{\ln(2/\delta)}{2Q} \left( \frac{1}{|R_{1}|} + \frac{1}{|R_{2}|} \right)}$

를 넘지 않아야 한다. $g = 256$ 으로 gray 레벨의 개수를 의미하고, $|R_{i}|$ 는 $R_{i}$ 영역에 포함된 픽셀 수를 나타낸다. $\delta$ 는 작은 수로 이미지의 픽셀 수의 제곱에 반비례한다. 보통 $\delta = 1 / (6 \times \text{width} \times \text{height})^{2}$ 로 선택한다. $Q$ 는 이미지의 통계적인 복잡성을 정량화하는 양으로 이 알고리즘에서는 외부에서 설정이 되는 값이다. 낮은 $Q$ 값을 선택하면 분할된 영역의 수가 적어지고(undersegmentation), 반대로 높은 $Q$ 값을 입력하면 분할된 영상에 너무 많은 영역이 나타나게 된다(oversegmentation).

Ref:

https://en.wikipedia.org/wiki/Statistical_region_merging

http://www.lix.polytechnique.fr/~nielsen/Srmjava.java

// Sets up a statistical-region-merging run over a width x height image.
//   width, height : image dimensions in pixels.
//   image         : pixel buffer read as 3 interleaved bytes per pixel, in the
//                   order B, G, R. The pointer is stored, not copied.
// Every pixel starts as its own one-pixel region whose channel averages are
// the pixel's own values.
Srm::Srm(int width, int height, BYTE *image) {
    const int npixels = width * height;

    this->width  = width;
    this->height = height;

    // Per-region statistics, indexed by region (initially: pixel) id.
    this->count = new int [npixels];
    this->Ravg  = new float [npixels];
    this->Gavg  = new float [npixels];
    this->Bavg  = new float [npixels];
    this->image = image;

    // Disjoint-set forest with one singleton set per pixel.
    this->UF = new Universe(npixels);

    // Seed each leaf region from its pixel (byte layout: B, G, R).
    for (int k = 0; k < npixels; ++k) {
        const int base = 3 * k;
        count[k] = 1;
        Bavg[k]  = image[base    ];
        Gavg[k]  = image[base + 1];
        Ravg[k]  = image[base + 2];
    }

    this->Q = 32;       // adjustable.
    this->g = 256.0;
    // Equals ln(1/delta) for delta = 1 / (6 * npixels)^2.
    this->logDelta = 2. * log(6.0 * npixels);
}
// Merging test for two regions.
// Returns true when, for each of the R, G and B channels, the squared
// difference of the two regions' channel averages is below a bound built from
// the region sizes (count[]), g, Q and logDelta.
bool Srm::Predicate(int rgn1, int rgn2) {
    // Size-dependent deviation bound, one term per region.
    const double scale    = g * g / (2.0 * Q);
    const double logTerm1 = min(g, count[rgn1]) * log(1.0 + count[rgn1]);
    const double logTerm2 = min(g, count[rgn2]) * log(1.0 + count[rgn2]);
    const double bound1   = scale * (logTerm1 + logDelta) / count[rgn1] ;
    const double bound2   = scale * (logTerm2 + logDelta) / count[rgn2] ;
    const double bound    = bound1 + bound2;

    // Channel-wise gaps between the region means.
    const double gapR = (Ravg[rgn1] - Ravg[rgn2]);
    const double gapG = (Gavg[rgn1] - Gavg[rgn2]);
    const double gapB = (Bavg[rgn1] - Bavg[rgn2]);

    // Every channel has to stay under the bound.
    if (!(gapR * gapR < bound)) return false;
    if (!(gapG * gapG < bound)) return false;
    return (gapB * gapB < bound);
}
// Merges two regions and stores the combined statistics on the surviving root.
//   rgn1, rgn2 : region ids; Segment() passes the results of UF->Find().
// The merged pixel count is the sum of both counts and each channel average is
// the count-weighted mean of the two regions' averages.
void Srm::Merge(int rgn1, int rgn2) {
    // Same region on both sides: nothing to merge. (The original compared
    // against an undeclared identifier `root2`.)
    if (rgn1 == rgn2) return;
    int w1 = count[rgn1], w2 = count[rgn2];
    // NOTE(review): Union presumably returns rgn1 or rgn2 as the new root -
    // confirm against Universe. The right-hand sides below are fully evaluated
    // before the store, so overwriting either slot is safe.
    int root = UF->Union(rgn1, rgn2);
    // update the merged region;
    count[root] = w1 + w2;
    double count_sum = w1 + w2;
    Ravg[root] = (w1 * Ravg[rgn1] + w2 * Ravg[rgn2]) / count_sum;
    Gavg[root] = (w1 * Gavg[rgn1] + w2 * Gavg[rgn2]) / count_sum;
    Bavg[root] = (w1 * Bavg[rgn1] + w2 * Bavg[rgn2]) / count_sum;
}
// Builds the list of 4-connected neighbouring pixel pairs of the image.
//   nedge : capacity of the returned array; the loops below write
//           2*(width-1)*(height-1) + (height-1) + (width-1) entries.
// Each Edge stores the two pixel indices (r1, r2) and `diff`, the largest
// absolute per-channel difference between the two pixels.
// The array is allocated with new[]; the caller is responsible for delete[].
// Edges are emitted in a fixed order: interior pixels (right edge, then edge
// to the pixel below), then the last column, then the last row.
Edge* Srm::Pairs(int nedge) {
    // 4-connectivity;
    const int lastRow = height - 1;
    const int lastCol = width - 1;
    Edge* edges = new Edge[nedge];
    int filled = 0;

    // Pixels that have both a right neighbour and a neighbour below.
    for (int row = 0; row < lastRow; row++) {
        for (int col = 0; col < lastCol; col++) {
            const int here  = row * width + col;
            const int right = here + 1;
            const int below = here + width;
            const int hereB = image[3 * here + 0];
            const int hereG = image[3 * here + 1];
            const int hereR = image[3 * here + 2];

            // here -- right
            int dB = abs(hereB - image[3 * right + 0]);
            int dG = abs(hereG - image[3 * right + 1]);
            int dR = abs(hereR - image[3 * right + 2]);
            Edge &toRight = edges[filled++];
            toRight.r1   = here;
            toRight.r2   = right;
            toRight.diff = max3(dB, dG, dR) ;

            // here
            //  |
            // below
            dB = abs(hereB - image[3 * below + 0]);
            dG = abs(hereG - image[3 * below + 1]);
            dR = abs(hereR - image[3 * below + 2]);
            Edge &toBelow = edges[filled++];
            toBelow.r1   = here;
            toBelow.r2   = below;
            toBelow.diff = max3(dB, dG, dR);
        }
    }

    // Last column (x = width - 1): only the edge to the pixel below exists.
    for (int row = 0; row < lastRow; row++) {
        const int here  = row * width + (width - 1);
        const int below = here + width;
        int dB = abs((int)image[3 * here + 0] - image[3 * below + 0]);
        int dG = abs((int)image[3 * here + 1] - image[3 * below + 1]);
        int dR = abs((int)image[3 * here + 2] - image[3 * below + 2]);
        Edge &toBelow = edges[filled++];
        toBelow.r1   = here;
        toBelow.r2   = below;
        toBelow.diff = max3(dB, dG, dR);
    }

    // Last row (y = height - 1): only the edge to the right neighbour exists.
    for (int col = 0; col < lastCol; col++) {
        const int here  = (height - 1) * width + col;
        const int right = here + 1;
        int dB = abs((int)image[3 * here + 0] - image[3 * right + 0]);
        int dG = abs((int)image[3 * here + 1] - image[3 * right + 1]);
        int dR = abs((int)image[3 * here + 2] - image[3 * right + 2]);
        Edge &toRight = edges[filled++];
        toRight.r1   = here;
        toRight.r2   = right;
        toRight.diff = max3(dB, dG, dR);
    }
    return edges;
}
int Srm::Segment() {
    // 4-connectivity 
    int nedge = 2 * (width - 1) * (height - 1) + (height - 1) + (width - 1);
    Edge* edgeList = Pairs(nedge);
    BucketSort(edgeList, nedge);
    for (int i = 0; i < nedge; i++) {
        Edge &e = edgeList[i];
        int r1 = UF->Find(e.r1);
        int r2 = UF->Find(e.r2);
        if ((r1 != r2) && (Predicate(r1, r2)))
            Merge(r1, r2);
    }
    delete [] edgeList;
    int rgn_count = 0;
    for (int node = width * height; node-- > 0;)
        if (UF->IsRoot(node)) rgn_count++;
    return rgn_count;
}
// Counting (bucket) sort of an edge array by ascending Edge::diff.
//   edgeList : in/out; the array allocated with new[] is deleted and the
//              pointer is replaced by a newly allocated, ordered array.
//   n        : number of edges in edgeList.
// Edges with equal diff keep their original relative order (forward scan into
// increasing slots).
// NOTE(review): assumes every diff lies in [0, 255], as hist has 256 bins -
// confirm against the producer of the edge list.
void BucketSort(Edge* &edgeList, int n) {
    // Nothing to reorder; also avoids new[] with a non-positive size.
    if (!edgeList || n <= 0) return;

    int hist[256] = {0}, chist[256];
    for (int i = 0; i < n; i++) hist[edgeList[i].diff]++;
    // cumulative histogram: chist[d] is the first output slot for diff == d,
    // hence chist[0] is 0 rather than hist[0].
    chist[0] = 0;
    for (int i = 1; i < 256; i++)
        chist[i] = chist[i - 1] + hist[i - 1];

    Edge *ordered = new Edge [n];
    // The original read from an undeclared identifier `pair`; the source of
    // the scatter is the input list itself.
    for (int i = 0; i < n; i++)
        ordered[chist[edgeList[i].diff]++] = edgeList[i];
    delete[] edgeList;
    edgeList = ordered;
}

저작자표시 비영리 변경금지

'Image Recognition > Fundamental' 카테고리의 다른 글

영상에 Impulse Noise 넣기 (2)	2023.02.09
Canny Edge: Non-maximal suppression (0)	2023.01.11
Moment-preserving Thresholding (0)	2022.05.29
Minimum Cross Entropy Thresholding (0)	2022.05.29
Quadtree Segmentation (0)	2022.05.21

Geometry & Recognition 알고리즘,계산기하,물리학,...

Moment-preserving Thresholding

Image Recognition/Fundamental 2022. 5. 29. 22:39

영상의 히스토그램( $h[z]$ )이 bimodal로 주어지는 경우 적절한 threshold 값을 선택해서 전경과 배경을 분리할 수 있다. 전경을 대표하는 픽셀 값을 $z_{f}$ , 배경을 대표하는 픽셀 값을 $z_{b}$ 라면 이진화 후 정규화된 히스토그램은

$\tilde{h}[z] = p_{b} \delta_{z, z_{b}} + p_{f} \delta_{z, z_{f}}$

로 표현된다. $p_{b}$ 은 배경에 해당하는 픽셀 비율이고, $p_{f}$ 은 전경에 해당하는 픽셀 비율이다.

threshold 값을 어떻게 선택하면 이진화된 영상의 히스토그램이 원 영상의 히스토그램의 특성을 최대한 담게 할 수 있을까? 이에 대한 기준으로 두 히스토그램의 $n$ 차 moment가 같은 값을 갖도록 하자. 주어진 미지수가 $p_{b}$ , $p_{f}$ , $z_{b}$ , $z_{f}$ 이 있으므로 최소한 4개의 moment가 같도록 만들어야 한다. 가장 낮은 차수의 moment로부터 시작해서 3차까지 4개의 moments가 같다는 조건에서 아래의 식들을 얻을 수 있다.

$\text{0-차 moment: } m_{0} \equiv \sum_{z=0}^{255} h[z] = p_{b} + p_{f} = 1$

$\text{1-차 moment: } m_{1} \equiv \sum_{z=0}^{255} z\, h[z] = p_{b} z_{b} + p_{f} z_{f}$

$\text{2-차 moment: } m_{2} \equiv \sum_{z=0}^{255} z^{2} h[z] = p_{b} z_{b}^{2} + p_{f} z_{f}^{2}$

$\text{3-차 moment: } m_{3} \equiv \sum_{z=0}^{255} z^{3} h[z] = p_{b} z_{b}^{3} + p_{f} z_{f}^{3}$

원 영상의 moment $m_{0}$ , $m_{1}$ , $m_{2}$ , $m_{3}$ 을 계산해서 풀면

$\begin{aligned} c_{0} &= \frac{m_{3} m_{1} - m_{2}^{2}}{m_{0} m_{2} - m_{1}^{2}}, \quad c_{1} = \frac{m_{1} m_{2} - m_{0} m_{3}}{m_{0} m_{2} - m_{1}^{2}} \\ z_{b} &= \frac{1}{2} \left( -c_{1} - \sqrt{c_{1}^{2} - 4 c_{0}} \right) \\ z_{f} &= \frac{1}{2} \left( -c_{1} + \sqrt{c_{1}^{2} - 4 c_{0}} \right) \\ p_{b} &= \frac{z_{f} - m_{1}}{z_{f} - z_{b}} \\ p_{f} &= 1 - p_{b} \end{aligned}$

따라서 threshold 값

$\sum_{z=0}^{T-1} h[z] = p_{b}$

을 만족하는 $T$ 를 선택하면 된다.

Ref: W. Tsai, "Moment-preserving thresholding: a new approach," Computer Vision, Graphics, and Image Processing, vol. 29, pp. 377-393, 1985.

// Moment-preserving threshold of a 256-bin gray-level histogram.
//   histogram : pixel counts per gray level 0..255.
// The two representative levels zb < zf and the background fraction pb are
// chosen so that the two-level histogram has the same 0th..3rd moments as the
// input. The returned threshold is the first level at which the cumulative
// normalised histogram exceeds pb.
// Returns 0 when no threshold can be determined: empty histogram, a single
// occupied gray level (zero variance), or a cumulative sum that never
// exceeds pb.
int MomentsPreseving_threshold(int histogram[256]) {
    // 64-bit total so the sum of the bins cannot overflow a 32-bit int.
    long long tot = 0;
    for (int i = 0; i < 256; i++)
        tot += histogram[i];
    if (tot <= 0)
        return 0;                  // nothing to normalise (avoids 0/0)

    // normalised histogram
    double hist[256];
    for (int i = 0; i < 256; i++)
        hist[i] = double(histogram[i]) / tot;

    // moments calculation: the zeroth moment is 1 by definition
    double m0 = 1, m1 = 0, m2 = 0, m3 = 0;
    for (int i = 0; i < 256; i++) {
        const double z = i;
        const double h = hist[i];
        m1 += z * h;
        m2 += z * z * h;
        m3 += z * z * z * h;
    }

    // det is the variance of the histogram; it vanishes when only one gray
    // level is occupied, in which case c0 and c1 are undefined.
    const double det = m0 * m2 - m1 * m1;
    if (!(det > 0.0))
        return 0;
    const double c0 = (m1 * m3 - m2 * m2) / det;
    const double c1 = (m2 * m1 - m3 * m0) / det;

    // zb and zf are the roots of z^2 + c1*z + c0 = 0; they must be real and
    // distinct for pb to be defined.
    const double disc = c1 * c1 - 4.0 * c0;
    if (!(disc > 0.0))
        return 0;
    const double root = sqrt(disc);
    const double zb = 0.5 * (-c1 - root);
    const double zf = 0.5 * (-c1 + root);
    const double pb = (zf - m1) / (zf - zb);

    // First level whose cumulative fraction exceeds the background fraction.
    double s = 0;
    for (int i = 0; i < 256; i++) {
        s += hist[i];
        if (s > pb)
            return i; // threshold
    }
    return 0;
}

저작자표시 비영리 변경금지

'Image Recognition > Fundamental' 카테고리의 다른 글

Canny Edge: Non-maximal suppression (0)	2023.01.11
Statistical Region Merging (0)	2022.06.11
Minimum Cross Entropy Thresholding (0)	2022.05.29
Quadtree Segmentation (0)	2022.05.21
Harris Corner Detector (0)	2022.04.07

Geometry & Recognition 알고리즘,계산기하,물리학,...

Minimum Cross Entropy Thresholding

Image Recognition/Fundamental 2022. 5. 29. 17:25

$\text{threshold} = \underset{0 \leq t < 256}{\operatorname{argmin}} \left[ -p_{f}(t) \log(\mu_{f}(t)) - p_{b}(t) \log(\mu_{b}(t)) \right]$

where

$p_{b}(t) = \int_{0}^{t} h(z)\, dz, \quad p_{f}(t) = \int_{t}^{255} h(z)\, dz$

$\mu_{b}(t) = \frac{1}{p_{b}(t)} \int_{0}^{t} z\, h(z)\, dz, \quad \mu_{f}(t) = \frac{1}{p_{f}(t)} \int_{t}^{255} z\, h(z)\, dz$

Ref: Li C.H. and Tam P.K.S. (1998) "An Iterative Algorithm for Minimum Cross Entropy Thresholding," Pattern Recognition Letters, 18(8): 771-776

// Iterative minimum-cross-entropy threshold of a 256-bin histogram.
//   hist : pixel counts per gray level 0..255.
// Starting from the global mean, the threshold is repeatedly replaced by
//   (bgmean - fgmean) / (log(bgmean) - log(fgmean)),
// where bgmean / fgmean are the mean gray levels at or below / above the
// rounded current threshold, until two successive values differ by less
// than 0.5.
// Returns the final (non-integer) threshold, or 0 for an empty histogram.
double MCE_threshold(int hist[256]) {
    // 64-bit accumulators: the weighted sum can reach 255 * (pixel count),
    // which overflows a 32-bit int for images of roughly 8 megapixels or more.
    long long chist[256], cxhist[256];
    chist[0] = hist[0]; cxhist[0] = 0;
    for (int i = 1; i < 256; i++) {
        chist[i]  = chist[i - 1] + hist[i];
        cxhist[i] = cxhist[i - 1] + static_cast<long long>(i) * hist[i];
    }
    const long long num = chist[255];
    if (num <= 0)
        return 0.0;                // empty histogram: the mean is undefined

    /* Initial estimate: global mean */
    double threshold = double(cxhist[255]) / num;

    // The update depends only on the integer t (256 possible values), so a
    // run that has not converged after this many steps is cycling.
    const int kMaxIter = 512;
    for (int iter = 0; iter < kMaxIter; iter++) {
        const double old_thresh = threshold;
        int t = int(old_thresh + .5);
        if (t < 0)   t = 0;        // keep the table index in range
        if (t > 255) t = 255;

        /* background: levels 0..t */
        const long long bgnum = chist[t];
        const long long bgsum = cxhist[t];
        const double bgmean = bgnum == 0 ? 0 : double(bgsum) / bgnum;
        /* foreground: levels t+1..255 */
        const long long fgnum = num - bgnum;
        const long long fgsum = cxhist[255] - bgsum;
        const double fgmean = fgnum == 0 ? 0 : double(fgsum) / fgnum;

        if (bgmean <= 0 || fgmean <= 0) {
            // log(0) is -infinity. The update tends to 0 when one mean is 0,
            // and is 0/0 (NaN) when both are, so use the limit value 0.
            threshold = 0;
        } else if (bgmean == fgmean) {
            threshold = bgmean;    // avoids 0/0; limit of the update formula
        } else {
            threshold = (bgmean - fgmean) / (log(bgmean) - log(fgmean));
        }
        // threshold is non-negative by construction at this point.
        if (fabs(threshold - old_thresh) < 0.5)
            break;
    }
    return threshold;
}

저작자표시 비영리 변경금지

'Image Recognition > Fundamental' 카테고리의 다른 글

Statistical Region Merging (0)	2022.06.11
Moment-preserving Thresholding (0)	2022.05.29
Quadtree Segmentation (0)	2022.05.21
Harris Corner Detector (0)	2022.04.07
Valley emphasis Otsu threshold (0)	2022.02.23

Geometry & Recognition 알고리즘,계산기하,물리학,...

이전 1 2 3 4 5 6 7 8 ··· 25 다음

내 블로그 - 관리자 홈 전환	`Q` `Q`
새 글 쓰기	`W` `W`

글 수정 (권한 있는 경우)	`E` `E`
댓글 영역으로 이동	`C` `C`

이 페이지의 URL 복사	`S` `S`
맨 위로 이동	`T` `T`
티스토리 홈 이동	`H` `H`
단축키 안내	`Shift` + `/` `⇧` + `/`

Geometry & Recognition

Statistical Region Merging

'Image Recognition > Fundamental' 카테고리의 다른 글

Moment-preserving Thresholding

'Image Recognition > Fundamental' 카테고리의 다른 글

Minimum Cross Entropy Thresholding

'Image Recognition > Fundamental' 카테고리의 다른 글

카테고리

태그목록

최근에 올라온 글

최근에 달린 댓글

글 보관함

티스토리툴바

개인정보

단축키

내 블로그

블로그 게시글

모든 영역