Ex2：用CImg重写、封装给定的Canny代码，并测试(Code0)

本文介绍了如何使用CImg库重写和封装Canny边缘检测算法，详细讨论了不同参数（如低阈值、高阈值、高斯核参数等）对检测结果的影响，并给出了修改参数后的测试分析。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

Ex2：用CImg重写、封装给定的Canny代码，并测试(Code0)

github地址:https://github.com/linjiafengyang/ComputerVision

代码文件

用CImg重写Code0文件夹中的canny.c和canny.h为canny.cpp和canny.h，并增加一个main.cpp文件作为图像数据输入并测试。
重写过程：首先替换原来的图像输入为CImg图像输入，以及对像素点的for循环更改为CImg版本cimg_forXY()，最后把原来的C语言struct结构体改成C++类。

canny.h文件

#ifndef canny_h
#define canny_h

#include "CImg.h"
using namespace cimg_library;

class Canny
{
public:
    CImg<unsigned char> canny(CImg<unsigned char> grey, int width, int height);
    CImg<unsigned char> cannyparam(CImg<unsigned char> grey, int width, int height,
                          float lowthreshold, float highthreshold,
                          float gaussiankernelradius, int gaussiankernelwidth,  
                          int contrastnormalised);

    Canny *allocatebuffers(const CImg<unsigned char> & grey, int width, int height);
    void killbuffers(Canny *can);
    int computeGradients(Canny *can, float kernelRadius, int kernelWidth);
    void performHysteresis(Canny *can, int low, int high);
    void follow(Canny *can, int x1, int y1, int i1, int threshold);
    void normalizeContrast(CImg<unsigned char> & data, int width, int height);
    float hypotenuse(float x, float y);
    float gaussian(float x, float sigma);

private:
    CImg<unsigned char> data; /* input image */
    int width;
    int height;
    int *idata;          /* output for edges */
    int *magnitude;      /* edge magnitude as detected by Gaussians */
    float *xConv;        /* temporary for convolution in x direction */
    float *yConv;        /* temporary for convolution in y direction */
    float *xGradient;    /* gradients in x direction, as detected by Gaussians */
    float *yGradient;    /* gradients in x direction,a s detected by Gaussians */

};

#endif

canny.cpp文件

#include "canny.h"
#include <math.h>

#define ffabs(x) ( (x) >= 0 ? (x) : -(x) ) 
#define GAUSSIAN_CUT_OFF 0.005f
#define MAGNITUDE_SCALE 100.0f
#define MAGNITUDE_LIMIT 1000.0f
#define MAGNITUDE_MAX ((int) (MAGNITUDE_SCALE * MAGNITUDE_LIMIT))

/*
  Canny edge detection with default parameters
    Params: grey - the greyscale image
            width, height - image width and height
    Returns: binary image with edges as set pixels
*/
CImg<unsigned char> Canny::canny(CImg<unsigned char> grey, int width, int height)
{
    return cannyparam(grey, width, height, 2.5f, 7.5f, 2.0f, 16, 0);
}

/*
Canny edge detection with parameters passed in by user
Params: grey - the greyscale image
width, height - image dimensions
lowthreshold - default 2.5
highthreshold - default 7.5
gaussiankernelradius - radius of edge detection Gaussian, in standard deviations
(default 2.0)
gaussiankernelwidth - width of Gaussian kernel, in pixels (default 16)
contrastnormalised - flag to normalise image before edge detection (defualt 0)
Returns: binary image with set pixels as edges
*/
CImg<unsigned char> Canny::cannyparam(CImg<unsigned char> grey, int width, int height,
                                        float lowthreshold, float highthreshold,
                                        float gaussiankernelradius, int gaussiankernelwidth,
                                        int contrastnormalised)
{
    Canny *can = 0;
    CImg<unsigned char> answer = CImg<unsigned char>(width, height, 1, 1, 0);
    int low, high;
    int err;
    int i;

    can = allocatebuffers(grey, width, height);

    if (!can)
        goto error_exit;
    if (contrastnormalised)
        normalizeContrast(can->data, width, height);

    err = computeGradients(can, gaussiankernelradius, gaussiankernelwidth);

    if (err < 0)
        goto error_exit;

    low = (int)(lowthreshold * MAGNITUDE_SCALE + 0.5f);
    high = (int)(highthreshold * MAGNITUDE_SCALE + 0.5f);
    performHysteresis(can, low, high);

    cimg_forXY(answer, x, y)
    {
        i = y * width + x;
        answer(x, y, 0) = can->idata[i] > 0 ? 255 : 0;
    }

    killbuffers(can);
    return answer;
error_exit:
    free(answer);
    killbuffers(can);
    return CImg<unsigned char>();
}

/*
buffer allocation
*/
Canny * Canny::allocatebuffers(const CImg<unsigned char> & grey, int width, int height)
{
    Canny *answer;

    answer = new Canny;
    if (!answer)
        goto error_exit;
    answer->data = CImg<unsigned char>(width, height, 1, 1, 0);
    answer->idata = new int[width * height];
    answer->magnitude = new int[width * height];
    answer->xConv = new float[width * height];
    answer->yConv = new float[width * height];
    answer->xGradient = new float[width * height];
    answer->yGradient = new float[width * height];

    if (!answer->data || !answer->idata || !answer->magnitude ||
        !answer->xConv || !answer->yConv ||
        !answer->xGradient || !answer->yGradient)
        goto error_exit;

    cimg_forXY(grey, x, y)
    {
        answer->data(x, y, 0) = grey(x, y, 0);
    }
    answer->width = width;
    answer->height = height;

    return answer;
error_exit:
    killbuffers(answer);
    return 0;
}

/*
buffers destructor
*/
void Canny::killbuffers(Canny *can) {
    if (can)
    {
        delete(can->idata);
        delete(can->magnitude);
        delete(can->xConv);
        delete(can->yConv);
        delete(can->xGradient);
        delete(can->yGradient);
    }
}

/* NOTE: The elements of the method below (specifically the technique for
non-maximal suppression and the technique for gradient computation)
are derived from an implementation posted in the following forum (with the
clear intent of others using the code):
http://forum.java.sun.com/thread.jspa?threadID=546211&start=45&tstart=0
My code effectively mimics the algorithm exhibited above.
Since I don't know the providence of the code that was posted it is a
possibility (though I think a very remote one) that this code violates
someone's intellectual property rights. If this concerns you feel free to
contact me for an alternative, though less efficient, implementation.
*/
int Canny::computeGradients(Canny *can, float kernelRadius, int kernelWidth)
{
    float *kernel;
    float *diffKernel;
    int kwidth;

    int width, height;

    int initX;
    int maxX;
    int initY;
    int maxY;

    int x, y;
    int i;
    int flag;

    width = can->width;
    height = can->height;

    kernel = new float[kernelWidth];
    diffKernel = new float[kernelWidth];

    if (!kernel || !diffKernel)
        goto error_exit;

    /* initialise the Gaussian kernel */
    for (kwidth = 0; kwidth < kernelWidth; kwidth++)
    {
        float g1, g2, g3;
        g1 = gaussian((float)kwidth, kernelRadius);
        if (g1 <= GAUSSIAN_CUT_OFF && kwidth >= 2)
            break;
        g2 = gaussian(kwidth - 0.5f, kernelRadius);
        g3 = gaussian(kwidth + 0.5f, kernelRadius);
        kernel[kwidth] = (g1 + g2 + g3) / 3.0f / (2.0f * (float) 3.14 * kernelRadius * kernelRadius);
        diffKernel[kwidth] = g3 - g2;
    }

    initX = kwidth - 1;
    maxX = width - (kwidth - 1);
    initY = width * (kwidth - 1);
    maxY = width * (height - (kwidth - 1));

    /* perform convolution in x and y directions */
    for (x = initX; x < maxX; x++)
    {
        for (y = initY; y < maxY; y += width)
        {
            int index = x + y;
            float sumX = can->data[index] * kernel[0];
            float sumY = sumX;
            int xOffset = 1;
            int yOffset = width;
            while (xOffset < kwidth)
            {
                sumY += kernel[xOffset] * (can->data[index - yOffset] + can->data[index + yOffset]);
                sumX += kernel[xOffset] * (can->data[index - xOffset] + can->data[index + xOffset]);
                yOffset += width;
                xOffset++;
            }

            can->yConv[index] = sumY;
            can->xConv[index] = sumX;
        }
    }

    for (x = initX; x < maxX; x++)
    {
        for (y = initY; y < maxY; y += width)
        {
            float sum = 0.0f;
            int index = x + y;
            for (i = 1; i < kwidth; i++)
                sum += diffKernel[i] * (can->yConv[index - i] - can->yConv[index + i]);

            can->xGradient[index] = sum;
        }
    }

    for (x = kwidth; x < width - kwidth; x++)
    {
        for (y = initY; y < maxY; y += width)
        {
            float sum = 0.0f;
            int index = x + y;
            int yOffset = width;
            for (i = 1; i < kwidth; i++)
            {
                sum += diffKernel[i] * (can->xConv[index - yOffset] - can->xConv[index + yOffset]);
                yOffset += width;
            }

            can->yGradient[index] = sum;
        }
    }

    initX = kwidth;
    maxX = width - kwidth;
    initY = width * kwidth;
    maxY = width * (height - kwidth);
    for (x = initX; x < maxX; x++)
    {
        for (y = initY; y < maxY; y += width)
        {
            int index = x + y;
            int indexN = index - width;
            int indexS = index + width;
            int indexW = index - 1;
            int indexE = index + 1;
            int indexNW = indexN - 1;
            int indexNE = indexN + 1;
            int indexSW = indexS - 1;
            int indexSE = indexS + 1;

            float xGrad = can->xGradient[index];
            float yGrad = can->yGradient[index];
            float gradMag = hypotenuse(xGrad, yGrad);

            /* perform non-maximal supression */
            float nMag = hypotenuse(can->xGradient[indexN], can->yGradient[indexN]);
            float sMag = hypotenuse(can->xGradient[indexS], can->yGradient[indexS]);
            float wMag = hypotenuse(can->xGradient[indexW], can->yGradient[indexW]);
            float eMag = hypotenuse(can->xGradient[indexE], can->yGradient[indexE]);
            float neMag = hypotenuse(can->xGradient[indexNE], can->yGradient[indexNE]);
            float seMag = hypotenuse(can->xGradient[indexSE], can->yGradient[indexSE]);
            float swMag = hypotenuse(can->xGradient[indexSW], can->yGradient[indexSW]);
            float nwMag = hypotenuse(can->xGradient[indexNW], can->yGradient[indexNW]);
            float tmp;
            /*
            * An explanation of what's happening here, for those who want
            * to understand the source: This performs the "non-maximal
            * supression" phase of the Canny edge detection in which we
            * need to compare the gradient magnitude to that in the
            * direction of the gradient; only if the value is a local
            * maximum do we consider the point as an edge candidate.
            *
            * We need to break the comparison into a number of different
            * cases depending on the gradient direction so that the
            * appropriate values can be used. To avoid computing the
            * gradient direction, we use two simple comparisons: first we
            * check that the partial derivatives have the same sign (1)
            * and then we check which is larger (2). As a consequence, we
            * have reduced the problem to one of four identical cases that
            * each test the central gradient magnitude against the values at
            * two points with 'identical support'; what this means is that
            * the geometry required to accurately interpolate the magnitude
            * of gradient function at those points has an identical
            * geometry (upto right-angled-rotation/reflection).
            *
            * When comparing the central gradient to the two interpolated
            * values, we avoid performing any divisions by multiplying both
            * sides of each inequality by the greater of the two partial
            * derivatives. The common comparand is stored in a temporary
            * variable (3) and reused in the mirror case (4).
            *
            */
            flag = ((xGrad * yGrad <= 0.0f) /*(1)*/
                ? ffabs(xGrad) >= ffabs(yGrad) /*(2)*/
                ? (tmp = ffabs(xGrad * gradMag)) >= ffabs(yGrad * neMag - (xGrad + yGrad) * eMag) /*(3)*/
                && tmp > fabs(yGrad * swMag - (xGrad + yGrad) * wMag) /*(4)*/
                : (tmp = ffabs(yGrad * gradMag)) >= ffabs(xGrad * neMag - (yGrad + xGrad) * nMag) /*(3)*/
                && tmp > ffabs(xGrad * swMag - (yGrad + xGrad) * sMag) /*(4)*/
                : ffabs(xGrad) >= ffabs(yGrad) /*(2)*/
                ? (tmp = ffabs(xGrad * gradMag)) >= ffabs(yGrad * seMag + (xGrad - yGrad) * eMag) /*(3)*/
                && tmp > ffabs(yGrad * nwMag + (xGrad - yGrad) * wMag) /*(4)*/
                : (tmp = ffabs(yGrad * gradMag)) >= ffabs(xGrad * seMag + (yGrad - xGrad) * sMag) /*(3)*/
                && tmp > ffabs(xGrad * nwMag + (yGrad - xGrad) * nMag) /*(4)*/
                );
            if (flag)
            {
                can->magnitude[index] = (gradMag >= MAGNITUDE_LIMIT) ? MAGNITUDE_MAX : (int)(MAGNITUDE_SCALE * gradMag);
                /*NOTE: The orientation of the edge is not employed by this
                implementation. It is a simple matter to compute it at
                this point as: Math.atan2(yGrad, xGrad); */
            }
            else
            {
                can->magnitude[index] = 0;
            }
        }
    }
    free(kernel);
    free(diffKernel);
    return 0;
error_exit:
    free(kernel);
    free(diffKernel);
    return -1;
}

/*
we follow edges. high gives the parameter for starting an edge,
how the parameter for continuing it.
*/
void Canny::performHysteresis(Canny *can, int low, int high)
{
    int offset = 0;
    int x, y;

    memset(can->idata, 0, can->width * can->height * sizeof(int));

    for (y = 0; y < can->height; y++)
    {
        for (x = 0; x < can->width; x++) {
            if (can->idata[offset] == 0 && can->magnitude[offset] >= high)
                follow(can, x, y, offset, low);
            offset++;
        }
    }
}

/*
recursive portion of edge follower
*/
void Canny::follow(Canny *can, int x1, int y1, int i1, int threshold)
{
    int x, y;
    int x0 = x1 == 0 ? x1 : x1 - 1;
    int x2 = x1 == can->width - 1 ? x1 : x1 + 1;
    int y0 = y1 == 0 ? y1 : y1 - 1;
    int y2 = y1 == can->height - 1 ? y1 : y1 + 1;

    can->idata[i1] = can->magnitude[i1];
    for (x = x0; x <= x2; x++)
    {
        for (y = y0; y <= y2; y++)
        {
            int i2 = x + y * can->width;
            if ((y != y1 || x != x1) && can->idata[i2] == 0 && can->magnitude[i2] >= threshold)
                follow(can, x, y, i2, threshold);
        }
    }
}

void Canny::normalizeContrast(CImg<unsigned char> & data, int width, int height)
{
    int histogram[256] = { 0 };
    int remap[256];
    int sum = 0;
    int j = 0;
    int k;
    int target;
    int i;

    cimg_forXY(data, x, y)
    {
        histogram[data(x, y, 0)]++;
    }

    for (i = 0; i < 256; i++)
    {
        sum += histogram[i];
        target = (sum * 255) / (width * height);
        for (k = j + 1; k <= target; k++)
            remap[k] = i;
        j = target;
    }

    cimg_forXY(data, x, y)
    {
        data(x, y, 0) = remap[data(x, y, 0)];
    }
}

float Canny::hypotenuse(float x, float y)
{
    return (float)sqrt(x*x + y*y);
}

float Canny::gaussian(float x, float sigma)
{
    return (float)exp(-(x * x) / (2.0f * sigma * sigma));
}

main.cpp文件

#include "canny.cpp"

int main() {
    CImg<unsigned char> bigben_grey("../test_Data/bigben.bmp");
    Canny c;
    CImg<unsigned char> bigben_canny = c.canny(bigben_grey, bigben_grey.width(), bigben_grey.height());
    bigben_canny.save("../result_Data/bigben_canny.bmp");

    CImg<unsigned char> lena_grey("../test_Data/lena.bmp");
    CImg<unsigned char> lena_canny = c.canny(lena_grey, lena_grey.width(), lena_grey.height());
    lena_canny.save("../result_Data/lena_canny.bmp");
    //lena_canny.display("lena_canny");

    CImg<unsigned char> stpietro_grey("../test_Data/stpietro.bmp");
    CImg<unsigned char> stpietro_canny = c.canny(stpietro_grey, stpietro_grey.width(), stpietro_grey.height());
    stpietro_canny.save("../result_Data/stpietro_canny.bmp");

    CImg<unsigned char> twows_grey("../test_Data/twows.bmp");
    CImg<unsigned char> twows_canny = c.canny(twows_grey, twows_grey.width(), twows_grey.height());
    twows_canny.save("../result_Data/twows_canny.bmp");
    return 0;
}

测试数据

作业中有四张bmp图像，但这里限于篇幅，我以女神lena为例：
这里写图片描述

测试结果

这里写图片描述

修改算法参数后的测试结果

注意到程序中这个函数接收Canny边缘检测算法的相关参数，也就是调参主要是针对这几个参数：其中width和height为输入图像的宽度和高度，无需调整，所以一共有五个参数需要调整，分别为lowthreshold低阈值（默认2.5）、highthreshold高阈值（默认7.5）、gaussiankernelradius标准差（默认2.0）、gaussiankernelwidth高斯卷积核大小（默认16）、contrastnormalised图像是否需要归一化（默认0值表示不需要）。

lowthreshold低阈值

保持其他参数不变，修改低阈值后的测试结果如下：默认2.5。
这里写图片描述

分析：

可以看出，我们修改原程序中的lowthreshold低阈值后，比如改成0.1，低阈值减小，将会增加很多噪声；而改成6.0，低阈值增大，又会丢失很多强边缘像素。这与已知结论吻合：对于弱边缘像素（在低阈值和高阈值之间），这些像素可以从真实边缘提取也可以是因噪声或颜色变化引起的。为了获得准确的结果，应该抑制由后者引起的弱边缘像素。因此需要调整低阈值参数。

highthreshold高阈值

保持其他参数不变，修改高阈值后的测试结果如下：默认7.5。
这里写图片描述

分析：

可以看出，我们修改原程序中的highthreshold高阈值后，比如改成3.0，高阈值减小，此时将会增加很多强边缘像素，因为大于3的像素点将被确定为边缘；而改成10.0，高阈值增大，原来的强边缘像素大部分会转化为弱边缘像素，丢失一部分边缘像素点。这与已知结论吻合：被划分为强边缘的像素点已经被确定为边缘，因为它们是从图像中的真实边缘中提取出来的。

gaussiankernelradius标准差

保持其他参数不变，修改标准差后的测试结果如下：默认2.0。
这里写图片描述

分析：

可以看出，我们修改原程序中的gaussiankernelradius标准差后，比如改成1.0，标准差减小，为标准正态分布，此时将会增加很多噪声，高斯滤波平滑效果不好，表现为噪声过多；而改成4.0，标准差增大，原来的强边缘像素大部分被误认为噪声，因此将会被丢弃，造成边缘缺失，高斯滤波平滑效果也不好。这与已知结论吻合：为了平滑图像，使用高斯滤波器与图像进行卷积，该步骤将平滑图像，以减少边缘检测器上明显的噪声影响。

gaussiankernelwidth高斯卷积核大小

保持其他参数不变，修改高斯卷积核大小后的测试结果如下：默认16。
这里写图片描述

分析：

可以看出，我们修改原程序中的gaussiankernelwidth高斯卷积核大小后，比如改成7，发现两张边缘检测图其实没变化，说明原程序中高斯卷积核大小16已经过大，将会浪费内存空间，其实为7就有同样的效果了；而改成5，高斯卷积核大小为5也是比较推荐的折中，再看改成3，此时丢失了很多边缘像素，即误认为噪声，对噪声的敏感度较大。这与已知结论吻合：高斯卷积核大小越大，检测器对噪声的敏感度越低，但是边缘检测的定位误差也将略有增加。