【opencv】示例-pca.cpp PCA图像重建演示

news2026/3/16 10:10:39

// 加载必要的头文件
#include <iostream> // 用于标准输入输出流
#include <fstream>  // 用于文件的输入输出
#include <sstream>  // 用于字符串的输入输出流操作


#include <opencv2/core.hpp>          // OpenCV核心功能的头文件
#include "opencv2/imgcodecs.hpp"     // OpenCV图像编解码功能的头文件
#include <opencv2/highgui.hpp>       // OpenCV的高级GUI（图形用户界面）


// 使用标准命名空间和OpenCV命名空间，避免重复声明
using namespace cv;
using namespace std;


///
// 函数声明部分


// read_imgList函数用于从文本文件中读取图像路径并加载这些图像
static void read_imgList(const string& filename, vector<Mat>& images) {
    std::ifstream file(filename.c_str(), ifstream::in); // 打开文件
    if (!file) {
        string error_message = "No valid input file was given, please check the given filename."; // 错误消息
        CV_Error(Error::StsBadArg, error_message); // 如果文件打开失败，给出错误信息并退出程序
    }
    string line; // 存储读取的每行文字
    while (getline(file, line)) {
        images.push_back(imread(line, IMREAD_GRAYSCALE)); // 将每行读取到的图像路径用于加载图像，并转换为灰度图像
    }
}


// formatImagesForPCA函数用于将图像数据格式化为一个适合PCA处理的矩阵
static  Mat formatImagesForPCA(const vector<Mat> &data)
{
    // 创建一个用于PCA处理的矩阵，将所有图像行向量垂直堆叠
    Mat dst(static_cast<int>(data.size()), data[0].rows*data[0].cols, CV_32F);
    for(unsigned int i = 0; i < data.size(); i++) // 遍历所有图像
    {
        Mat image_row = data[i].clone().reshape(1,1); // 将每张图像转换为行向量
        Mat row_i = dst.row(i); // 获取目标矩阵的当前行
        image_row.convertTo(row_i,CV_32F); // 将图像数据转换为浮点型，并填入目标矩阵的相应行
    }
    return dst; // 返回格式化后的矩阵
}


// toGrayscale函数用于将输入图像转换为灰度图像，并进行归一化处理
static Mat toGrayscale(InputArray _src) {
    Mat src = _src.getMat(); // 获取输入数据的Mat对象
    // 检查是否是单通道图像
    if(src.channels() != 1) {
        CV_Error(Error::StsBadArg, "Only Matrices with one channel are supported"); // 如果不是，抛出异常
    }
    // 创建一个目标Mat对象，并对输入图像进行归一化处理
    Mat dst;
    cv::normalize(_src, dst, 0, 255, NORM_MINMAX, CV_8UC1);
    return dst; // 返回处理后的图像
}


// 定义一个结构体用于传递给滑动条回调函数的参数
struct params
{
    Mat data;    // 存放数据的Mat矩阵
    int ch;      // 图像的通道数
    int rows;    // 图像行数
    PCA pca;     // PCA对象
    string winName; // 窗口名称
};


// onTrackbar滑动条回调函数，用于根据Retained Variance(保留方差)的变化更新PCA结果并显示
static void onTrackbar(int pos, void* ptr)
{
    cout << "Retained Variance = " << pos << "%   ";
    cout << "re-calculating PCA..." << std::flush; // 提示正在重新计算PCA


    double var = pos / 100.0; // 将滑动条的整型位置值转换为[0,1]之间的百分比表示的保留方差


    struct params *p = (struct params *)ptr; // 从回调函数的指针参数中提取出params结构体


    // 使用新的保留方差重新计算PCA
    p->pca = PCA(p->data, cv::Mat(), PCA::DATA_AS_ROW, var); 


    // 将原始数据的第一行（第一幅图像）投影到PCA空间，并获取其点representation
    Mat point = p->pca.project(p->data.row(0));
    // 然后利用该点representation重构图像
    Mat reconstruction = p->pca.backProject(point);
    reconstruction = reconstruction.reshape(p->ch, p->rows); // 重构的图像需要重新改变其形状
    reconstruction = toGrayscale(reconstruction); // 转换为灰度图便于显示


    // 在窗口中显示重构的图像
    imshow(p->winName, reconstruction);
    // 打印PCA使用的主成分数量
    cout << "done!   # of principal components: " << p->pca.eigenvectors.rows << endl;
}


///
// 主程序
int main(int argc, char** argv)
{
    // 解析命令行参数
    cv::CommandLineParser parser(argc, argv, "{@input||image list}{help h||show help message}");
    // 如果存在"help"参数，则打印帮助消息
    if (parser.has("help"))
    {
        parser.printMessage();
        exit(0);
    }
    
    // 获取CSV文件的路径
    string imgList = parser.get<string>("@input");
    // 如果未传入图片列表，则打印消息并退出程序
    if (imgList.empty())
    {
        parser.printMessage();
        exit(1);
    }
    
    // 创建一个向量来存储图像
    vector<Mat> images;
    
    // 读取数据，如果失败则会抛出异常
    try {
        read_imgList(imgList, images);
    } catch (const cv::Exception& e) {
        cerr << "Error opening file \"" << imgList << "\". Reason: " << e.msg << endl;
        exit(1);
    }
    
    // 如果图片不足以进行此演示，则退出程序
    if(images.size() <= 1) {
        string error_message = "This demo needs at least 2 images to work. Please add more images to your data set!";
        CV_Error(Error::StsError, error_message);
    }
    
    // 将图像重排并堆叠成一个行矩阵
    Mat data = formatImagesForPCA(images);
    
    // 执行PCA
    // 这里trackbar初始设置为95%，这也是一个常见的保留方差值
    PCA pca(data, cv::Mat(), PCA::DATA_AS_ROW, 0.95); 


    // 展示保留方差对第一张图片效果的演示
    Mat point = pca.project(data.row(0)); // 将图像投影到特征空间，图像变成了一个“点”
    Mat reconstruction = pca.backProject(point); // 从“点”中重建图像
    reconstruction = reconstruction.reshape(images[0].channels(), images[0].rows); // 重新将行向量变形为图像形状
    reconstruction = toGrayscale(reconstruction); // 重新缩放以便于显示
    
    // 初始化高层GUI窗口
    string winName = "Reconstruction | press 'q' to quit";
    namedWindow(winName, WINDOW_NORMAL);
    
    // 创建一个结构体以传递给trackbar处理函数
    params p;
    p.data = data;
    p.ch = images[0].channels();
    p.rows = images[0].rows;
    p.pca = pca;
    p.winName = winName;
    
    // 创建trackbar
    int pos = 95;
    createTrackbar("Retained Variance (%)", winName, &pos, 100, onTrackbar, (void*)&p);
    
    // 显示直到用户按下'q'键
    imshow(winName, reconstruction);
    
    char key = 0;
    while(key != 'q')
        key = (char)waitKey();
        
    return 0;
}

代码的主要功能是，通过用户输入一个包含图像全路径的文本文件，该文件的每一行都代表一张图片的路径。程序将会使用主成分分析(PCA)技术对这些图像进行处理，并通过OpenCV库完成。这一处理过程可以通过一个trackbar（滑动条）来动态调整保留方差的百分比，从而展现不同保留方差下图像重建的效果。程序界面会持续显示直到用户按下'q'键退出。这个代码示例建议使用AT&T人脸数据库的前15个人脸图片来演示。

// Reshape and stack images into a rowMatrix
    Mat data = formatImagesForPCA(images);


    // perform PCA
    PCA pca(data, cv::Mat(), PCA::DATA_AS_ROW, 0.95); // trackbar is initially set here, also this is a common value for retainedVariance


    // Demonstration of the effect of retainedVariance on the first image
    Mat point = pca.project(data.row(0)); // project into the eigenspace, thus the image becomes a "point"
    Mat reconstruction = pca.backProject(point); // re-create the image from the "point"
    reconstruction = reconstruction.reshape(images[0].channels(), images[0].rows); // reshape from a row vector into image shape
    reconstruction = toGrayscale(reconstruction); // re-scale for displaying purposes