gpt4 book ai didi

.net - 在 opencv 中查找视频帧的熵时出现奇怪的输出

转载 作者:太空宇宙 更新时间:2023-11-03 20:53:44 26 4
gpt4 key购买 nike

#include <cv.h>
#include <highgui.h>
#include <iostream>
#include <cmath>
#include <cstdlib>
#include <fstream>

using namespace std;

typedef struct histBundle {
double rCh[256];
double gCh[256];
double bCh[256];
}bundleForHist;

bundleForHist getHistFromImage (IplImage* img, int numBins) {
float range[] = {
0,
numBins
};
float *ranges[] = {
range
};

bundleForHist bfh;

CvHistogram *hist = cvCreateHist (1, &numBins, CV_HIST_ARRAY, ranges, 1);
cvClearHist (hist);
IplImage* imgRed = cvCreateImage(cvGetSize(img), 8, 1);
IplImage* imgGreen = cvCreateImage(cvGetSize(img), 8, 1);
IplImage* imgBlue = cvCreateImage(cvGetSize(img), 8, 1);
cvSplit(img, imgBlue, imgGreen, imgRed, NULL);
cvCalcHist(&imgRed, hist, 0, 0);
for (int i = 0; i < numBins; ++i) {
bfh.rCh[i] = cvQueryHistValue_1D(hist, i);
}
cvClearHist(hist);
cvCalcHist(&imgGreen, hist, 0, 0);
for (int i = 0; i < numBins; ++i) {
bfh.gCh[i] = cvQueryHistValue_1D(hist, i);
}
cvClearHist(hist);
cvCalcHist(&imgBlue, hist, 0, 0);
for (int i = 0; i < numBins; ++i) {
bfh.bCh[i] = cvQueryHistValue_1D(hist, i);
}
cvClearHist(hist);
return bfh;
}

int main (int argc, char** argv) {
int c;
IplImage* img = NULL;
int frame_number = 0;
CvCapture* capture = cvCaptureFromAVI ("Cricketc1.avi");
assert(capture);
int fps = ( int )cvGetCaptureProperty( capture, CV_CAP_PROP_FPS );
cvNamedWindow ("Video", 0);

while (1) {
//IplImage * img = cvLoadImage("C:\\Users\\ANIMES~1\\Desktop\\bw.jpg");
img = cvQueryFrame(capture);
frame_number++;
if (img) {
cvShowImage("Video", img);
int numBins = 256;
bundleForHist bfh;
bfh = getHistFromImage (img, numBins);
double totalForR = 0;
double totalForG = 0;
double totalForB = 0;
double probR[256];
double probG[256];
double probB[256];
for (int i = 0; i < numBins-1; ++i) {
totalForR += bfh.rCh[i];
totalForG += bfh.gCh[i];
totalForB += bfh.bCh[i];
}
double lengthHistogram = totalForR + totalForG + totalForB;
for (int i = 0; i < 256; ++i) {
probR[i] = bfh.rCh[i]/(double)lengthHistogram;
probG[i] = bfh.gCh[i]/(double)lengthHistogram;
probB[i] = bfh.bCh[i]/(double)lengthHistogram;
//file << bfh.rCh[i] << "\t" << bfh.gCh[i] << "\t" << bfh.bCh[i] << "\t" << probR[i] << "\t" << probG[i] << "\t" << probB[i] << "\n";
}

double entropyR = 0.0;
double entropyG = 0.0;
double entropyB = 0.0;
for (int i = 0; i < numBins; ++i) {
entropyR += probR[i]*log(probR[i]);
entropyG += probG[i]*log(probG[i]);
entropyB += probB[i]*log(probB[i]);
}
cout << frame_number << "\t" << (-1.0)*(entropyR + entropyG + entropyB) << endl;
}
c = cvWaitKey(1000/fps);
if (c == 27)
break;
}
//cvReleaseImage(&img);
cvReleaseCapture(&capture);
cvDestroyWindow("Video");
return 0;
}

输出:

.
.
254 -1.#IND
255 -1.#IND
256 -1.#IND
257 -1.#IND
258 5.5686
.
.

我首先找到了图像熵,结果是正确的。但视频中将近 80% 的帧熵为 -1.#IND

这是视频.... download

可能出了什么问题?

最佳答案

对于某些 iprob[i] = 0 可能是这种情况,因此您正在计算 log(0),它是不明确的。要解决这个问题,您只需丢弃此类“概率”:

for (int i = 0; i < numBins; ++i) {
if (prob[i])
entropy += prob[i]*log(prob[i]);
}

对于您在 bin 255 中发现的有关 0 值的其他错误,这是由于您指定的范围造成的。 OpenCV 将相关函数的范围视为 [start, end),因此指定 [0, 255) 的范围将忽略 255 的结束值。您想要的是同时保留 0 和 255,因此:

float range[] = {0, numBins};

关于.net - 在 opencv 中查找视频帧的熵时出现奇怪的输出,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/13920828/

26 4 0
Copyright 2021 - 2024 cfsdn All Rights Reserved 蜀ICP备2022000587号
广告合作:1813099741@qq.com 6ren.com