Revert "Update video_quality_analysis to align videos instead of using barcodes"
This reverts commit d65e143801a7aaa9affdb939ea836aec1955cdcc. Reason for revert: Breaks perf bots. frame_analyzer is a prebuilt binary, so it won't automatically pick up changes in the .cc file. Original change's description: > Update video_quality_analysis to align videos instead of using barcodes > > This CL is a follow-up to the previous CL > https://webrtc-review.googlesource.com/c/src/+/94773 that added generic > logic for aligning videos. This will allow us to easily extend > video_quality_analysis with new sophisticated video quality metrics. > Also, we can use any kind of video that does not necessarily need to > contain bar codes. Removing the need to decode barcodes also leads to a > big speedup for the tests. > > Bug: webrtc:9642 > Change-Id: I74b0d630b3e1ed44781ad024115ded3143e28f50 > Reviewed-on: https://webrtc-review.googlesource.com/94845 > Reviewed-by: Paulina Hensman <phensman@webrtc.org> > Reviewed-by: Patrik Höglund <phoglund@webrtc.org> > Commit-Queue: Magnus Jedvert <magjed@webrtc.org> > Cr-Commit-Position: refs/heads/master@{#24423} TBR=phoglund@webrtc.org,magjed@webrtc.org,phensman@webrtc.org Change-Id: Ia590b465687b861fe37ed1b14756d4607ca90da1 No-Presubmit: true No-Tree-Checks: true No-Try: true Bug: webrtc:9642 Reviewed-on: https://webrtc-review.googlesource.com/95946 Reviewed-by: Magnus Jedvert <magjed@webrtc.org> Commit-Queue: Magnus Jedvert <magjed@webrtc.org> Cr-Commit-Position: refs/heads/master@{#24428}
This commit is contained in:
committed by
Commit Bot
parent
a1cceca02c
commit
3e169ac18c
@ -10,19 +10,87 @@
|
||||
|
||||
#include "rtc_tools/frame_analyzer/video_quality_analysis.h"
|
||||
|
||||
#include <assert.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <algorithm>
|
||||
#include <numeric>
|
||||
#include <map>
|
||||
#include <string>
|
||||
#include <utility>
|
||||
|
||||
#include "test/testsupport/perf_test.h"
|
||||
#include "third_party/libyuv/include/libyuv/compare.h"
|
||||
#include "third_party/libyuv/include/libyuv/convert.h"
|
||||
|
||||
#define STATS_LINE_LENGTH 32
|
||||
|
||||
namespace webrtc {
|
||||
namespace test {
|
||||
|
||||
ResultsContainer::ResultsContainer() {}
|
||||
ResultsContainer::~ResultsContainer() {}
|
||||
|
||||
int GetI420FrameSize(int width, int height) {
|
||||
int half_width = (width + 1) >> 1;
|
||||
int half_height = (height + 1) >> 1;
|
||||
|
||||
int y_plane = width * height; // I420 Y plane.
|
||||
int u_plane = half_width * half_height; // I420 U plane.
|
||||
int v_plane = half_width * half_height; // I420 V plane.
|
||||
|
||||
return y_plane + u_plane + v_plane;
|
||||
}
|
||||
|
||||
int ExtractFrameSequenceNumber(std::string line) {
|
||||
size_t space_position = line.find(' ');
|
||||
if (space_position == std::string::npos) {
|
||||
return -1;
|
||||
}
|
||||
std::string frame = line.substr(0, space_position);
|
||||
|
||||
size_t underscore_position = frame.find('_');
|
||||
if (underscore_position == std::string::npos) {
|
||||
return -1;
|
||||
}
|
||||
std::string frame_number = frame.substr(underscore_position + 1);
|
||||
|
||||
return strtol(frame_number.c_str(), NULL, 10);
|
||||
}
|
||||
|
||||
int ExtractDecodedFrameNumber(std::string line) {
|
||||
size_t space_position = line.find(' ');
|
||||
if (space_position == std::string::npos) {
|
||||
return -1;
|
||||
}
|
||||
std::string decoded_number = line.substr(space_position + 1);
|
||||
|
||||
return strtol(decoded_number.c_str(), NULL, 10);
|
||||
}
|
||||
|
||||
bool IsThereBarcodeError(std::string line) {
|
||||
size_t barcode_error_position = line.find("Barcode error");
|
||||
if (barcode_error_position != std::string::npos) {
|
||||
return true;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
bool GetNextStatsLine(FILE* stats_file, char* line) {
|
||||
int chars = 0;
|
||||
char buf = 0;
|
||||
|
||||
while (buf != '\n') {
|
||||
size_t chars_read = fread(&buf, 1, 1, stats_file);
|
||||
if (chars_read != 1 || feof(stats_file)) {
|
||||
return false;
|
||||
}
|
||||
line[chars] = buf;
|
||||
++chars;
|
||||
}
|
||||
line[chars - 1] = '\0'; // Strip the trailing \n and put end of string.
|
||||
return true;
|
||||
}
|
||||
|
||||
template <typename FrameMetricFunction>
|
||||
static double CalculateMetric(
|
||||
const FrameMetricFunction& frame_metric_function,
|
||||
@ -51,69 +119,225 @@ double Ssim(const rtc::scoped_refptr<I420BufferInterface>& ref_buffer,
|
||||
return CalculateMetric(&libyuv::I420Ssim, ref_buffer, test_buffer);
|
||||
}
|
||||
|
||||
std::vector<AnalysisResult> RunAnalysis(
|
||||
const rtc::scoped_refptr<webrtc::test::Video>& reference_video,
|
||||
const rtc::scoped_refptr<webrtc::test::Video>& test_video,
|
||||
const std::vector<size_t>& test_frame_indices) {
|
||||
std::vector<AnalysisResult> results;
|
||||
for (size_t i = 0; i < test_frame_indices.size(); ++i) {
|
||||
// Ignore duplicated frames in the test video.
|
||||
if (i > 0 && test_frame_indices[i] == test_frame_indices[i - 1])
|
||||
continue;
|
||||
void RunAnalysis(const rtc::scoped_refptr<webrtc::test::Video>& reference_video,
|
||||
const rtc::scoped_refptr<webrtc::test::Video>& test_video,
|
||||
const char* stats_file_reference_name,
|
||||
const char* stats_file_test_name,
|
||||
int width,
|
||||
int height,
|
||||
ResultsContainer* results) {
|
||||
FILE* stats_file_ref = fopen(stats_file_reference_name, "r");
|
||||
FILE* stats_file_test = fopen(stats_file_test_name, "r");
|
||||
|
||||
const rtc::scoped_refptr<I420BufferInterface>& test_frame =
|
||||
test_video->GetFrame(i);
|
||||
const rtc::scoped_refptr<I420BufferInterface>& reference_frame =
|
||||
reference_video->GetFrame(test_frame_indices[i] %
|
||||
reference_video->number_of_frames());
|
||||
// String buffer for the lines in the stats file.
|
||||
char line[STATS_LINE_LENGTH];
|
||||
|
||||
int previous_frame_number = -1;
|
||||
|
||||
// Maps barcode id to the frame id for the reference video.
|
||||
// In case two frames have same id, then we only save the first one.
|
||||
std::map<int, int> ref_barcode_to_frame;
|
||||
// While there are entries in the stats file.
|
||||
while (GetNextStatsLine(stats_file_ref, line)) {
|
||||
int extracted_ref_frame = ExtractFrameSequenceNumber(line);
|
||||
int decoded_frame_number = ExtractDecodedFrameNumber(line);
|
||||
|
||||
// Insert will only add if it is not in map already.
|
||||
ref_barcode_to_frame.insert(
|
||||
std::make_pair(decoded_frame_number, extracted_ref_frame));
|
||||
}
|
||||
|
||||
while (GetNextStatsLine(stats_file_test, line)) {
|
||||
int extracted_test_frame = ExtractFrameSequenceNumber(line);
|
||||
int decoded_frame_number = ExtractDecodedFrameNumber(line);
|
||||
auto it = ref_barcode_to_frame.find(decoded_frame_number);
|
||||
if (it == ref_barcode_to_frame.end()) {
|
||||
// Not found in the reference video.
|
||||
// TODO(mandermo) print
|
||||
continue;
|
||||
}
|
||||
int extracted_ref_frame = it->second;
|
||||
|
||||
// If there was problem decoding the barcode in this frame or the frame has
|
||||
// been duplicated, continue.
|
||||
if (IsThereBarcodeError(line) ||
|
||||
decoded_frame_number == previous_frame_number) {
|
||||
continue;
|
||||
}
|
||||
|
||||
assert(extracted_test_frame != -1);
|
||||
assert(decoded_frame_number != -1);
|
||||
|
||||
const rtc::scoped_refptr<webrtc::I420BufferInterface> test_frame =
|
||||
test_video->GetFrame(extracted_test_frame);
|
||||
const rtc::scoped_refptr<webrtc::I420BufferInterface> reference_frame =
|
||||
reference_video->GetFrame(extracted_ref_frame);
|
||||
|
||||
// Calculate the PSNR and SSIM.
|
||||
double result_psnr = Psnr(reference_frame, test_frame);
|
||||
double result_ssim = Ssim(reference_frame, test_frame);
|
||||
|
||||
previous_frame_number = decoded_frame_number;
|
||||
|
||||
// Fill in the result struct.
|
||||
AnalysisResult result;
|
||||
result.frame_number = test_frame_indices[i];
|
||||
result.psnr_value = Psnr(reference_frame, test_frame);
|
||||
result.ssim_value = Ssim(reference_frame, test_frame);
|
||||
results.push_back(result);
|
||||
result.frame_number = decoded_frame_number;
|
||||
result.psnr_value = result_psnr;
|
||||
result.ssim_value = result_ssim;
|
||||
|
||||
results->frames.push_back(result);
|
||||
}
|
||||
|
||||
return results;
|
||||
// Cleanup.
|
||||
fclose(stats_file_ref);
|
||||
fclose(stats_file_test);
|
||||
}
|
||||
|
||||
std::vector<Cluster> CalculateFrameClusters(
|
||||
const std::vector<size_t>& indices) {
|
||||
std::vector<Cluster> clusters;
|
||||
for (size_t i = 0; i < indices.size(); ++i) {
|
||||
const size_t start_index = i;
|
||||
while (i < indices.size() && indices[i] == indices[start_index])
|
||||
++i;
|
||||
const int number_of_repeated_frames = static_cast<int>(i - start_index);
|
||||
clusters.push_back({indices[start_index], number_of_repeated_frames});
|
||||
std::vector<std::pair<int, int> > CalculateFrameClusters(
|
||||
FILE* file,
|
||||
int* num_decode_errors) {
|
||||
if (num_decode_errors) {
|
||||
*num_decode_errors = 0;
|
||||
}
|
||||
return clusters;
|
||||
}
|
||||
|
||||
int GetMaxRepeatedFrames(const std::vector<Cluster>& clusters) {
|
||||
int max_number_of_repeated_frames = 0;
|
||||
for (const Cluster& cluster : clusters) {
|
||||
max_number_of_repeated_frames = std::max(max_number_of_repeated_frames,
|
||||
cluster.number_of_repeated_frames);
|
||||
std::vector<std::pair<int, int> > frame_cnt;
|
||||
char line[STATS_LINE_LENGTH];
|
||||
while (GetNextStatsLine(file, line)) {
|
||||
int decoded_frame_number;
|
||||
if (IsThereBarcodeError(line)) {
|
||||
decoded_frame_number = DECODE_ERROR;
|
||||
if (num_decode_errors) {
|
||||
++*num_decode_errors;
|
||||
}
|
||||
} else {
|
||||
decoded_frame_number = ExtractDecodedFrameNumber(line);
|
||||
}
|
||||
if (frame_cnt.size() >= 2 && decoded_frame_number != DECODE_ERROR &&
|
||||
frame_cnt.back().first == DECODE_ERROR &&
|
||||
frame_cnt[frame_cnt.size() - 2].first == decoded_frame_number) {
|
||||
// Handle when there is a decoding error inside a cluster of frames.
|
||||
frame_cnt[frame_cnt.size() - 2].second += frame_cnt.back().second + 1;
|
||||
frame_cnt.pop_back();
|
||||
} else if (frame_cnt.empty() ||
|
||||
frame_cnt.back().first != decoded_frame_number) {
|
||||
frame_cnt.push_back(std::make_pair(decoded_frame_number, 1));
|
||||
} else {
|
||||
++frame_cnt.back().second;
|
||||
}
|
||||
}
|
||||
return max_number_of_repeated_frames;
|
||||
return frame_cnt;
|
||||
}
|
||||
|
||||
int GetMaxSkippedFrames(const std::vector<Cluster>& clusters) {
|
||||
size_t max_skipped_frames = 0;
|
||||
for (size_t i = 1; i < clusters.size(); ++i) {
|
||||
const size_t skipped_frames = clusters[i].index - clusters[i - 1].index - 1;
|
||||
max_skipped_frames = std::max(max_skipped_frames, skipped_frames);
|
||||
void GetMaxRepeatedAndSkippedFrames(const std::string& stats_file_ref_name,
|
||||
const std::string& stats_file_test_name,
|
||||
ResultsContainer* results) {
|
||||
FILE* stats_file_ref = fopen(stats_file_ref_name.c_str(), "r");
|
||||
FILE* stats_file_test = fopen(stats_file_test_name.c_str(), "r");
|
||||
if (stats_file_ref == NULL) {
|
||||
fprintf(stderr, "Couldn't open reference stats file for reading: %s\n",
|
||||
stats_file_ref_name.c_str());
|
||||
return;
|
||||
}
|
||||
if (stats_file_test == NULL) {
|
||||
fprintf(stderr, "Couldn't open test stats file for reading: %s\n",
|
||||
stats_file_test_name.c_str());
|
||||
fclose(stats_file_ref);
|
||||
return;
|
||||
}
|
||||
return static_cast<int>(max_skipped_frames);
|
||||
}
|
||||
|
||||
int GetTotalNumberOfSkippedFrames(const std::vector<Cluster>& clusters) {
|
||||
// The number of reference frames the test video spans.
|
||||
const size_t number_ref_frames =
|
||||
clusters.empty() ? 0 : 1 + clusters.back().index - clusters.front().index;
|
||||
return static_cast<int>(number_ref_frames - clusters.size());
|
||||
int max_repeated_frames = 1;
|
||||
int max_skipped_frames = 0;
|
||||
|
||||
int decode_errors_ref = 0;
|
||||
int decode_errors_test = 0;
|
||||
|
||||
std::vector<std::pair<int, int> > frame_cnt_ref =
|
||||
CalculateFrameClusters(stats_file_ref, &decode_errors_ref);
|
||||
|
||||
std::vector<std::pair<int, int> > frame_cnt_test =
|
||||
CalculateFrameClusters(stats_file_test, &decode_errors_test);
|
||||
|
||||
fclose(stats_file_ref);
|
||||
fclose(stats_file_test);
|
||||
|
||||
auto it_ref = frame_cnt_ref.begin();
|
||||
auto it_test = frame_cnt_test.begin();
|
||||
auto end_ref = frame_cnt_ref.end();
|
||||
auto end_test = frame_cnt_test.end();
|
||||
|
||||
if (it_test == end_test || it_ref == end_ref) {
|
||||
fprintf(stderr, "Either test or ref file is empty, nothing to print\n");
|
||||
return;
|
||||
}
|
||||
|
||||
while (it_test != end_test && it_test->first == DECODE_ERROR) {
|
||||
++it_test;
|
||||
}
|
||||
|
||||
if (it_test == end_test) {
|
||||
fprintf(stderr, "Test video only has barcode decode errors\n");
|
||||
return;
|
||||
}
|
||||
|
||||
// Find the first frame in the reference video that match the first frame in
|
||||
// the test video.
|
||||
while (it_ref != end_ref &&
|
||||
(it_ref->first == DECODE_ERROR || it_ref->first != it_test->first)) {
|
||||
++it_ref;
|
||||
}
|
||||
if (it_ref == end_ref) {
|
||||
fprintf(stderr,
|
||||
"The barcode in the test video's first frame is not in the "
|
||||
"reference video.\n");
|
||||
return;
|
||||
}
|
||||
|
||||
int total_skipped_frames = 0;
|
||||
for (;;) {
|
||||
max_repeated_frames =
|
||||
std::max(max_repeated_frames, it_test->second - it_ref->second + 1);
|
||||
|
||||
bool passed_error = false;
|
||||
|
||||
++it_test;
|
||||
while (it_test != end_test && it_test->first == DECODE_ERROR) {
|
||||
++it_test;
|
||||
passed_error = true;
|
||||
}
|
||||
if (it_test == end_test) {
|
||||
break;
|
||||
}
|
||||
|
||||
int skipped_frames = 0;
|
||||
++it_ref;
|
||||
for (; it_ref != end_ref; ++it_ref) {
|
||||
if (it_ref->first != DECODE_ERROR && it_ref->first >= it_test->first) {
|
||||
break;
|
||||
}
|
||||
++skipped_frames;
|
||||
}
|
||||
if (passed_error) {
|
||||
// If we pass an error in the test video, then we are conservative
|
||||
// and will not calculate skipped frames for that part.
|
||||
skipped_frames = 0;
|
||||
}
|
||||
if (it_ref != end_ref && it_ref->first == it_test->first) {
|
||||
total_skipped_frames += skipped_frames;
|
||||
if (skipped_frames > max_skipped_frames) {
|
||||
max_skipped_frames = skipped_frames;
|
||||
}
|
||||
continue;
|
||||
}
|
||||
fprintf(stdout,
|
||||
"Found barcode %d in test video, which is not in reference video\n",
|
||||
it_test->first);
|
||||
break;
|
||||
}
|
||||
|
||||
results->max_repeated_frames = max_repeated_frames;
|
||||
results->max_skipped_frames = max_skipped_frames;
|
||||
results->total_skipped_frames = total_skipped_frames;
|
||||
results->decode_errors_ref = decode_errors_ref;
|
||||
results->decode_errors_test = decode_errors_test;
|
||||
}
|
||||
|
||||
void PrintAnalysisResults(const std::string& label, ResultsContainer* results) {
|
||||
|
||||
Reference in New Issue
Block a user