c9cdae001 fix(toxav): remove extra copy of video frame on encode 4f6d4546b test: Improve the fake network library. a2581e700 refactor(toxcore): generate `Friend_Request` and `Dht_Nodes_Response` 2aaa11770 refactor(toxcore): use Tox_Memory in generated events 5c367452b test(toxcore): fix incorrect mutex in tox_scenario_get_time 8f92e710f perf: Add a timed limit of number of cookie requests. 695b6417a test: Add some more simulated network support. 815ae9ce9 test(toxcore): fix thread-safety in scenario framework 6d85c754e test(toxcore): add unit tests for net_crypto 9c22e79cc test(support): add SimulatedEnvironment for deterministic testing f34fcb195 chore: Update windows Dockerfile to debian stable (trixie). ece0e8980 fix(group_moderation): allow validating unsorted sanction list signatures a4fa754d7 refactor: rename struct Packet to struct Net_Packet d6f330f85 cleanup: Fix some warnings from coverity. e206bffa2 fix(group_chats): fix sync packets reverting topics 0e4715598 test: Add new scenario testing framework. 668291f44 refactor(toxcore): decouple Network_Funcs from sockaddr via IP_Port fc4396cef fix: potential division by zero in toxav and unsafe hex parsing 8e8b352ab refactor: Add nullable annotations to struct members. 7740bb421 refactor: decouple net_crypto from DHT 1936d4296 test: add benchmark for toxav audio and video 46bfdc2df fix: correct printf format specifiers for unsigned integers REVERT: 1828c5356 fix(toxav): remove extra copy of video frame on encode git-subtree-dir: external/toxcore/c-toxcore git-subtree-split: c9cdae001341e701fca980c9bb9febfeb95d2902
197 lines
6.5 KiB
C++
197 lines
6.5 KiB
C++
/* SPDX-License-Identifier: GPL-3.0-or-later
|
|
* Copyright © 2025 The TokTok team.
|
|
*/
|
|
|
|
#include <benchmark/benchmark.h>
|
|
|
|
#include <vector>
|
|
|
|
#include "../toxcore/logger.h"
|
|
#include "../toxcore/mono_time.h"
|
|
#include "../toxcore/os_memory.h"
|
|
#include "av_test_support.hh"
|
|
#include "rtp.h"
|
|
#include "video.h"
|
|
|
|
namespace {
|
|
|
|
class VideoBench : public benchmark::Fixture {
|
|
public:
|
|
void SetUp(const ::benchmark::State &state) override
|
|
{
|
|
const Memory *mem = os_memory();
|
|
log = logger_new(mem);
|
|
tm.t = 1000;
|
|
mono_time = mono_time_new(mem, mock_time_cb, &tm);
|
|
vc = vc_new(log, mono_time, 123, nullptr, nullptr);
|
|
|
|
width = static_cast<uint16_t>(state.range(0));
|
|
height = static_cast<uint16_t>(state.range(1));
|
|
// Use a standard bitrate for benchmarks
|
|
vc_reconfigure_encoder(vc, 2000, width, height, -1);
|
|
|
|
y.resize(static_cast<size_t>(width) * height);
|
|
u.resize((static_cast<size_t>(width) / 2) * (static_cast<size_t>(height) / 2));
|
|
v.resize((static_cast<size_t>(width) / 2) * (static_cast<size_t>(height) / 2));
|
|
|
|
rtp_mock.capture_packets = false; // Disable capturing for benchmarks
|
|
rtp_mock.auto_forward = true;
|
|
|
|
rtp_mock.recv_session = rtp_new(log, RTP_TYPE_VIDEO, mono_time, RtpMock::send_packet,
|
|
&rtp_mock, nullptr, nullptr, nullptr, vc, RtpMock::video_cb);
|
|
}
|
|
|
|
void TearDown(const ::benchmark::State &state) override
|
|
{
|
|
const Memory *mem = os_memory();
|
|
if (rtp_mock.recv_session) {
|
|
rtp_kill(log, rtp_mock.recv_session);
|
|
}
|
|
if (vc) {
|
|
vc_kill(vc);
|
|
}
|
|
if (mono_time) {
|
|
mono_time_free(mem, mono_time);
|
|
}
|
|
if (log) {
|
|
logger_kill(log);
|
|
}
|
|
}
|
|
|
|
Logger *log = nullptr;
|
|
Mono_Time *mono_time = nullptr;
|
|
MockTime tm;
|
|
VCSession *vc = nullptr;
|
|
RtpMock rtp_mock;
|
|
uint16_t width = 0, height = 0;
|
|
std::vector<uint8_t> y, u, v;
|
|
};
|
|
|
|
// Benchmark encoding a sequence of frames.
|
|
// Measures how the encoder performs as it builds up temporal state.
|
|
BENCHMARK_DEFINE_F(VideoBench, EncodeSequence)(benchmark::State &state)
|
|
{
|
|
int frame_index = 0;
|
|
// Pre-fill frames to avoid measuring fill_frame time
|
|
const int num_prefilled = 100;
|
|
std::vector<std::vector<uint8_t>> ys(num_prefilled, std::vector<uint8_t>(width * height));
|
|
std::vector<std::vector<uint8_t>> us(
|
|
num_prefilled, std::vector<uint8_t>((width / 2) * (height / 2)));
|
|
std::vector<std::vector<uint8_t>> vs(
|
|
num_prefilled, std::vector<uint8_t>((width / 2) * (height / 2)));
|
|
for (int i = 0; i < num_prefilled; ++i) {
|
|
fill_video_frame(width, height, i, ys[i], us[i], vs[i]);
|
|
}
|
|
|
|
for (auto _ : state) {
|
|
int idx = frame_index % num_prefilled;
|
|
// Force a keyframe every 100 frames to simulate real-world periodic keyframes
|
|
int flags = (frame_index % 100 == 0) ? VC_EFLAG_FORCE_KF : VC_EFLAG_NONE;
|
|
vc_encode(vc, width, height, ys[idx].data(), us[idx].data(), vs[idx].data(), flags);
|
|
vc_increment_frame_counter(vc);
|
|
|
|
uint8_t *pkt_data;
|
|
uint32_t pkt_size;
|
|
bool is_keyframe;
|
|
while (vc_get_cx_data(vc, &pkt_data, &pkt_size, &is_keyframe)) {
|
|
benchmark::DoNotOptimize(pkt_data);
|
|
benchmark::DoNotOptimize(pkt_size);
|
|
}
|
|
frame_index++;
|
|
}
|
|
}
|
|
|
|
BENCHMARK_REGISTER_F(VideoBench, EncodeSequence)
|
|
->Args({320, 240})
|
|
->Args({640, 480})
|
|
->Args({1280, 720})
|
|
->Args({1920, 1080});
|
|
|
|
// Benchmark decoding a sequence of frames.
|
|
// First pre-encodes a sequence, then measures decoding performance.
|
|
BENCHMARK_DEFINE_F(VideoBench, DecodeSequence)(benchmark::State &state)
|
|
{
|
|
const int num_frames = 100;
|
|
std::vector<std::vector<uint8_t>> encoded_frames(num_frames);
|
|
std::vector<bool> is_keyframe_list(num_frames);
|
|
|
|
// Pre-encode
|
|
for (int i = 0; i < num_frames; ++i) {
|
|
fill_video_frame(width, height, i, y, u, v);
|
|
int flags = (i == 0) ? VC_EFLAG_FORCE_KF : VC_EFLAG_NONE;
|
|
vc_encode(vc, width, height, y.data(), u.data(), v.data(), flags);
|
|
vc_increment_frame_counter(vc);
|
|
|
|
uint8_t *pkt_data;
|
|
uint32_t pkt_size;
|
|
bool is_kf;
|
|
while (vc_get_cx_data(vc, &pkt_data, &pkt_size, &is_kf)) {
|
|
encoded_frames[i].insert(encoded_frames[i].end(), pkt_data, pkt_data + pkt_size);
|
|
is_keyframe_list[i] = is_kf;
|
|
}
|
|
}
|
|
|
|
int frame_index = 0;
|
|
for (auto _ : state) {
|
|
int idx = frame_index % num_frames;
|
|
const auto &encoded_data = encoded_frames[idx];
|
|
rtp_send_data(log, rtp_mock.recv_session, encoded_data.data(),
|
|
static_cast<uint32_t>(encoded_data.size()), is_keyframe_list[idx]);
|
|
vc_iterate(vc);
|
|
frame_index++;
|
|
}
|
|
}
|
|
|
|
BENCHMARK_REGISTER_F(VideoBench, DecodeSequence)
|
|
->Args({320, 240})
|
|
->Args({640, 480})
|
|
->Args({1280, 720})
|
|
->Args({1920, 1080});
|
|
|
|
// Full end-to-end sequence benchmark (Encode -> RTP -> Decode)
|
|
BENCHMARK_DEFINE_F(VideoBench, FullSequence)(benchmark::State &state)
|
|
{
|
|
int frame_index = 0;
|
|
const int num_prefilled = 100;
|
|
std::vector<std::vector<uint8_t>> ys(num_prefilled, std::vector<uint8_t>(width * height));
|
|
std::vector<std::vector<uint8_t>> us(
|
|
num_prefilled, std::vector<uint8_t>((width / 2) * (height / 2)));
|
|
std::vector<std::vector<uint8_t>> vs(
|
|
num_prefilled, std::vector<uint8_t>((width / 2) * (height / 2)));
|
|
for (int i = 0; i < num_prefilled; ++i) {
|
|
fill_video_frame(width, height, i, ys[i], us[i], vs[i]);
|
|
}
|
|
|
|
for (auto _ : state) {
|
|
int idx = frame_index % num_prefilled;
|
|
int flags = (frame_index % 100 == 0) ? VC_EFLAG_FORCE_KF : VC_EFLAG_NONE;
|
|
vc_encode(vc, width, height, ys[idx].data(), us[idx].data(), vs[idx].data(), flags);
|
|
vc_increment_frame_counter(vc);
|
|
|
|
uint8_t *pkt_data;
|
|
uint32_t pkt_size;
|
|
bool is_keyframe = false;
|
|
// We need to collect all packets for the frame before sending to decoder
|
|
std::vector<uint8_t> frame_data;
|
|
while (vc_get_cx_data(vc, &pkt_data, &pkt_size, &is_keyframe)) {
|
|
frame_data.insert(frame_data.end(), pkt_data, pkt_data + pkt_size);
|
|
}
|
|
|
|
rtp_send_data(log, rtp_mock.recv_session, frame_data.data(),
|
|
static_cast<uint32_t>(frame_data.size()), is_keyframe);
|
|
vc_iterate(vc);
|
|
|
|
frame_index++;
|
|
}
|
|
}
|
|
|
|
BENCHMARK_REGISTER_F(VideoBench, FullSequence)
|
|
->Args({320, 240})
|
|
->Args({640, 480})
|
|
->Args({1280, 720})
|
|
->Args({1920, 1080});
|
|
|
|
}
|
|
|
|
BENCHMARK_MAIN();
|