forked from Green-Sky/tomato
cae0ab9c5c
55752a2e2ef fix(toxav): pass video bit rate as kbit Previously we unintentionally made it Mbit. 7e573280a75 docs(toxav): fix docs of toxav.h - fix units to be more readable - use width before height consistently - video -> audio typo 5f88a084e8c fix: friend_connections leak on allocation failure clean up when it only contains connections in the NONE state 6d27a1ae178 fix: wrong comment for closelist ce4f29e8036 cleanup: Fix all `-Wsign-compare` warnings. 4d4251c397f chore: lower cirrus ci timeout drastically 40676284507 fix: events leak that can occur if allocation fails rare in practice, found by fuzzing 9610ac31c5f fix: Return an error instead of crashing on nullptr args in NGC. a57c2c8f956 refactor: Make ToxAV independent of toxcore internals. 5752fc29f86 refactor: Make tox-bootstrapd use bool instead of int df675786eb2 chore: Add release-drafter github action. 03fd7a69dcf chore: Use toktok's cmp instead of upstream. 350c0ba1205 cleanup: Sort apk/apt install commands in Dockerfiles. 8c1bda502cb chore(deps): bump golang.org/x/net ddb9d3210da chore: Upgrade to FreeBSD 14.1 in cirrus build. e9076f45bd3 chore(cmake): set options changes as cache and with force git-subtree-dir: external/toxcore/c-toxcore git-subtree-split: 55752a2e2ef894bfa6d7a2a21a0278e3f2bede7d
451 lines
15 KiB
C
451 lines
15 KiB
C
/* SPDX-License-Identifier: GPL-3.0-or-later
|
|
* Copyright © 2016-2018 The TokTok team.
|
|
* Copyright © 2013-2015 Tox project.
|
|
*/
|
|
#include "video.h"
|
|
|
|
#include <assert.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#include "msi.h"
|
|
#include "ring_buffer.h"
|
|
#include "rtp.h"
|
|
|
|
#include "../toxcore/ccompat.h"
|
|
#include "../toxcore/logger.h"
|
|
#include "../toxcore/mono_time.h"
|
|
#include "../toxcore/network.h"
|
|
|
|
/**
|
|
* Soft deadline the decoder should attempt to meet, in "us" (microseconds).
|
|
* Set to zero for unlimited.
|
|
*
|
|
* By convention, the value 1 is used to mean "return as fast as possible."
|
|
*/
|
|
// TODO(zoff99): don't hardcode this, let the application choose it
|
|
#define WANTED_MAX_DECODER_FPS 40
|
|
|
|
/**
|
|
* VPX_DL_REALTIME (1)
|
|
* deadline parameter analogous to VPx REALTIME mode.
|
|
*
|
|
* VPX_DL_GOOD_QUALITY (1000000)
|
|
* deadline parameter analogous to VPx GOOD QUALITY mode.
|
|
*
|
|
* VPX_DL_BEST_QUALITY (0)
|
|
* deadline parameter analogous to VPx BEST QUALITY mode.
|
|
*/
|
|
#define MAX_DECODE_TIME_US (1000000 / WANTED_MAX_DECODER_FPS) // to allow x fps
|
|
|
|
/**
|
|
* Codec control function to set encoder internal speed settings. Changes in
|
|
* this value influences, among others, the encoder's selection of motion
|
|
* estimation methods. Values greater than 0 will increase encoder speed at the
|
|
* expense of quality.
|
|
*
|
|
* Note Valid range for VP8: `-16..16`
|
|
*/
|
|
#define VP8E_SET_CPUUSED_VALUE 16
|
|
|
|
/**
|
|
* Initialize encoder with this value.
|
|
*
|
|
* Target bandwidth to use for this stream, in kilobits per second.
|
|
*/
|
|
#define VIDEO_BITRATE_INITIAL_VALUE 5000
|
|
#define VIDEO_DECODE_BUFFER_SIZE 5 // this buffer has normally max. 1 entry
|
|
|
|
static vpx_codec_iface_t *video_codec_decoder_interface(void)
|
|
{
|
|
return vpx_codec_vp8_dx();
|
|
}
|
|
static vpx_codec_iface_t *video_codec_encoder_interface(void)
|
|
{
|
|
return vpx_codec_vp8_cx();
|
|
}
|
|
|
|
#define VIDEO_CODEC_DECODER_MAX_WIDTH 800 // its a dummy value, because the struct needs a value there
|
|
#define VIDEO_CODEC_DECODER_MAX_HEIGHT 600 // its a dummy value, because the struct needs a value there
|
|
|
|
#define VPX_MAX_DIST_START 40
|
|
|
|
#define VPX_MAX_ENCODER_THREADS 4
|
|
#define VPX_MAX_DECODER_THREADS 4
|
|
#define VIDEO_VP8_DECODER_POST_PROCESSING_ENABLED 0
|
|
|
|
static void vc_init_encoder_cfg(const Logger *log, vpx_codec_enc_cfg_t *cfg, int16_t kf_max_dist)
|
|
{
|
|
const vpx_codec_err_t rc = vpx_codec_enc_config_default(video_codec_encoder_interface(), cfg, 0);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(log, "vc_init_encoder_cfg:Failed to get config: %s", vpx_codec_err_to_string(rc));
|
|
}
|
|
|
|
/* Target bandwidth to use for this stream, in kilobits per second */
|
|
cfg->rc_target_bitrate = VIDEO_BITRATE_INITIAL_VALUE;
|
|
cfg->g_w = VIDEO_CODEC_DECODER_MAX_WIDTH;
|
|
cfg->g_h = VIDEO_CODEC_DECODER_MAX_HEIGHT;
|
|
cfg->g_pass = VPX_RC_ONE_PASS;
|
|
cfg->g_error_resilient = VPX_ERROR_RESILIENT_DEFAULT | VPX_ERROR_RESILIENT_PARTITIONS;
|
|
cfg->g_lag_in_frames = 0;
|
|
|
|
/* Allow lagged encoding
|
|
*
|
|
* If set, this value allows the encoder to consume a number of input
|
|
* frames before producing output frames. This allows the encoder to
|
|
* base decisions for the current frame on future frames. This does
|
|
* increase the latency of the encoding pipeline, so it is not appropriate
|
|
* in all situations (ex: realtime encoding).
|
|
*
|
|
* Note that this is a maximum value -- the encoder may produce frames
|
|
* sooner than the given limit. Set this value to 0 to disable this
|
|
* feature.
|
|
*/
|
|
cfg->kf_min_dist = 0;
|
|
cfg->kf_mode = VPX_KF_AUTO; // Encoder determines optimal placement automatically
|
|
cfg->rc_end_usage = VPX_VBR; // what quality mode?
|
|
|
|
/*
|
|
* VPX_VBR Variable Bit Rate (VBR) mode
|
|
* VPX_CBR Constant Bit Rate (CBR) mode
|
|
* VPX_CQ Constrained Quality (CQ) mode -> give codec a hint that we may be on low bandwidth connection
|
|
* VPX_Q Constant Quality (Q) mode
|
|
*/
|
|
if (kf_max_dist > 1) {
|
|
cfg->kf_max_dist = kf_max_dist; // a full frame every x frames minimum (can be more often, codec decides automatically)
|
|
LOGGER_DEBUG(log, "kf_max_dist=%d (1)", cfg->kf_max_dist);
|
|
} else {
|
|
cfg->kf_max_dist = VPX_MAX_DIST_START;
|
|
LOGGER_DEBUG(log, "kf_max_dist=%d (2)", cfg->kf_max_dist);
|
|
}
|
|
|
|
cfg->g_threads = VPX_MAX_ENCODER_THREADS; // Maximum number of threads to use
|
|
/* TODO: set these to something reasonable */
|
|
// cfg->g_timebase.num = 1;
|
|
// cfg->g_timebase.den = 60; // 60 fps
|
|
cfg->rc_resize_allowed = 1; // allow encoder to resize to smaller resolution
|
|
cfg->rc_resize_up_thresh = 40;
|
|
cfg->rc_resize_down_thresh = 5;
|
|
|
|
/* TODO: make quality setting an API call, but start with normal quality */
|
|
#if 0
|
|
/* Highest-resolution encoder settings */
|
|
cfg->rc_dropframe_thresh = 0;
|
|
cfg->rc_resize_allowed = 0;
|
|
cfg->rc_min_quantizer = 2;
|
|
cfg->rc_max_quantizer = 56;
|
|
cfg->rc_undershoot_pct = 100;
|
|
cfg->rc_overshoot_pct = 15;
|
|
cfg->rc_buf_initial_sz = 500;
|
|
cfg->rc_buf_optimal_sz = 600;
|
|
cfg->rc_buf_sz = 1000;
|
|
#endif /* 0 */
|
|
}
|
|
|
|
VCSession *vc_new(const Logger *log, Mono_Time *mono_time, ToxAV *av, uint32_t friend_number,
|
|
toxav_video_receive_frame_cb *cb, void *cb_data)
|
|
{
|
|
VCSession *vc = (VCSession *)calloc(1, sizeof(VCSession));
|
|
vpx_codec_err_t rc;
|
|
|
|
if (vc == nullptr) {
|
|
LOGGER_WARNING(log, "Allocation failed! Application might misbehave!");
|
|
return nullptr;
|
|
}
|
|
|
|
if (create_recursive_mutex(vc->queue_mutex) != 0) {
|
|
LOGGER_WARNING(log, "Failed to create recursive mutex!");
|
|
free(vc);
|
|
return nullptr;
|
|
}
|
|
|
|
const int cpu_used_value = VP8E_SET_CPUUSED_VALUE;
|
|
|
|
vc->vbuf_raw = rb_new(VIDEO_DECODE_BUFFER_SIZE);
|
|
|
|
if (vc->vbuf_raw == nullptr) {
|
|
goto BASE_CLEANUP;
|
|
}
|
|
|
|
/*
|
|
* VPX_CODEC_USE_FRAME_THREADING
|
|
* Enable frame-based multi-threading
|
|
*
|
|
* VPX_CODEC_USE_ERROR_CONCEALMENT
|
|
* Conceal errors in decoded frames
|
|
*/
|
|
vpx_codec_dec_cfg_t dec_cfg;
|
|
dec_cfg.threads = VPX_MAX_DECODER_THREADS; // Maximum number of threads to use
|
|
dec_cfg.w = VIDEO_CODEC_DECODER_MAX_WIDTH;
|
|
dec_cfg.h = VIDEO_CODEC_DECODER_MAX_HEIGHT;
|
|
|
|
LOGGER_DEBUG(log, "Using VP8 codec for decoder (0)");
|
|
rc = vpx_codec_dec_init(vc->decoder, video_codec_decoder_interface(), &dec_cfg,
|
|
VPX_CODEC_USE_FRAME_THREADING | VPX_CODEC_USE_POSTPROC);
|
|
|
|
if (rc == VPX_CODEC_INCAPABLE) {
|
|
LOGGER_WARNING(log, "Postproc not supported by this decoder (0)");
|
|
rc = vpx_codec_dec_init(vc->decoder, video_codec_decoder_interface(), &dec_cfg, VPX_CODEC_USE_FRAME_THREADING);
|
|
}
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(log, "Init video_decoder failed: %s", vpx_codec_err_to_string(rc));
|
|
goto BASE_CLEANUP;
|
|
}
|
|
|
|
if (VIDEO_VP8_DECODER_POST_PROCESSING_ENABLED == 1) {
|
|
vp8_postproc_cfg_t pp = {VP8_DEBLOCK, 1, 0};
|
|
const vpx_codec_err_t cc_res = vpx_codec_control(vc->decoder, VP8_SET_POSTPROC, &pp);
|
|
|
|
if (cc_res != VPX_CODEC_OK) {
|
|
LOGGER_WARNING(log, "Failed to turn on postproc");
|
|
} else {
|
|
LOGGER_DEBUG(log, "turn on postproc: OK");
|
|
}
|
|
} else {
|
|
vp8_postproc_cfg_t pp = {0, 0, 0};
|
|
vpx_codec_err_t cc_res = vpx_codec_control(vc->decoder, VP8_SET_POSTPROC, &pp);
|
|
|
|
if (cc_res != VPX_CODEC_OK) {
|
|
LOGGER_WARNING(log, "Failed to turn OFF postproc");
|
|
} else {
|
|
LOGGER_DEBUG(log, "Disable postproc: OK");
|
|
}
|
|
}
|
|
|
|
/* Set encoder to some initial values
|
|
*/
|
|
vpx_codec_enc_cfg_t cfg;
|
|
vc_init_encoder_cfg(log, &cfg, 1);
|
|
|
|
LOGGER_DEBUG(log, "Using VP8 codec for encoder (0.1)");
|
|
rc = vpx_codec_enc_init(vc->encoder, video_codec_encoder_interface(), &cfg, VPX_CODEC_USE_FRAME_THREADING);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(log, "Failed to initialize encoder: %s", vpx_codec_err_to_string(rc));
|
|
goto BASE_CLEANUP_1;
|
|
}
|
|
|
|
rc = vpx_codec_control(vc->encoder, VP8E_SET_CPUUSED, cpu_used_value);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(log, "Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
vpx_codec_destroy(vc->encoder);
|
|
goto BASE_CLEANUP_1;
|
|
}
|
|
|
|
/*
|
|
* VPX_CTRL_USE_TYPE(VP8E_SET_NOISE_SENSITIVITY, unsigned int)
|
|
* control function to set noise sensitivity
|
|
* 0: off, 1: OnYOnly, 2: OnYUV, 3: OnYUVAggressive, 4: Adaptive
|
|
*/
|
|
#if 0
|
|
rc = vpx_codec_control(vc->encoder, VP8E_SET_NOISE_SENSITIVITY, 2);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(log, "Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
vpx_codec_destroy(vc->encoder);
|
|
goto BASE_CLEANUP_1;
|
|
}
|
|
|
|
#endif /* 0 */
|
|
|
|
vc->linfts = current_time_monotonic(mono_time);
|
|
vc->lcfd = 60;
|
|
vc->vcb = cb;
|
|
vc->vcb_user_data = cb_data;
|
|
vc->friend_number = friend_number;
|
|
vc->av = av;
|
|
vc->log = log;
|
|
return vc;
|
|
|
|
BASE_CLEANUP_1:
|
|
vpx_codec_destroy(vc->decoder);
|
|
BASE_CLEANUP:
|
|
pthread_mutex_destroy(vc->queue_mutex);
|
|
rb_kill(vc->vbuf_raw);
|
|
free(vc);
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
void vc_kill(VCSession *vc)
|
|
{
|
|
if (vc == nullptr) {
|
|
return;
|
|
}
|
|
|
|
vpx_codec_destroy(vc->encoder);
|
|
vpx_codec_destroy(vc->decoder);
|
|
void *p;
|
|
|
|
while (rb_read(vc->vbuf_raw, &p)) {
|
|
free(p);
|
|
}
|
|
|
|
rb_kill(vc->vbuf_raw);
|
|
pthread_mutex_destroy(vc->queue_mutex);
|
|
LOGGER_DEBUG(vc->log, "Terminated video handler: %p", (void *)vc);
|
|
free(vc);
|
|
}
|
|
|
|
void vc_iterate(VCSession *vc)
|
|
{
|
|
if (vc == nullptr) {
|
|
return;
|
|
}
|
|
|
|
pthread_mutex_lock(vc->queue_mutex);
|
|
|
|
struct RTPMessage *p;
|
|
|
|
if (!rb_read(vc->vbuf_raw, (void **)&p)) {
|
|
LOGGER_TRACE(vc->log, "no Video frame data available");
|
|
pthread_mutex_unlock(vc->queue_mutex);
|
|
return;
|
|
}
|
|
|
|
const uint16_t log_rb_size = rb_size(vc->vbuf_raw);
|
|
pthread_mutex_unlock(vc->queue_mutex);
|
|
const struct RTPHeader *const header = &p->header;
|
|
|
|
uint32_t full_data_len;
|
|
|
|
if ((header->flags & RTP_LARGE_FRAME) != 0) {
|
|
full_data_len = header->data_length_full;
|
|
LOGGER_DEBUG(vc->log, "vc_iterate:001:full_data_len=%d", (int)full_data_len);
|
|
} else {
|
|
full_data_len = p->len;
|
|
LOGGER_DEBUG(vc->log, "vc_iterate:002");
|
|
}
|
|
|
|
LOGGER_DEBUG(vc->log, "vc_iterate: rb_read p->len=%d p->header.xe=%d", (int)full_data_len, p->header.xe);
|
|
LOGGER_DEBUG(vc->log, "vc_iterate: rb_read rb size=%d", (int)log_rb_size);
|
|
const vpx_codec_err_t rc = vpx_codec_decode(vc->decoder, p->data, full_data_len, nullptr, MAX_DECODE_TIME_US);
|
|
free(p);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(vc->log, "Error decoding video: %d %s", (int)rc, vpx_codec_err_to_string(rc));
|
|
return;
|
|
}
|
|
|
|
/* Play decoded images */
|
|
vpx_codec_iter_t iter = nullptr;
|
|
|
|
for (vpx_image_t *dest = vpx_codec_get_frame(vc->decoder, &iter);
|
|
dest != nullptr;
|
|
dest = vpx_codec_get_frame(vc->decoder, &iter)) {
|
|
if (vc->vcb != nullptr) {
|
|
vc->vcb(vc->av, vc->friend_number, dest->d_w, dest->d_h,
|
|
dest->planes[0], dest->planes[1], dest->planes[2],
|
|
dest->stride[0], dest->stride[1], dest->stride[2], vc->vcb_user_data);
|
|
}
|
|
|
|
vpx_img_free(dest); // is this needed? none of the VPx examples show that
|
|
}
|
|
}
|
|
|
|
int vc_queue_message(Mono_Time *mono_time, void *cs, struct RTPMessage *msg)
|
|
{
|
|
VCSession *vc = (VCSession *)cs;
|
|
|
|
/* This function is called with complete messages
|
|
* they have already been assembled.
|
|
* this function gets called from handle_rtp_packet() and handle_rtp_packet_v3()
|
|
*/
|
|
if (vc == nullptr || msg == nullptr) {
|
|
free(msg);
|
|
|
|
return -1;
|
|
}
|
|
|
|
const struct RTPHeader *const header = &msg->header;
|
|
|
|
if (msg->header.pt == (RTP_TYPE_VIDEO + 2) % 128) {
|
|
LOGGER_WARNING(vc->log, "Got dummy!");
|
|
free(msg);
|
|
return 0;
|
|
}
|
|
|
|
if (msg->header.pt != RTP_TYPE_VIDEO % 128) {
|
|
LOGGER_WARNING(vc->log, "Invalid payload type! pt=%d", (int)msg->header.pt);
|
|
free(msg);
|
|
return -1;
|
|
}
|
|
|
|
pthread_mutex_lock(vc->queue_mutex);
|
|
|
|
if ((header->flags & RTP_LARGE_FRAME) != 0 && header->pt == RTP_TYPE_VIDEO % 128) {
|
|
LOGGER_DEBUG(vc->log, "rb_write msg->len=%d b0=%d b1=%d", (int)msg->len, (int)msg->data[0], (int)msg->data[1]);
|
|
}
|
|
|
|
free(rb_write(vc->vbuf_raw, msg));
|
|
|
|
/* Calculate time it took for peer to send us this frame */
|
|
const uint32_t t_lcfd = current_time_monotonic(mono_time) - vc->linfts;
|
|
vc->lcfd = t_lcfd > 100 ? vc->lcfd : t_lcfd;
|
|
vc->linfts = current_time_monotonic(mono_time);
|
|
pthread_mutex_unlock(vc->queue_mutex);
|
|
return 0;
|
|
}
|
|
|
|
int vc_reconfigure_encoder(VCSession *vc, uint32_t bit_rate, uint16_t width, uint16_t height, int16_t kf_max_dist)
|
|
{
|
|
if (vc == nullptr) {
|
|
return -1;
|
|
}
|
|
|
|
vpx_codec_enc_cfg_t cfg2 = *vc->encoder->config.enc;
|
|
|
|
if (cfg2.rc_target_bitrate == bit_rate && cfg2.g_w == width && cfg2.g_h == height && kf_max_dist == -1) {
|
|
return 0; /* Nothing changed */
|
|
}
|
|
|
|
if (cfg2.g_w == width && cfg2.g_h == height && kf_max_dist == -1) {
|
|
/* Only bit rate changed */
|
|
LOGGER_INFO(vc->log, "bitrate change from: %u to: %u", (uint32_t)cfg2.rc_target_bitrate, (uint32_t)bit_rate);
|
|
cfg2.rc_target_bitrate = bit_rate;
|
|
const vpx_codec_err_t rc = vpx_codec_enc_config_set(vc->encoder, &cfg2);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(vc->log, "Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
} else {
|
|
/* Resolution is changed, must reinitialize encoder since libvpx v1.4 doesn't support
|
|
* reconfiguring encoder to use resolutions greater than initially set.
|
|
*/
|
|
LOGGER_DEBUG(vc->log, "Have to reinitialize vpx encoder on session %p", (void *)vc);
|
|
vpx_codec_ctx_t new_c;
|
|
vpx_codec_enc_cfg_t cfg;
|
|
vc_init_encoder_cfg(vc->log, &cfg, kf_max_dist);
|
|
cfg.rc_target_bitrate = bit_rate;
|
|
cfg.g_w = width;
|
|
cfg.g_h = height;
|
|
|
|
LOGGER_DEBUG(vc->log, "Using VP8 codec for encoder");
|
|
vpx_codec_err_t rc = vpx_codec_enc_init(&new_c, video_codec_encoder_interface(), &cfg, VPX_CODEC_USE_FRAME_THREADING);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(vc->log, "Failed to initialize encoder: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
const int cpu_used_value = VP8E_SET_CPUUSED_VALUE;
|
|
|
|
rc = vpx_codec_control(&new_c, VP8E_SET_CPUUSED, cpu_used_value);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR(vc->log, "Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
vpx_codec_destroy(&new_c);
|
|
return -1;
|
|
}
|
|
|
|
vpx_codec_destroy(vc->encoder);
|
|
memcpy(vc->encoder, &new_c, sizeof(new_c));
|
|
}
|
|
|
|
return 0;
|
|
}
|