mirror of
https://github.com/irungentoo/toxcore.git
synced 2024-03-22 13:30:51 +08:00
443abcfafe
Audio killing itself after 20 minutes in a call should be fixed.
345 lines
8.9 KiB
C
345 lines
8.9 KiB
C
/** codec.c
|
|
*
|
|
* Audio and video codec intitialization, encoding/decoding and playback
|
|
*
|
|
* Copyright (C) 2013 Tox project All Rights Reserved.
|
|
*
|
|
* This file is part of Tox.
|
|
*
|
|
* Tox is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* Tox is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with Tox. If not, see <http://www.gnu.org/licenses/>.
|
|
*
|
|
*/
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "config.h"
|
|
#endif /* HAVE_CONFIG_H */
|
|
|
|
#include "../toxcore/logger.h"
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <math.h>
|
|
#include <assert.h>
|
|
|
|
#include "rtp.h"
|
|
#include "codec.h"
|
|
|
|
JitterBuffer *create_queue(unsigned int capacity)
|
|
{
|
|
unsigned int size = 1;
|
|
|
|
while (size <= (capacity + 1) * 2) {
|
|
size *= 2;
|
|
}
|
|
|
|
JitterBuffer *q;
|
|
|
|
if ( !(q = calloc(sizeof(JitterBuffer), 1)) ) return NULL;
|
|
|
|
if (!(q->queue = calloc(sizeof(RTPMessage *), size))) {
|
|
free(q);
|
|
return NULL;
|
|
}
|
|
|
|
q->size = size;
|
|
q->capacity = capacity;
|
|
return q;
|
|
}
|
|
|
|
void terminate_queue(JitterBuffer *q)
|
|
{
|
|
if (!q) return;
|
|
|
|
for (; q->bottom != q->top; ++q->bottom) {
|
|
if (!q->queue[q->bottom % q->size])
|
|
rtp_free_msg(NULL, q->queue[q->bottom % q->size]);
|
|
}
|
|
|
|
free(q->queue);
|
|
free(q);
|
|
}
|
|
|
|
void queue(JitterBuffer *q, RTPMessage *pk)
|
|
{
|
|
uint16_t sequnum = pk->header->sequnum;
|
|
|
|
if (sequnum - q->bottom > q->size)
|
|
return;
|
|
|
|
unsigned int num = sequnum % q->size;
|
|
|
|
if (q->queue[num])
|
|
return;
|
|
|
|
q->queue[num] = pk;
|
|
|
|
if ((sequnum - q->bottom) >= (q->top - q->bottom))
|
|
q->top = sequnum + 1;
|
|
}
|
|
|
|
/* success is 0 when there is nothing to dequeue, 1 when there's a good packet, 2 when there's a lost packet */
|
|
RTPMessage *dequeue(JitterBuffer *q, int *success)
|
|
{
|
|
if (q->top == q->bottom) {
|
|
*success = 0;
|
|
return NULL;
|
|
}
|
|
|
|
unsigned int num = q->bottom % q->size;
|
|
|
|
if (q->queue[num]) {
|
|
RTPMessage *ret = q->queue[num];
|
|
q->queue[num] = NULL;
|
|
++q->bottom;
|
|
*success = 1;
|
|
return ret;
|
|
}
|
|
|
|
if (q->top - q->bottom > q->capacity) {
|
|
++q->bottom;
|
|
*success = 2;
|
|
return NULL;
|
|
}
|
|
|
|
*success = 0;
|
|
return NULL;
|
|
}
|
|
|
|
|
|
int init_video_decoder(CodecState *cs)
|
|
{
|
|
int rc = vpx_codec_dec_init_ver(&cs->v_decoder, VIDEO_CODEC_DECODER_INTERFACE, NULL, 0, VPX_DECODER_ABI_VERSION);
|
|
|
|
if ( rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Init video_decoder failed: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int init_audio_decoder(CodecState *cs, uint32_t audio_channels)
|
|
{
|
|
int rc;
|
|
cs->audio_decoder = opus_decoder_create(cs->audio_sample_rate, audio_channels, &rc );
|
|
|
|
if ( rc != OPUS_OK ) {
|
|
LOGGER_ERROR("Error while starting audio decoder: %s", opus_strerror(rc));
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int reconfigure_video_encoder_resolution(CodecState *cs, uint16_t width, uint16_t height)
|
|
{
|
|
vpx_codec_enc_cfg_t cfg = *cs->v_encoder.config.enc;
|
|
|
|
if (cfg.g_w == width && cfg.g_h == height)
|
|
return 0;
|
|
|
|
if (width * height > cs->max_width * cs->max_height)
|
|
return -1;
|
|
|
|
LOGGER_DEBUG("New video resolution: %u %u", width, height);
|
|
cfg.g_w = width;
|
|
cfg.g_h = height;
|
|
int rc = vpx_codec_enc_config_set(&cs->v_encoder, &cfg);
|
|
|
|
if ( rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int reconfigure_video_encoder_bitrate(CodecState *cs, uint32_t video_bitrate)
|
|
{
|
|
vpx_codec_enc_cfg_t cfg = *cs->v_encoder.config.enc;
|
|
|
|
if (cfg.rc_target_bitrate == video_bitrate)
|
|
return 0;
|
|
|
|
LOGGER_DEBUG("New video bitrate: %u", video_bitrate);
|
|
cfg.rc_target_bitrate = video_bitrate;
|
|
int rc = vpx_codec_enc_config_set(&cs->v_encoder, &cfg);
|
|
|
|
if ( rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int init_video_encoder(CodecState *cs, uint16_t max_width, uint16_t max_height, uint32_t video_bitrate)
|
|
{
|
|
vpx_codec_enc_cfg_t cfg;
|
|
int rc = vpx_codec_enc_config_default(VIDEO_CODEC_ENCODER_INTERFACE, &cfg, 0);
|
|
|
|
if (rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Failed to get config: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
cfg.rc_target_bitrate = video_bitrate;
|
|
cfg.g_w = max_width;
|
|
cfg.g_h = max_height;
|
|
cfg.g_pass = VPX_RC_ONE_PASS;
|
|
cfg.g_error_resilient = VPX_ERROR_RESILIENT_DEFAULT | VPX_ERROR_RESILIENT_PARTITIONS;
|
|
cfg.g_lag_in_frames = 0;
|
|
cfg.kf_min_dist = 0;
|
|
cfg.kf_max_dist = 300;
|
|
cfg.kf_mode = VPX_KF_AUTO;
|
|
|
|
cs->max_width = max_width;
|
|
cs->max_height = max_height;
|
|
cs->bitrate = video_bitrate;
|
|
|
|
rc = vpx_codec_enc_init_ver(&cs->v_encoder, VIDEO_CODEC_ENCODER_INTERFACE, &cfg, 0, VPX_ENCODER_ABI_VERSION);
|
|
|
|
if ( rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Failed to initialize encoder: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
rc = vpx_codec_control(&cs->v_encoder, VP8E_SET_CPUUSED, 7);
|
|
|
|
if ( rc != VPX_CODEC_OK) {
|
|
LOGGER_ERROR("Failed to set encoder control setting: %s", vpx_codec_err_to_string(rc));
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
int init_audio_encoder(CodecState *cs, uint32_t audio_channels)
|
|
{
|
|
int rc = OPUS_OK;
|
|
cs->audio_encoder = opus_encoder_create(cs->audio_sample_rate, audio_channels, OPUS_APPLICATION_AUDIO, &rc);
|
|
|
|
if ( rc != OPUS_OK ) {
|
|
LOGGER_ERROR("Error while starting audio encoder: %s", opus_strerror(rc));
|
|
return -1;
|
|
}
|
|
|
|
rc = opus_encoder_ctl(cs->audio_encoder, OPUS_SET_BITRATE(cs->audio_bitrate));
|
|
|
|
if ( rc != OPUS_OK ) {
|
|
LOGGER_ERROR("Error while setting encoder ctl: %s", opus_strerror(rc));
|
|
return -1;
|
|
}
|
|
|
|
rc = opus_encoder_ctl(cs->audio_encoder, OPUS_SET_COMPLEXITY(10));
|
|
|
|
if ( rc != OPUS_OK ) {
|
|
LOGGER_ERROR("Error while setting encoder ctl: %s", opus_strerror(rc));
|
|
return -1;
|
|
}
|
|
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
CodecState *codec_init_session ( uint32_t audio_bitrate,
|
|
uint16_t audio_frame_duration,
|
|
uint32_t audio_sample_rate,
|
|
uint32_t audio_channels,
|
|
uint32_t audio_VAD_tolerance_ms,
|
|
uint16_t max_video_width,
|
|
uint16_t max_video_height,
|
|
uint32_t video_bitrate )
|
|
{
|
|
CodecState *retu = calloc(sizeof(CodecState), 1);
|
|
|
|
if (!retu) return NULL;
|
|
|
|
retu->audio_bitrate = audio_bitrate;
|
|
retu->audio_sample_rate = audio_sample_rate;
|
|
|
|
/* Encoders */
|
|
if (!max_video_width || !max_video_height) { /* Disable video */
|
|
/*video_width = 320;
|
|
video_height = 240; */
|
|
} else {
|
|
retu->capabilities |= ( 0 == init_video_encoder(retu, max_video_width, max_video_height,
|
|
video_bitrate) ) ? v_encoding : 0;
|
|
retu->capabilities |= ( 0 == init_video_decoder(retu) ) ? v_decoding : 0;
|
|
}
|
|
|
|
retu->capabilities |= ( 0 == init_audio_encoder(retu, audio_channels) ) ? a_encoding : 0;
|
|
retu->capabilities |= ( 0 == init_audio_decoder(retu, audio_channels) ) ? a_decoding : 0;
|
|
|
|
if ( retu->capabilities == 0 ) { /* everything failed */
|
|
free (retu);
|
|
return NULL;
|
|
}
|
|
|
|
|
|
retu->EVAD_tolerance = audio_VAD_tolerance_ms > audio_frame_duration ?
|
|
audio_VAD_tolerance_ms / audio_frame_duration : audio_frame_duration;
|
|
|
|
return retu;
|
|
}
|
|
|
|
void codec_terminate_session ( CodecState *cs )
|
|
{
|
|
if (!cs) return;
|
|
|
|
if ( cs->audio_encoder )
|
|
opus_encoder_destroy(cs->audio_encoder);
|
|
|
|
if ( cs->audio_decoder )
|
|
opus_decoder_destroy(cs->audio_decoder);
|
|
|
|
if ( cs->capabilities & v_decoding )
|
|
vpx_codec_destroy(&cs->v_decoder);
|
|
|
|
if ( cs->capabilities & v_encoding )
|
|
vpx_codec_destroy(&cs->v_encoder);
|
|
|
|
LOGGER_DEBUG("Terminated codec state: %p", cs);
|
|
free(cs);
|
|
}
|
|
|
|
static float calculate_sum_sq (int16_t *n, uint16_t k)
|
|
{
|
|
float result = 0;
|
|
uint16_t i = 0;
|
|
|
|
for ( ; i < k; i ++) result += (float) (n[i] * n[i]);
|
|
|
|
return result;
|
|
}
|
|
|
|
int energy_VAD(CodecState *cs, int16_t *PCM, uint16_t frame_size, float energy)
|
|
{
|
|
float frame_energy = sqrt(calculate_sum_sq(PCM, frame_size)) / frame_size;
|
|
|
|
if ( frame_energy > energy) {
|
|
cs->EVAD_tolerance_cr = cs->EVAD_tolerance; /* Reset counter */
|
|
return 1;
|
|
}
|
|
|
|
if ( cs->EVAD_tolerance_cr ) {
|
|
cs->EVAD_tolerance_cr --;
|
|
return 1;
|
|
}
|
|
|
|
return 0;
|
|
}
|