Files
fmviewer3/project/fm_viewer/fav/AudioResamplerTemplate.cpp
2026-02-21 17:11:31 +09:00

287 lines
12 KiB
C++

/******************************************************************************
QtAV: Multimedia framework based on Qt and FFmpeg
Copyright (C) 2012-2016 Wang Bin <wbsecg1@gmail.com>
* This file is part of QtAV
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
******************************************************************************/
#define REMOVE_AUDIO_RESAMPLER 0
#if !(REMOVE_AUDIO_RESAMPLER)
#if defined(BUILD_AVR) || defined(BUILD_SWR) // no this macro is fine too for qmake
#include "AudioResampler.h"
#include "AudioResampler_p.h"
#include "AVCompat.h"
#include "factory.h"
#include "Logger.h"
namespace FAV {
// Backend selection. When QTAV_HAVE(SWR_AVR_MAP) is true, every "FF"-suffixed
// identifier used below is aliased to its "Libav" counterpart and the backend
// is named "Libav"; otherwise the identifiers are left as written and the
// backend is named "FFmpeg".
#if QTAV_HAVE(SWR_AVR_MAP)
#define AudioResamplerFF AudioResamplerLibav
#define AudioResamplerFFPrivate AudioResamplerLibavPrivate
#define AudioResamplerId_FF AudioResamplerId_Libav
#define RegisterAudioResamplerFF_Man RegisterAudioResamplerLibav_Man
// FF is the token handed to FACTORY_REGISTER further down in this file.
#define FF Libav
// Name passed to FACTORY_REGISTER for this backend.
static const char kName[] = "Libav";
#else
// Name passed to FACTORY_REGISTER for this backend.
static const char kName[] = "FFmpeg";
#endif
// Forward declaration of the private data class defined later in this file.
class AudioResamplerFFPrivate;
/*!
 * AudioResampler implementation whose convert()/prepare() are implemented in
 * this file on top of the swr_* API.
 */
class AudioResamplerFF : public AudioResampler
{
// NOTE(review): the macro argument is the base class name, not
// AudioResamplerFF; presumably intentional (private-pointer plumbing of the
// base class) -- confirm against the DPTR macro definition.
DPTR_DECLARE_PRIVATE(AudioResampler)
public:
AudioResamplerFF();
// Resamples the input plane pointer(s) in \a data; returns false on failure.
virtual bool convert(const quint8** data);
// (Re)creates and initializes the resampling context; returns false on failure.
virtual bool prepare();
};
// Declaration only: the id object itself is defined outside this statement
// (presumably by the factory registration machinery or another translation
// unit -- confirm).
extern AudioResamplerId AudioResamplerId_FF;
// Registers this backend with the AudioResampler factory using the FF token
// and the kName string selected above.
FACTORY_REGISTER(AudioResampler, FF, kName)
/*!
 * Private data of AudioResamplerFF: the resampling context and the channel
 * map storage handed to swr_set_channel_mapping() by prepare().
 */
class AudioResamplerFFPrivate : public AudioResamplerPrivate
{
public:
    AudioResamplerFFPrivate()
        : context(0)
    {
    }

    ~AudioResamplerFFPrivate()
    {
        // Nothing to release if prepare() never created a context.
        if (!context)
            return;
        swr_free(&context);
        context = 0;
    }

    // Resampling context; 0 until prepare() allocates it.
    SwrContext *context;
// defined in swr<1
#ifndef SWR_CH_MAX
#define SWR_CH_MAX 64
#endif
    // Filled by prepare() before it is passed to swr_set_channel_mapping().
    int channel_map[SWR_CH_MAX];
};
// Constructs the resampler with a newly allocated backend-specific private
// data object, which is handed to the AudioResampler base constructor.
AudioResamplerFF::AudioResamplerFF()
    : AudioResampler(*new AudioResamplerFFPrivate())
{}
bool AudioResamplerFF::convert(const quint8 **data)
{
DPTR_D(AudioResamplerFF);
/*
* swr_get_delay: Especially when downsampling by a large value, the output sample rate may be a poor choice to represent
* the delay, similarly upsampling and the input sample rate.
*/
qreal osr = d.out_format.sampleRate();
if (!qFuzzyCompare(d.speed, 1.0))
osr /= d.speed;
d.out_samples_per_channel = av_rescale_rnd(
#if HAVE_SWR_GET_DELAY
swr_get_delay(d.context, qMax(d.in_format.sampleRate(), d.out_format.sampleRate())) +
#else
128 + //TODO: QtAV_Compat
#endif //HAVE_SWR_GET_DELAY
d.in_samples_per_channel //TODO: wanted_samples(ffplay mplayer2)
, osr, d.in_format.sampleRate(), AV_ROUND_UP);
//TODO: why crash for swr 0.5?
//int out_size = av_samples_get_buffer_size(NULL/*out linesize*/, d.out_channels, d.out_samples_per_channel, (AVSampleFormat)d.out_sample_format, 0/*alignment default*/);
int size_per_sample_with_channels = d.out_format.channels()*d.out_format.bytesPerSample();
int out_size = d.out_samples_per_channel*size_per_sample_with_channels;
if (out_size > d.data_out.size())
d.data_out.resize(out_size);
uint8_t *out[] = {(uint8_t*)d.data_out.data()}; // detach if implicitly shared by others
//number of input/output samples available in one channel
int converted_samplers_per_channel = swr_convert(d.context, out, d.out_samples_per_channel, data, d.in_samples_per_channel);
d.out_samples_per_channel = converted_samplers_per_channel;
if (converted_samplers_per_channel < 0) {
qWarning("[AudioResamplerFF] %s", av_err2str(converted_samplers_per_channel));
return false;
}
//TODO: converted_samplers_per_channel==out_samples_per_channel means out_size is too small, see mplayer2
//converted_samplers_per_channel*d.out_channels*av_get_bytes_per_sample(d.out_sample_format)
//av_samples_get_buffer_size(0, d.out_channels, converted_samplers_per_channel, d.out_sample_format, 0)
//if (converted_samplers_per_channel != out_size)
d.data_out.resize(converted_samplers_per_channel*size_per_sample_with_channels);
return true;
}
/*
*TODO: broken sample rate(AAC), see mplayer
*/
bool AudioResamplerFF::prepare()
{
DPTR_D(AudioResamplerFF);
if (!d.in_format.isValid()) {
qWarning("src audio parameters 'channel layout(or channels), sample rate and sample format must be set before initialize resampler");
return false;
}
//TODO: also in do this statistics
if (!d.in_format.channels()) {
if (!d.in_format.channelLayoutFFmpeg()) { //FIXME: already return
d.in_format.setChannels(2);
d.in_format.setChannelLayoutFFmpeg(av_get_default_channel_layout(d.in_format.channels())); //from mplayer2
qWarning("both channels and channel layout are not available, assume channels=%d, channel layout=%lld", d.in_format.channels(), d.in_format.channelLayoutFFmpeg());
} else {
d.in_format.setChannels(av_get_channel_layout_nb_channels(d.in_format.channelLayoutFFmpeg()));
}
}
if (!d.in_format.channels())
d.in_format.setChannels(2); //TODO: why av_get_channel_layout_nb_channels() may return 0?
if (!d.in_format.channelLayoutFFmpeg()) {
qWarning("channel layout not available, use default layout");
d.in_format.setChannelLayoutFFmpeg(av_get_default_channel_layout(d.in_format.channels()));
}
if (!d.out_format.channels()) {
if (d.out_format.channelLayoutFFmpeg()) {
d.out_format.setChannels(av_get_channel_layout_nb_channels(d.out_format.channelLayoutFFmpeg()));
} else {
d.out_format.setChannels(d.in_format.channels());
d.out_format.setChannelLayoutFFmpeg(d.in_format.channelLayoutFFmpeg());
}
}
if (d.out_format.channelLayout() == AudioFormat::ChannelLayout_Unsupported) {
d.out_format.setChannels(d.in_format.channels());
d.out_format.setChannelLayoutFFmpeg(d.in_format.channelLayoutFFmpeg());
}
//now we have out channels
if (!d.out_format.channelLayoutFFmpeg())
d.out_format.setChannelLayoutFFmpeg(av_get_default_channel_layout(d.out_format.channels()));
if (!d.out_format.sampleRate())
d.out_format.setSampleRate(inAudioFormat().sampleRate());
if (d.speed <= 0)
d.speed = 1.0;
//DO NOT set sample rate here, we should keep the original and multiply 1/speed when needed
//if (d.speed != 1.0)
// d.out_format.setSampleRate(int(qreal(d.out_format.sampleFormat())/d.speed));
qDebug("swr speed=%.2f", d.speed);
//d.in_planes = av_sample_fmt_is_planar((enum AVSampleFormat)d.in_sample_format) ? d.in_channels : 1;
//d.out_planes = av_sample_fmt_is_planar((enum AVSampleFormat)d.out_sample_format) ? d.out_channels : 1;
if (d.context)
swr_free(&d.context); //TODO: if no free(of cause free is required), why channel mapping and layout not work if change from left to stereo?
//If use swr_alloc() need to set the parameters (av_opt_set_xxx() manually or with swr_alloc_set_opts()) before calling swr_init()
d.context = swr_alloc_set_opts(d.context
, d.out_format.channelLayoutFFmpeg()
, (enum AVSampleFormat)outAudioFormat().sampleFormatFFmpeg()
, qreal(outAudioFormat().sampleRate())/d.speed
, d.in_format.channelLayoutFFmpeg()
, (enum AVSampleFormat)inAudioFormat().sampleFormatFFmpeg()
, inAudioFormat().sampleRate()
, 0 /*log_offset*/, 0 /*log_ctx*/);
/*
av_opt_set_int(d.context, "in_channel_layout", d.in_channel_layout, 0);
av_opt_set_int(d.context, "in_sample_rate", d.in_format.sampleRate(), 0);
av_opt_set_sample_fmt(d.context, "in_sample_fmt", (enum AVSampleFormat)in_format.sampleFormatFFmpeg(), 0);
av_opt_set_int(d.context, "out_channel_layout", d.out_channel_layout, 0);
av_opt_set_int(d.context, "out_sample_rate", d.out_format.sampleRate(), 0);
av_opt_set_sample_fmt(d.context, "out_sample_fmt", (enum AVSampleFormat)out_format.sampleFormatFFmpeg(), 0);
*/
qDebug("out: {cl: %lld, fmt: %s, freq: %d}"
, d.out_format.channelLayoutFFmpeg()
, qPrintable(d.out_format.sampleFormatName())
, d.out_format.sampleRate());
qDebug("in {cl: %lld, fmt: %s, freq: %d}"
, d.in_format.channelLayoutFFmpeg()
, qPrintable(d.in_format.sampleFormatName())
, d.in_format.sampleRate());
if (!d.context) {
qWarning("Allocat swr context failed!");
return false;
}
//avresample 0.0.2(FFmpeg 0.11)~1.0.1(FFmpeg 1.1) has no channel mapping. but has remix matrix, so does swresample
//TODO: why crash if use channel mapping for L or R?
#if QTAV_HAVE(SWR_AVR_MAP) //LIBAVRESAMPLE_VERSION_INT < AV_VERSION_INT(1, 1, 0)
bool remix = false;
int in_c = d.in_format.channels();
int out_c = d.out_format.channels();
/*
* matrix[i + stride * o] is the weight of input channel i in output channel o.
*/
double *matrix = 0;
if (d.out_format.channelLayout() == AudioFormat::ChannelLayout_Left) {
remix = true;
matrix = (double*)calloc(in_c*out_c, sizeof(double));
for (int o = 0; o < out_c; ++o) {
matrix[0 + in_c * o] = 1;
}
}
if (d.out_format.channelLayout() == AudioFormat::ChannelLayout_Right) {
remix = true;
matrix = (double*)calloc(in_c*out_c, sizeof(double));
for (int o = 0; o < out_c; ++o) {
matrix[1 + in_c * o] = 1;
}
}
if (!remix && in_c < out_c) {
remix = true;
//double matrix[in_c*out_c]; //C99, VLA
matrix = (double*)calloc(in_c*out_c, sizeof(double));
for (int i = 0, o = 0; o < out_c; ++o) {
matrix[i + in_c * o] = 1;
i = (i + i)%in_c;
}
}
if (remix && matrix) {
avresample_set_matrix(d.context, matrix, in_c);
free(matrix);
}
#else
bool use_channel_map = false;
if (d.out_format.channelLayout() == AudioFormat::ChannelLayout_Left) {
use_channel_map = true;
memset(d.channel_map, 0, sizeof(d.channel_map));
for (int i = 0; i < d.out_format.channels(); ++i) {
d.channel_map[i] = 0;
}
}
if (d.out_format.channelLayout() == AudioFormat::ChannelLayout_Right) {
use_channel_map = true;
memset(d.channel_map, 0, sizeof(d.channel_map));
for (int i = 0; i < d.out_format.channels(); ++i) {
d.channel_map[i] = 1;
}
}
if (!use_channel_map && d.in_format.channels() < d.out_format.channels()) {
use_channel_map = true;
memset(d.channel_map, 0, sizeof(d.channel_map));
for (int i = 0; i < d.out_format.channels(); ++i) {
d.channel_map[i] = i % d.in_format.channels();
}
}
if (use_channel_map) {
av_opt_set_int(d.context, "icl", d.out_format.channelLayoutFFmpeg(), 0);
//TODO: why crash if layout is mono and set uch(i.e. always the next line)
av_opt_set_int(d.context, "uch", d.out_format.channels(), 0);
swr_set_channel_mapping(d.context, d.channel_map);
}
#endif //QTAV_HAVE(SWR_AVR_MAP)
int ret = swr_init(d.context);
if (ret < 0) {
qWarning("swr_init failed: %s", av_err2str(ret));
swr_free(&d.context);
return false;
}
return true;
}
} //namespace FAV
#endif //defined(BUILD_AVR) || defined(BUILD_SWR)
#endif // #if !(REMOVE_AUDIO_RESAMPLER)