Rewrite media decoder to use FFmpeg 3.2+ API (task #4686)

pull/541/head
Andrei Kortunov 6 years ago
parent 261bbded00
commit f88d5e808c

@ -3,6 +3,7 @@
Feature #2229: Improve pathfinding AI Feature #2229: Improve pathfinding AI
Feature #3442: Default values for fallbacks from ini file Feature #3442: Default values for fallbacks from ini file
Task #4686: Upgrade media decoder to a more current FFmpeg API
0.45.0 0.45.0

@ -6,5 +6,5 @@ brew outdated cmake || brew upgrade cmake
brew outdated pkgconfig || brew upgrade pkgconfig brew outdated pkgconfig || brew upgrade pkgconfig
brew install qt brew install qt
curl -fSL -R -J https://downloads.openmw.org/osx/dependencies/openmw-deps-4eec887.zip -o ~/openmw-deps.zip curl -fSL -R -J https://downloads.openmw.org/osx/dependencies/openmw-deps-7cf2789.zip -o ~/openmw-deps.zip
unzip -o ~/openmw-deps.zip -d /private/tmp/openmw-deps > /dev/null unzip -o ~/openmw-deps.zip -d /private/tmp/openmw-deps > /dev/null

@ -153,7 +153,52 @@ if (USE_QT)
endif() endif()
# Sound setup # Sound setup
# Require at least ffmpeg 3.2 for now
SET(FFVER_OK FALSE)
find_package(FFmpeg REQUIRED COMPONENTS AVCODEC AVFORMAT AVUTIL SWSCALE SWRESAMPLE) find_package(FFmpeg REQUIRED COMPONENTS AVCODEC AVFORMAT AVUTIL SWSCALE SWRESAMPLE)
# Validate the FFmpeg libraries located by find_package().
# FFVER_OK is TRUE afterwards only if no component is older than its minimum.
if(FFmpeg_FOUND)
    set(FFVER_OK TRUE)
    # The FFmpeg version can not be detected on Windows for now, so the
    # per-library comparison is only done on other platforms.
    if(NOT WIN32)
        # Minimum accepted version of each component.
        set(_ffmpeg_min_AVFORMAT   "57.56.100")
        set(_ffmpeg_min_AVCODEC    "57.64.100")
        set(_ffmpeg_min_AVUTIL     "55.34.100")
        set(_ffmpeg_min_SWSCALE    "4.2.100")
        set(_ffmpeg_min_SWRESAMPLE "2.3.100")

        # Components are checked in the same order as they are reported.
        foreach(_ffmpeg_component AVFORMAT AVCODEC AVUTIL SWSCALE SWRESAMPLE)
            # "AVFORMAT" -> "libavformat", used only for the status message.
            string(TOLOWER "lib${_ffmpeg_component}" _ffmpeg_libname)
            set(_ffmpeg_wanted "${_ffmpeg_min_${_ffmpeg_component}}")
            if(FFmpeg_${_ffmpeg_component}_VERSION VERSION_LESS "${_ffmpeg_wanted}")
                message(STATUS "${_ffmpeg_libname} is too old! (${FFmpeg_${_ffmpeg_component}_VERSION}, wanted ${_ffmpeg_wanted})")
                set(FFVER_OK FALSE)
            endif()
        endforeach()
    endif()
else()
    message(FATAL_ERROR "FFmpeg was not found" )
endif()

# Abort the configuration when any component failed the version check.
if(NOT FFVER_OK)
    message(FATAL_ERROR "FFmpeg version is too old, 3.2 is required" )
endif()

# On Windows nothing was verified, so only remind the user of the requirement.
if(WIN32)
    message("Can not detect FFmpeg version, at least the 3.2 is required" )
endif()
# Required for building the FFmpeg headers # Required for building the FFmpeg headers
add_definitions(-D__STDC_CONSTANT_MACROS) add_definitions(-D__STDC_CONSTANT_MACROS)

@ -82,7 +82,7 @@ bool FFmpeg_Decoder::getNextPacket()
} }
/* Free the packet and look for another */ /* Free the packet and look for another */
av_free_packet(&mPacket); av_packet_unref(&mPacket);
} }
return false; return false;
@ -90,9 +90,9 @@ bool FFmpeg_Decoder::getNextPacket()
bool FFmpeg_Decoder::getAVAudioData() bool FFmpeg_Decoder::getAVAudioData()
{ {
int got_frame; bool got_frame;
if((*mStream)->codec->codec_type != AVMEDIA_TYPE_AUDIO) if(mCodecCtx->codec_type != AVMEDIA_TYPE_AUDIO)
return false; return false;
do { do {
@ -100,19 +100,18 @@ bool FFmpeg_Decoder::getAVAudioData()
return false; return false;
/* Decode some data, and check for errors */ /* Decode some data, and check for errors */
int len = 0; int ret = 0;
if((len=avcodec_decode_audio4((*mStream)->codec, mFrame, &got_frame, &mPacket)) < 0) ret = avcodec_receive_frame(mCodecCtx, mFrame);
if (ret == 0)
got_frame = true;
if (ret == AVERROR(EAGAIN))
ret = 0;
if (ret == 0)
ret = avcodec_send_packet(mCodecCtx, &mPacket);
if (ret < 0 && ret != AVERROR(EAGAIN))
return false; return false;
/* Move the unread data to the front and clear the end bits */ av_packet_unref(&mPacket);
int remaining = mPacket.size - len;
if(remaining <= 0)
av_free_packet(&mPacket);
else
{
memmove(mPacket.data, &mPacket.data[len], remaining);
av_shrink_packet(&mPacket, remaining);
}
if (!got_frame || mFrame->nb_samples == 0) if (!got_frame || mFrame->nb_samples == 0)
continue; continue;
@ -139,8 +138,8 @@ bool FFmpeg_Decoder::getAVAudioData()
else else
mFrameData = &mFrame->data[0]; mFrameData = &mFrame->data[0];
} while(got_frame == 0 || mFrame->nb_samples == 0); } while(!got_frame || mFrame->nb_samples == 0);
mNextPts += (double)mFrame->nb_samples / (double)(*mStream)->codec->sample_rate; mNextPts += (double)mFrame->nb_samples / mCodecCtx->sample_rate;
return true; return true;
} }
@ -213,7 +212,7 @@ void FFmpeg_Decoder::open(const std::string &fname)
for(size_t j = 0;j < mFormatCtx->nb_streams;j++) for(size_t j = 0;j < mFormatCtx->nb_streams;j++)
{ {
if(mFormatCtx->streams[j]->codec->codec_type == AVMEDIA_TYPE_AUDIO) if(mFormatCtx->streams[j]->codecpar->codec_type == AVMEDIA_TYPE_AUDIO)
{ {
mStream = &mFormatCtx->streams[j]; mStream = &mFormatCtx->streams[j];
break; break;
@ -222,39 +221,48 @@ void FFmpeg_Decoder::open(const std::string &fname)
if(!mStream) if(!mStream)
throw std::runtime_error("No audio streams in "+fname); throw std::runtime_error("No audio streams in "+fname);
(*mStream)->codec->request_sample_fmt = (*mStream)->codec->sample_fmt; AVCodec *codec = avcodec_find_decoder((*mStream)->codecpar->codec_id);
AVCodec *codec = avcodec_find_decoder((*mStream)->codec->codec_id);
if(!codec) if(!codec)
{ {
std::string ss = "No codec found for id " + std::string ss = "No codec found for id " +
std::to_string((*mStream)->codec->codec_id); std::to_string((*mStream)->codecpar->codec_id);
throw std::runtime_error(ss); throw std::runtime_error(ss);
} }
if(avcodec_open2((*mStream)->codec, codec, nullptr) < 0)
throw std::runtime_error(std::string("Failed to open audio codec ") + AVCodecContext *avctx = avcodec_alloc_context3(codec);
codec->long_name); avcodec_parameters_to_context(avctx, (*mStream)->codecpar);
// This is no longer needed as of FFmpeg 4.0
#if LIBAVCODEC_VERSION_INT < 3805796
av_codec_set_pkt_timebase(avctx, (*mStream)->time_base);
#endif
mCodecCtx = avctx;
if(avcodec_open2(mCodecCtx, codec, nullptr) < 0)
throw std::runtime_error(std::string("Failed to open audio codec ") + codec->long_name);
mFrame = av_frame_alloc(); mFrame = av_frame_alloc();
if((*mStream)->codec->sample_fmt == AV_SAMPLE_FMT_FLT || if(mCodecCtx->sample_fmt == AV_SAMPLE_FMT_FLT || mCodecCtx->sample_fmt == AV_SAMPLE_FMT_FLTP)
(*mStream)->codec->sample_fmt == AV_SAMPLE_FMT_FLTP)
mOutputSampleFormat = AV_SAMPLE_FMT_S16; // FIXME: Check for AL_EXT_FLOAT32 support mOutputSampleFormat = AV_SAMPLE_FMT_S16; // FIXME: Check for AL_EXT_FLOAT32 support
else if((*mStream)->codec->sample_fmt == AV_SAMPLE_FMT_U8P) else if(mCodecCtx->sample_fmt == AV_SAMPLE_FMT_U8P)
mOutputSampleFormat = AV_SAMPLE_FMT_U8; mOutputSampleFormat = AV_SAMPLE_FMT_U8;
else if((*mStream)->codec->sample_fmt == AV_SAMPLE_FMT_S16P) else if(mCodecCtx->sample_fmt == AV_SAMPLE_FMT_S16P)
mOutputSampleFormat = AV_SAMPLE_FMT_S16; mOutputSampleFormat = AV_SAMPLE_FMT_S16;
else else
mOutputSampleFormat = AV_SAMPLE_FMT_S16; mOutputSampleFormat = AV_SAMPLE_FMT_S16;
mOutputChannelLayout = (*mStream)->codec->channel_layout; mOutputChannelLayout = (*mStream)->codecpar->channel_layout;
if(mOutputChannelLayout == 0) if(mOutputChannelLayout == 0)
mOutputChannelLayout = av_get_default_channel_layout((*mStream)->codec->channels); mOutputChannelLayout = av_get_default_channel_layout(mCodecCtx->channels);
mCodecCtx->channel_layout = mOutputChannelLayout;
} }
catch(...) catch(...)
{ {
if(mStream) if(mStream)
avcodec_close((*mStream)->codec); avcodec_free_context(&mCodecCtx);
mStream = nullptr; mStream = nullptr;
if (mFormatCtx != nullptr) if (mFormatCtx != nullptr)
@ -275,10 +283,10 @@ void FFmpeg_Decoder::open(const std::string &fname)
void FFmpeg_Decoder::close() void FFmpeg_Decoder::close()
{ {
if(mStream) if(mStream)
avcodec_close((*mStream)->codec); avcodec_free_context(&mCodecCtx);
mStream = nullptr; mStream = nullptr;
av_free_packet(&mPacket); av_packet_unref(&mPacket);
av_freep(&mFrame); av_freep(&mFrame);
swr_free(&mSwr); swr_free(&mSwr);
av_freep(&mDataBuf); av_freep(&mDataBuf);
@ -308,7 +316,12 @@ void FFmpeg_Decoder::close()
std::string FFmpeg_Decoder::getName() std::string FFmpeg_Decoder::getName()
{ {
// In FFmpeg 4.0 the "filename" field was replaced by "url"
#if LIBAVCODEC_VERSION_INT < 3805796
return mFormatCtx->filename; return mFormatCtx->filename;
#else
return mFormatCtx->url;
#endif
} }
void FFmpeg_Decoder::getInfo(int *samplerate, ChannelConfig *chans, SampleType *type) void FFmpeg_Decoder::getInfo(int *samplerate, ChannelConfig *chans, SampleType *type)
@ -341,11 +354,10 @@ void FFmpeg_Decoder::getInfo(int *samplerate, ChannelConfig *chans, SampleType *
else else
{ {
char str[1024]; char str[1024];
av_get_channel_layout_string(str, sizeof(str), (*mStream)->codec->channels, av_get_channel_layout_string(str, sizeof(str), mCodecCtx->channels, mCodecCtx->channel_layout);
(*mStream)->codec->channel_layout);
Log(Debug::Error) << "Unsupported channel layout: "<< str; Log(Debug::Error) << "Unsupported channel layout: "<< str;
if((*mStream)->codec->channels == 1) if(mCodecCtx->channels == 1)
{ {
mOutputChannelLayout = AV_CH_LAYOUT_MONO; mOutputChannelLayout = AV_CH_LAYOUT_MONO;
*chans = ChannelConfig_Mono; *chans = ChannelConfig_Mono;
@ -357,27 +369,28 @@ void FFmpeg_Decoder::getInfo(int *samplerate, ChannelConfig *chans, SampleType *
} }
} }
*samplerate = (*mStream)->codec->sample_rate; *samplerate = mCodecCtx->sample_rate;
int64_t ch_layout = (*mStream)->codec->channel_layout; int64_t ch_layout = mCodecCtx->channel_layout;
if(ch_layout == 0) if(ch_layout == 0)
ch_layout = av_get_default_channel_layout((*mStream)->codec->channels); ch_layout = av_get_default_channel_layout(mCodecCtx->channels);
if(mOutputSampleFormat != (*mStream)->codec->sample_fmt || if(mOutputSampleFormat != mCodecCtx->sample_fmt ||
mOutputChannelLayout != ch_layout) mOutputChannelLayout != ch_layout)
{ {
mSwr = swr_alloc_set_opts(mSwr, // SwrContext mSwr = swr_alloc_set_opts(mSwr, // SwrContext
mOutputChannelLayout, // output ch layout mOutputChannelLayout, // output ch layout
mOutputSampleFormat, // output sample format mOutputSampleFormat, // output sample format
(*mStream)->codec->sample_rate, // output sample rate mCodecCtx->sample_rate, // output sample rate
ch_layout, // input ch layout ch_layout, // input ch layout
(*mStream)->codec->sample_fmt, // input sample format mCodecCtx->sample_fmt, // input sample format
(*mStream)->codec->sample_rate, // input sample rate mCodecCtx->sample_rate, // input sample rate
0, // logging level offset 0, // logging level offset
nullptr); // log context nullptr); // log context
if(!mSwr) if(!mSwr)
throw std::runtime_error("Couldn't allocate SwrContext"); throw std::runtime_error("Couldn't allocate SwrContext");
if(swr_init(mSwr) < 0) int init=swr_init(mSwr);
throw std::runtime_error("Couldn't initialize SwrContext"); if(init < 0)
throw std::runtime_error("Couldn't initialize SwrContext: "+std::to_string(init));
} }
} }
@ -412,7 +425,7 @@ size_t FFmpeg_Decoder::getSampleOffset()
{ {
int delay = (mFrameSize-mFramePos) / av_get_channel_layout_nb_channels(mOutputChannelLayout) / int delay = (mFrameSize-mFramePos) / av_get_channel_layout_nb_channels(mOutputChannelLayout) /
av_get_bytes_per_sample(mOutputSampleFormat); av_get_bytes_per_sample(mOutputSampleFormat);
return (int)(mNextPts*(*mStream)->codec->sample_rate) - delay; return (int)(mNextPts*mCodecCtx->sample_rate) - delay;
} }
FFmpeg_Decoder::FFmpeg_Decoder(const VFS::Manager* vfs) FFmpeg_Decoder::FFmpeg_Decoder(const VFS::Manager* vfs)
@ -437,7 +450,10 @@ FFmpeg_Decoder::FFmpeg_Decoder(const VFS::Manager* vfs)
static bool done_init = false; static bool done_init = false;
if(!done_init) if(!done_init)
{ {
// This is no longer needed as of FFmpeg 4.0
#if LIBAVCODEC_VERSION_INT < 3805796
av_register_all(); av_register_all();
#endif
av_log_set_level(AV_LOG_ERROR); av_log_set_level(AV_LOG_ERROR);
done_init = true; done_init = true;
} }

@ -6,18 +6,7 @@ extern "C"
{ {
#include <libavcodec/avcodec.h> #include <libavcodec/avcodec.h>
#include <libavformat/avformat.h> #include <libavformat/avformat.h>
// From libavutil version 52.2.0 and onward the declaration of
// AV_CH_LAYOUT_* is removed from libavcodec/avcodec.h and moved to
// libavutil/channel_layout.h
#if AV_VERSION_INT(52, 2, 0) <= AV_VERSION_INT(LIBAVUTIL_VERSION_MAJOR, \
LIBAVUTIL_VERSION_MINOR, LIBAVUTIL_VERSION_MICRO)
#include <libavutil/channel_layout.h> #include <libavutil/channel_layout.h>
#endif
#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(55,28,1)
#define av_frame_alloc avcodec_alloc_frame
#endif
// From version 54.56 binkaudio encoding format changed from S16 to FLTP. See: // From version 54.56 binkaudio encoding format changed from S16 to FLTP. See:
// https://gitorious.org/ffmpeg/ffmpeg/commit/7bfd1766d1c18f07b0a2dd042418a874d49ea60d // https://gitorious.org/ffmpeg/ffmpeg/commit/7bfd1766d1c18f07b0a2dd042418a874d49ea60d
@ -38,6 +27,7 @@ namespace MWSound
class FFmpeg_Decoder final : public Sound_Decoder class FFmpeg_Decoder final : public Sound_Decoder
{ {
AVFormatContext *mFormatCtx; AVFormatContext *mFormatCtx;
AVCodecContext *mCodecCtx;
AVStream **mStream; AVStream **mStream;
AVPacket mPacket; AVPacket mPacket;

@ -48,7 +48,7 @@ namespace MWSound
{ {
ssize_t clock_delay = (mFrameSize-mFramePos) / av_get_channel_layout_nb_channels(mOutputChannelLayout) / ssize_t clock_delay = (mFrameSize-mFramePos) / av_get_channel_layout_nb_channels(mOutputChannelLayout) /
av_get_bytes_per_sample(mOutputSampleFormat); av_get_bytes_per_sample(mOutputSampleFormat);
return (size_t)(mAudioClock*mAVStream->codec->sample_rate) - clock_delay; return (size_t)(mAudioClock*mAudioContext->sample_rate) - clock_delay;
} }
std::string getStreamName() std::string getStreamName()
@ -61,7 +61,7 @@ namespace MWSound
virtual double getAudioClock() virtual double getAudioClock()
{ {
return (double)getSampleOffset()/(double)mAVStream->codec->sample_rate - return (double)getSampleOffset()/(double)mAudioContext->sample_rate -
MWBase::Environment::get().getSoundManager()->getTrackTimeDelay(mAudioTrack); MWBase::Environment::get().getSoundManager()->getTrackTimeDelay(mAudioTrack);
} }

@ -6,15 +6,9 @@
extern "C" extern "C"
{ {
#include <libavcodec/avcodec.h> #include <libavcodec/avcodec.h>
#include <libswresample/swresample.h> #include <libswresample/swresample.h>
#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(55,28,1)
#define av_frame_alloc avcodec_alloc_frame
#endif
} }
#include "videostate.hpp" #include "videostate.hpp"
@ -61,6 +55,7 @@ MovieAudioDecoder::MovieAudioDecoder(VideoState* videoState)
, mFrameData(NULL) , mFrameData(NULL)
, mDataBufLen(0) , mDataBufLen(0)
, mFrame(av_frame_alloc()) , mFrame(av_frame_alloc())
, mGetNextPacket(true)
, mAudioDiffAccum(0.0) , mAudioDiffAccum(0.0)
, mAudioDiffAvgCoef(exp(log(0.01 / AUDIO_DIFF_AVG_NB))) , mAudioDiffAvgCoef(exp(log(0.01 / AUDIO_DIFF_AVG_NB)))
/* Correct audio only if larger error than this */ /* Correct audio only if larger error than this */
@ -68,10 +63,34 @@ MovieAudioDecoder::MovieAudioDecoder(VideoState* videoState)
, mAudioDiffAvgCount(0) , mAudioDiffAvgCount(0)
{ {
mAudioResampler.reset(new AudioResampler()); mAudioResampler.reset(new AudioResampler());
AVCodec *codec = avcodec_find_decoder(mAVStream->codecpar->codec_id);
if(!codec)
{
std::string ss = "No codec found for id " +
std::to_string(mAVStream->codecpar->codec_id);
throw std::runtime_error(ss);
}
AVCodecContext *avctx = avcodec_alloc_context3(codec);
avcodec_parameters_to_context(avctx, mAVStream->codecpar);
// This is no longer needed as of FFmpeg 4.0
#if LIBAVCODEC_VERSION_INT < 3805796
av_codec_set_pkt_timebase(avctx, mAVStream->time_base);
#endif
mAudioContext = avctx;
if(avcodec_open2(mAudioContext, codec, nullptr) < 0)
throw std::runtime_error(std::string("Failed to open audio codec ") + codec->long_name);
} }
MovieAudioDecoder::~MovieAudioDecoder() MovieAudioDecoder::~MovieAudioDecoder()
{ {
if(mAudioContext)
avcodec_free_context(&mAudioContext);
av_freep(&mFrame); av_freep(&mFrame);
av_freep(&mDataBuf); av_freep(&mDataBuf);
} }
@ -81,13 +100,13 @@ void MovieAudioDecoder::setupFormat()
if (mAudioResampler->mSwr) if (mAudioResampler->mSwr)
return; // already set up return; // already set up
AVSampleFormat inputSampleFormat = mAVStream->codec->sample_fmt; AVSampleFormat inputSampleFormat = mAudioContext->sample_fmt;
uint64_t inputChannelLayout = mAVStream->codec->channel_layout; uint64_t inputChannelLayout = mAudioContext->channel_layout;
if (inputChannelLayout == 0) if (inputChannelLayout == 0)
inputChannelLayout = av_get_default_channel_layout(mAVStream->codec->channels); inputChannelLayout = av_get_default_channel_layout(mAudioContext->channels);
int inputSampleRate = mAVStream->codec->sample_rate; int inputSampleRate = mAudioContext->sample_rate;
mOutputSampleRate = inputSampleRate; mOutputSampleRate = inputSampleRate;
mOutputSampleFormat = inputSampleFormat; mOutputSampleFormat = inputSampleFormat;
@ -133,7 +152,7 @@ int MovieAudioDecoder::synchronize_audio()
{ {
int n = av_get_bytes_per_sample(mOutputSampleFormat) * int n = av_get_bytes_per_sample(mOutputSampleFormat) *
av_get_channel_layout_nb_channels(mOutputChannelLayout); av_get_channel_layout_nb_channels(mOutputChannelLayout);
sample_skip = ((int)(diff * mAVStream->codec->sample_rate) * n); sample_skip = ((int)(diff * mAudioContext->sample_rate) * n);
} }
} }
@ -146,23 +165,31 @@ int MovieAudioDecoder::audio_decode_frame(AVFrame *frame, int &sample_skip)
for(;;) for(;;)
{ {
while(pkt->size > 0) /* send the packet with the compressed data to the decoder */
{ int ret = 0;
int len1, got_frame; if (mGetNextPacket)
ret = avcodec_send_packet(mAudioContext, pkt);
len1 = avcodec_decode_audio4(mAVStream->codec, frame, &got_frame, pkt);
if(len1 < 0) break;
if(len1 <= pkt->size) /* read all the output frames (in general there may be any number of them */
while (ret >= 0)
{ {
/* Move the unread data to the front and clear the end bits */ ret = avcodec_receive_frame(mAudioContext, frame);
int remaining = pkt->size - len1; if (ret == AVERROR_EOF || ret == AVERROR(EAGAIN))
memmove(pkt->data, &pkt->data[len1], remaining); {
av_shrink_packet(pkt, remaining); // EAGAIN means that we need additional packages to decode this frame.
// AVERROR_EOF means the end of package.
mGetNextPacket = true;
break;
}
else if (ret < 0)
{
// Error encountered. Stop to decode audio stream.
av_packet_unref(&mPacket);
mGetNextPacket = true;
return -1;
} }
/* No data yet? Look for more frames */ if(frame->nb_samples <= 0)
if(!got_frame || frame->nb_samples <= 0)
continue; continue;
if(mAudioResampler->mSwr) if(mAudioResampler->mSwr)
@ -170,7 +197,7 @@ int MovieAudioDecoder::audio_decode_frame(AVFrame *frame, int &sample_skip)
if(!mDataBuf || mDataBufLen < frame->nb_samples) if(!mDataBuf || mDataBufLen < frame->nb_samples)
{ {
av_freep(&mDataBuf); av_freep(&mDataBuf);
if(av_samples_alloc(&mDataBuf, NULL, av_get_channel_layout_nb_channels(mOutputChannelLayout), if(av_samples_alloc(&mDataBuf, nullptr, av_get_channel_layout_nb_channels(mOutputChannelLayout),
frame->nb_samples, mOutputSampleFormat, 0) < 0) frame->nb_samples, mOutputSampleFormat, 0) < 0)
break; break;
else else
@ -187,14 +214,16 @@ int MovieAudioDecoder::audio_decode_frame(AVFrame *frame, int &sample_skip)
else else
mFrameData = &frame->data[0]; mFrameData = &frame->data[0];
mAudioClock += (double)frame->nb_samples / int result = frame->nb_samples * av_get_channel_layout_nb_channels(mOutputChannelLayout) *
(double)mAVStream->codec->sample_rate; av_get_bytes_per_sample(mOutputSampleFormat);
/* We have data, return it and come back for more later */ /* We have data, return it and come back for more later */
return frame->nb_samples * av_get_channel_layout_nb_channels(mOutputChannelLayout) * mGetNextPacket = false;
av_get_bytes_per_sample(mOutputSampleFormat); return result;
} }
av_free_packet(pkt);
av_packet_unref(&mPacket);
mGetNextPacket = true;
/* next packet */ /* next packet */
if(mVideoState->audioq.get(pkt, mVideoState) < 0) if(mVideoState->audioq.get(pkt, mVideoState) < 0)
@ -202,7 +231,7 @@ int MovieAudioDecoder::audio_decode_frame(AVFrame *frame, int &sample_skip)
if(pkt->data == mVideoState->mFlushPktData) if(pkt->data == mVideoState->mFlushPktData)
{ {
avcodec_flush_buffers(mAVStream->codec); avcodec_flush_buffers(mAudioContext);
mAudioDiffAccum = 0.0; mAudioDiffAccum = 0.0;
mAudioDiffAvgCount = 0; mAudioDiffAvgCount = 0;
mAudioClock = av_q2d(mAVStream->time_base)*pkt->pts; mAudioClock = av_q2d(mAVStream->time_base)*pkt->pts;

@ -11,11 +11,7 @@ extern "C"
#include <libavutil/avutil.h> #include <libavutil/avutil.h>
#include <libavcodec/avcodec.h> #include <libavcodec/avcodec.h>
#include <libavformat/avformat.h> #include <libavformat/avformat.h>
#if AV_VERSION_INT(52, 2, 0) <= AV_VERSION_INT(LIBAVUTIL_VERSION_MAJOR, \
LIBAVUTIL_VERSION_MINOR, LIBAVUTIL_VERSION_MICRO)
#include <libavutil/channel_layout.h> #include <libavutil/channel_layout.h>
#endif
} }
#if defined(_WIN32) && !defined(__MINGW32__) #if defined(_WIN32) && !defined(__MINGW32__)
@ -35,6 +31,7 @@ class MovieAudioDecoder
{ {
protected: protected:
VideoState *mVideoState; VideoState *mVideoState;
AVCodecContext* mAudioContext;
AVStream *mAVStream; AVStream *mAVStream;
enum AVSampleFormat mOutputSampleFormat; enum AVSampleFormat mOutputSampleFormat;
uint64_t mOutputChannelLayout; uint64_t mOutputChannelLayout;
@ -51,7 +48,7 @@ private:
throw std::bad_alloc(); throw std::bad_alloc();
} }
~AutoAVPacket() ~AutoAVPacket()
{ av_free_packet(this); } { av_packet_unref(this); }
}; };
@ -63,6 +60,7 @@ private:
AutoAVPacket mPacket; AutoAVPacket mPacket;
AVFrame *mFrame; AVFrame *mFrame;
bool mGetNextPacket;
/* averaging filter for audio sync */ /* averaging filter for audio sync */
double mAudioDiffAccum; double mAudioDiffAccum;

@ -11,19 +11,7 @@ extern "C"
#include <libavcodec/avcodec.h> #include <libavcodec/avcodec.h>
#include <libavformat/avformat.h> #include <libavformat/avformat.h>
#include <libswscale/swscale.h> #include <libswscale/swscale.h>
// From libavformat version 55.0.100 and onward the declaration of av_gettime() is
// removed from libavformat/avformat.h and moved to libavutil/time.h
// https://github.com/FFmpeg/FFmpeg/commit/06a83505992d5f49846c18507a6c3eb8a47c650e
#if AV_VERSION_INT(55, 0, 100) <= AV_VERSION_INT(LIBAVFORMAT_VERSION_MAJOR, \
LIBAVFORMAT_VERSION_MINOR, LIBAVFORMAT_VERSION_MICRO)
#include <libavutil/time.h> #include <libavutil/time.h>
#endif
#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(55,28,1)
#define av_frame_alloc avcodec_alloc_frame
#endif
} }
static const char* flushString = "FLUSH"; static const char* flushString = "FLUSH";
@ -54,6 +42,8 @@ namespace Video
VideoState::VideoState() VideoState::VideoState()
: mAudioFactory(NULL) : mAudioFactory(NULL)
, format_ctx(NULL) , format_ctx(NULL)
, video_ctx(NULL)
, audio_ctx(NULL)
, av_sync_type(AV_SYNC_DEFAULT) , av_sync_type(AV_SYNC_DEFAULT)
, audio_st(NULL) , audio_st(NULL)
, video_st(NULL), frame_last_pts(0.0) , video_st(NULL), frame_last_pts(0.0)
@ -67,8 +57,10 @@ VideoState::VideoState()
{ {
mFlushPktData = flush_pkt.data; mFlushPktData = flush_pkt.data;
// Register all formats and codecs // This is not needed anymore above FFMpeg version 4.0
#if LIBAVCODEC_VERSION_INT < 3805796
av_register_all(); av_register_all();
#endif
} }
VideoState::~VideoState() VideoState::~VideoState()
@ -85,11 +77,12 @@ void VideoState::setAudioFactory(MovieAudioFactory *factory)
void PacketQueue::put(AVPacket *pkt) void PacketQueue::put(AVPacket *pkt)
{ {
AVPacketList *pkt1; AVPacketList *pkt1;
if(pkt != &flush_pkt && !pkt->buf && av_dup_packet(pkt) < 0)
throw std::runtime_error("Failed to duplicate packet");
pkt1 = (AVPacketList*)av_malloc(sizeof(AVPacketList)); pkt1 = (AVPacketList*)av_malloc(sizeof(AVPacketList));
if(!pkt1) throw std::bad_alloc(); if(!pkt1) throw std::bad_alloc();
if(pkt != &flush_pkt && !pkt->buf && av_packet_ref(&pkt1->pkt, pkt) < 0)
throw std::runtime_error("Failed to duplicate packet");
pkt1->pkt = *pkt; pkt1->pkt = *pkt;
pkt1->next = NULL; pkt1->next = NULL;
@ -150,7 +143,7 @@ void PacketQueue::clear()
{ {
pkt1 = pkt->next; pkt1 = pkt->next;
if (pkt->pkt.data != flush_pkt.data) if (pkt->pkt.data != flush_pkt.data)
av_free_packet(&pkt->pkt); av_packet_unref(&pkt->pkt);
av_freep(&pkt); av_freep(&pkt);
} }
this->last_pkt = NULL; this->last_pkt = NULL;
@ -211,7 +204,7 @@ int64_t VideoState::istream_seek(void *user_data, int64_t offset, int whence)
void VideoState::video_display(VideoPicture *vp) void VideoState::video_display(VideoPicture *vp)
{ {
if((*this->video_st)->codec->width != 0 && (*this->video_st)->codec->height != 0) if(this->video_ctx->width != 0 && this->video_ctx->height != 0)
{ {
if (!mTexture.get()) if (!mTexture.get())
{ {
@ -224,7 +217,7 @@ void VideoState::video_display(VideoPicture *vp)
osg::ref_ptr<osg::Image> image = new osg::Image; osg::ref_ptr<osg::Image> image = new osg::Image;
image->setImage((*this->video_st)->codec->width, (*this->video_st)->codec->height, image->setImage(this->video_ctx->width, this->video_ctx->height,
1, GL_RGBA, GL_RGBA, GL_UNSIGNED_BYTE, &vp->data[0], osg::Image::NO_DELETE); 1, GL_RGBA, GL_RGBA, GL_UNSIGNED_BYTE, &vp->data[0], osg::Image::NO_DELETE);
mTexture->setImage(image); mTexture->setImage(image);
@ -303,9 +296,9 @@ int VideoState::queue_picture(AVFrame *pFrame, double pts)
// matches a commonly used format (ie YUV420P) // matches a commonly used format (ie YUV420P)
if(this->sws_context == NULL) if(this->sws_context == NULL)
{ {
int w = (*this->video_st)->codec->width; int w = this->video_ctx->width;
int h = (*this->video_st)->codec->height; int h = this->video_ctx->height;
this->sws_context = sws_getContext(w, h, (*this->video_st)->codec->pix_fmt, this->sws_context = sws_getContext(w, h, this->video_ctx->pix_fmt,
w, h, AV_PIX_FMT_RGBA, SWS_BICUBIC, w, h, AV_PIX_FMT_RGBA, SWS_BICUBIC,
NULL, NULL, NULL); NULL, NULL, NULL);
if(this->sws_context == NULL) if(this->sws_context == NULL)
@ -313,11 +306,11 @@ int VideoState::queue_picture(AVFrame *pFrame, double pts)
} }
vp->pts = pts; vp->pts = pts;
vp->data.resize((*this->video_st)->codec->width * (*this->video_st)->codec->height * 4); vp->data.resize(this->video_ctx->width * this->video_ctx->height * 4);
uint8_t *dst[4] = { &vp->data[0], nullptr, nullptr, nullptr }; uint8_t *dst[4] = { &vp->data[0], nullptr, nullptr, nullptr };
sws_scale(this->sws_context, pFrame->data, pFrame->linesize, sws_scale(this->sws_context, pFrame->data, pFrame->linesize,
0, (*this->video_st)->codec->height, dst, this->rgbaFrame->linesize); 0, this->video_ctx->height, dst, this->rgbaFrame->linesize);
// now we inform our display thread that we have a pic ready // now we inform our display thread that we have a pic ready
this->pictq_windex = (this->pictq_windex+1) % VIDEO_PICTURE_ARRAY_SIZE; this->pictq_windex = (this->pictq_windex+1) % VIDEO_PICTURE_ARRAY_SIZE;
@ -338,7 +331,7 @@ double VideoState::synchronize_video(AVFrame *src_frame, double pts)
pts = this->video_clock; pts = this->video_clock;
/* update the video clock */ /* update the video clock */
frame_delay = av_q2d((*this->video_st)->codec->time_base); frame_delay = av_q2d(this->video_ctx->pkt_timebase);
/* if we are repeating a frame, adjust clock accordingly */ /* if we are repeating a frame, adjust clock accordingly */
frame_delay += src_frame->repeat_pict * (frame_delay * 0.5); frame_delay += src_frame->repeat_pict * (frame_delay * 0.5);
@ -347,30 +340,6 @@ double VideoState::synchronize_video(AVFrame *src_frame, double pts)
return pts; return pts;
} }
static void our_free_buffer(void *opaque, uint8_t *data);
/* These are called whenever we allocate a frame
* buffer. We use this to store the global_pts in
* a frame at the time it is allocated.
*/
static int64_t global_video_pkt_pts = AV_NOPTS_VALUE;
static int our_get_buffer(struct AVCodecContext *c, AVFrame *pic, int flags)
{
AVBufferRef *ref;
int ret = avcodec_default_get_buffer2(c, pic, flags);
int64_t *pts = (int64_t*)av_malloc(sizeof(int64_t));
*pts = global_video_pkt_pts;
pic->opaque = pts;
ref = av_buffer_create((uint8_t *)pic->opaque, sizeof(int64_t), our_free_buffer, pic->buf[0], flags);
pic->buf[0] = ref;
return ret;
}
static void our_free_buffer(void *opaque, uint8_t *data)
{
AVBufferRef *ref = (AVBufferRef *)opaque;
av_buffer_unref(&ref);
av_free(data);
}
class VideoThread : public OpenThreads::Thread class VideoThread : public OpenThreads::Thread
{ {
public: public:
@ -384,19 +353,18 @@ public:
{ {
VideoState* self = mVideoState; VideoState* self = mVideoState;
AVPacket pkt1, *packet = &pkt1; AVPacket pkt1, *packet = &pkt1;
int frameFinished;
AVFrame *pFrame; AVFrame *pFrame;
pFrame = av_frame_alloc(); pFrame = av_frame_alloc();
self->rgbaFrame = av_frame_alloc(); self->rgbaFrame = av_frame_alloc();
avpicture_alloc((AVPicture*)self->rgbaFrame, AV_PIX_FMT_RGBA, (*self->video_st)->codec->width, (*self->video_st)->codec->height); av_image_alloc(self->rgbaFrame->data, self->rgbaFrame->linesize, self->video_ctx->width, self->video_ctx->height, AV_PIX_FMT_RGBA, 1);
while(self->videoq.get(packet, self) >= 0) while(self->videoq.get(packet, self) >= 0)
{ {
if(packet->data == flush_pkt.data) if(packet->data == flush_pkt.data)
{ {
avcodec_flush_buffers((*self->video_st)->codec); avcodec_flush_buffers(self->video_ctx);
self->pictq_mutex.lock(); self->pictq_mutex.lock();
self->pictq_size = 0; self->pictq_size = 0;
@ -405,37 +373,36 @@ public:
self->pictq_mutex.unlock(); self->pictq_mutex.unlock();
self->frame_last_pts = packet->pts * av_q2d((*self->video_st)->time_base); self->frame_last_pts = packet->pts * av_q2d((*self->video_st)->time_base);
global_video_pkt_pts = static_cast<int64_t>(self->frame_last_pts);
continue; continue;
} }
// Save global pts to be stored in pFrame
global_video_pkt_pts = packet->pts;
// Decode video frame // Decode video frame
if(avcodec_decode_video2((*self->video_st)->codec, pFrame, &frameFinished, packet) < 0) int ret = avcodec_send_packet(self->video_ctx, packet);
// EAGAIN is not expected
if (ret < 0)
throw std::runtime_error("Error decoding video frame"); throw std::runtime_error("Error decoding video frame");
double pts = 0; while (!ret)
if(packet->dts != AV_NOPTS_VALUE) {
pts = static_cast<double>(packet->dts); ret = avcodec_receive_frame(self->video_ctx, pFrame);
else if(pFrame->opaque && *(int64_t*)pFrame->opaque != AV_NOPTS_VALUE) if (!ret)
pts = static_cast<double>(*(int64_t*)pFrame->opaque); {
double pts = pFrame->best_effort_timestamp;
pts *= av_q2d((*self->video_st)->time_base); pts *= av_q2d((*self->video_st)->time_base);
av_free_packet(packet);
// Did we get a video frame?
if(frameFinished)
{
pts = self->synchronize_video(pFrame, pts); pts = self->synchronize_video(pFrame, pts);
if(self->queue_picture(pFrame, pts) < 0) if(self->queue_picture(pFrame, pts) < 0)
break; break;
} }
} }
}
av_packet_unref(packet);
av_free(pFrame); av_free(pFrame);
avpicture_free((AVPicture*)self->rgbaFrame); av_freep(&self->rgbaFrame->data[0]);
av_free(self->rgbaFrame); av_free(self->rgbaFrame);
} }
@ -497,7 +464,14 @@ public:
// AVSEEK_FLAG_BACKWARD appears to be needed, otherwise ffmpeg may seek to a keyframe *after* the given time // AVSEEK_FLAG_BACKWARD appears to be needed, otherwise ffmpeg may seek to a keyframe *after* the given time
// we want to seek to any keyframe *before* the given time, so we can continue decoding as normal from there on // we want to seek to any keyframe *before* the given time, so we can continue decoding as normal from there on
if(av_seek_frame(self->format_ctx, streamIndex, timestamp, AVSEEK_FLAG_BACKWARD) < 0) if(av_seek_frame(self->format_ctx, streamIndex, timestamp, AVSEEK_FLAG_BACKWARD) < 0)
{
// In FFmpeg 4.0 the "filename" field was replaced by "url"
#if LIBAVCODEC_VERSION_INT < 3805796
std::cerr << "Error seeking " << self->format_ctx->filename << std::endl; std::cerr << "Error seeking " << self->format_ctx->filename << std::endl;
#else
std::cerr << "Error seeking " << self->format_ctx->url << std::endl;
#endif
}
else else
{ {
// Clear the packet queues and put a special packet with the new clock time // Clear the packet queues and put a special packet with the new clock time
@ -548,7 +522,7 @@ public:
else if(self->audio_st && packet->stream_index == self->audio_st-pFormatCtx->streams) else if(self->audio_st && packet->stream_index == self->audio_st-pFormatCtx->streams)
self->audioq.put(packet); self->audioq.put(packet);
else else
av_free_packet(packet); av_packet_unref(packet);
} }
} }
catch(std::exception& e) { catch(std::exception& e) {
@ -572,30 +546,43 @@ bool VideoState::update()
int VideoState::stream_open(int stream_index, AVFormatContext *pFormatCtx) int VideoState::stream_open(int stream_index, AVFormatContext *pFormatCtx)
{ {
AVCodecContext *codecCtx;
AVCodec *codec; AVCodec *codec;
if(stream_index < 0 || stream_index >= static_cast<int>(pFormatCtx->nb_streams)) if(stream_index < 0 || stream_index >= static_cast<int>(pFormatCtx->nb_streams))
return -1; return -1;
// Get a pointer to the codec context for the video stream // Get a pointer to the codec context for the video stream
codecCtx = pFormatCtx->streams[stream_index]->codec; codec = avcodec_find_decoder(pFormatCtx->streams[stream_index]->codecpar->codec_id);
codec = avcodec_find_decoder(codecCtx->codec_id); if(!codec)
if(!codec || (avcodec_open2(codecCtx, codec, NULL) < 0))
{ {
fprintf(stderr, "Unsupported codec!\n"); fprintf(stderr, "Unsupported codec!\n");
return -1; return -1;
} }
switch(codecCtx->codec_type) switch(pFormatCtx->streams[stream_index]->codecpar->codec_type)
{ {
case AVMEDIA_TYPE_AUDIO: case AVMEDIA_TYPE_AUDIO:
this->audio_st = pFormatCtx->streams + stream_index; this->audio_st = pFormatCtx->streams + stream_index;
// Allocate a codec context for the audio stream
this->audio_ctx = avcodec_alloc_context3(codec);
avcodec_parameters_to_context(this->audio_ctx, pFormatCtx->streams[stream_index]->codecpar);
// Setting the packet timebase explicitly is only needed before FFmpeg 4.0 (libavcodec 58.18.100)
#if LIBAVCODEC_VERSION_INT < 3805796
av_codec_set_pkt_timebase(this->audio_ctx, pFormatCtx->streams[stream_index]->time_base);
#endif
if (avcodec_open2(this->audio_ctx, codec, NULL) < 0)
{
fprintf(stderr, "Unsupported codec!\n");
return -1;
}
if (!mAudioFactory) if (!mAudioFactory)
{ {
std::cerr << "No audio factory registered, can not play audio stream" << std::endl; std::cerr << "No audio factory registered, can not play audio stream" << std::endl;
avcodec_close((*this->audio_st)->codec); avcodec_free_context(&this->audio_ctx);
this->audio_st = NULL; this->audio_st = NULL;
return -1; return -1;
} }
@ -604,7 +591,7 @@ int VideoState::stream_open(int stream_index, AVFormatContext *pFormatCtx)
if (!mAudioDecoder.get()) if (!mAudioDecoder.get())
{ {
std::cerr << "Failed to create audio decoder, can not play audio stream" << std::endl; std::cerr << "Failed to create audio decoder, can not play audio stream" << std::endl;
avcodec_close((*this->audio_st)->codec); avcodec_free_context(&this->audio_ctx);
this->audio_st = NULL; this->audio_st = NULL;
return -1; return -1;
} }
@ -614,7 +601,21 @@ int VideoState::stream_open(int stream_index, AVFormatContext *pFormatCtx)
case AVMEDIA_TYPE_VIDEO: case AVMEDIA_TYPE_VIDEO:
this->video_st = pFormatCtx->streams + stream_index; this->video_st = pFormatCtx->streams + stream_index;
codecCtx->get_buffer2 = our_get_buffer; // Get a pointer to the codec context for the video stream
this->video_ctx = avcodec_alloc_context3(codec);
avcodec_parameters_to_context(this->video_ctx, pFormatCtx->streams[stream_index]->codecpar);
// Setting the packet timebase explicitly is only needed before FFmpeg 4.0 (libavcodec 58.18.100)
#if LIBAVCODEC_VERSION_INT < 3805796
av_codec_set_pkt_timebase(this->video_ctx, pFormatCtx->streams[stream_index]->time_base);
#endif
if (avcodec_open2(this->video_ctx, codec, NULL) < 0)
{
fprintf(stderr, "Unsupported codec!\n");
return -1;
}
this->video_thread.reset(new VideoThread(this)); this->video_thread.reset(new VideoThread(this));
break; break;
@ -680,9 +681,9 @@ void VideoState::init(std::shared_ptr<std::istream> inputstream, const std::stri
for(i = 0;i < this->format_ctx->nb_streams;i++) for(i = 0;i < this->format_ctx->nb_streams;i++)
{ {
if(this->format_ctx->streams[i]->codec->codec_type == AVMEDIA_TYPE_VIDEO && video_index < 0) if(this->format_ctx->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_VIDEO && video_index < 0)
video_index = i; video_index = i;
if(this->format_ctx->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO && audio_index < 0) if(this->format_ctx->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_AUDIO && audio_index < 0)
audio_index = i; audio_index = i;
} }
@ -720,12 +721,14 @@ void VideoState::deinit()
this->video_thread.reset(); this->video_thread.reset();
} }
if(this->audio_st) if(this->audio_ctx)
avcodec_close((*this->audio_st)->codec); avcodec_free_context(&this->audio_ctx);
this->audio_st = NULL; this->audio_st = NULL;
if(this->video_st) this->audio_ctx = NULL;
avcodec_close((*this->video_st)->codec); if(this->video_ctx)
avcodec_free_context(&this->video_ctx);
this->video_st = NULL; this->video_st = NULL;
this->video_ctx = NULL;
if(this->sws_context) if(this->sws_context)
sws_freeContext(this->sws_context); sws_freeContext(this->sws_context);

@ -15,6 +15,19 @@ namespace osg
class Texture2D; class Texture2D;
} }
extern "C"
{
#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libavutil/imgutils.h>
#include <libavutil/channel_layout.h>
// From version 54.56 binkaudio encoding format changed from S16 to FLTP. See:
// https://gitorious.org/ffmpeg/ffmpeg/commit/7bfd1766d1c18f07b0a2dd042418a874d49ea60d
// https://ffmpeg.zeranoe.com/forum/viewtopic.php?f=15&t=872
#include <libswresample/swresample.h>
}
#include "videodefs.hpp" #include "videodefs.hpp"
#define VIDEO_PICTURE_QUEUE_SIZE 50 #define VIDEO_PICTURE_QUEUE_SIZE 50
@ -131,6 +144,8 @@ struct VideoState {
std::shared_ptr<std::istream> stream; std::shared_ptr<std::istream> stream;
AVFormatContext* format_ctx; AVFormatContext* format_ctx;
AVCodecContext* video_ctx;
AVCodecContext* audio_ctx;
int av_sync_type; int av_sync_type;

Loading…
Cancel
Save