More FFmpeg backend code.

MikuAuahDark · Jun 11, 2024 · 0a2e8f7 · 0a2e8f7
1 parent b846926
commit 0a2e8f7
Show file tree

Hide file tree

Showing 3 changed files with 163 additions and 64 deletions.
diff --git a/src/nav_backend_ffmpeg.cpp b/src/nav_backend_ffmpeg.cpp
@@ -2,6 +2,7 @@
 
 #ifdef NAV_BACKEND_FFMPEG
 
+#include <numeric>
 #include <stdexcept>
 #include <string>
 #include <tuple>
@@ -367,6 +368,35 @@ static std::tuple<nav_pixelformat, AVPixelFormat> getBestPixelFormat(AVPixelForm
 	}
 }
 
+/**
+ * Convert the fraction num/den to a double.
+ * Returns dv0 when den is zero; otherwise both terms are divided by their
+ * greatest common divisor before the floating-point division takes place.
+ */
+template<typename T>
+double derationalize(T num, T den, double dv0 = 0.0)
+{
+	if (den != 0)
+	{
+		const T divisor = std::gcd(num, den);
+		return double(num / divisor) / double(den / divisor);
+	}
+
+	return dv0;
+}
+
+/// AVRational convenience overload: passes r.num and r.den on with the same dv0 fallback.
+inline double derationalize(const AVRational &r, double dv0 = 0.0)
+{
+	const auto numerator = r.num;
+	const auto denominator = r.den;
+	return derationalize(numerator, denominator, dv0);
+}
+
+/**
+ * Split a packed FFmpeg version integer into a (major, minor) tuple.
+ * AV_VERSION_INT(a, b, c) packs the value as a << 16 | b << 8 | c, so the
+ * major number is everything above bit 15 and the minor number is the byte
+ * at bits 8..15. The micro byte (bits 0..7) is not returned.
+ */
+constexpr std::tuple<unsigned int, unsigned int> extractVersion(unsigned int ver)
+{
+	// The minor must be shifted by 8, not 16; shifting by 16 would yield the low byte of the major.
+	return std::make_tuple(ver >> 16, (ver >> 8) & 0xFF);
+}
+
+/**
+ * Compare a packed version known at compile time with one obtained at run time.
+ * `ver` is the compile-time packed version; `func` is called once and its
+ * result is treated as the run-time packed version. The check passes when the
+ * major numbers are identical and the run-time minor number is not lower than
+ * the compile-time minor number.
+ */
+template<unsigned int ver>
+bool isVersionCompatible(unsigned int(*func)())
+{
+	constexpr auto expected = extractVersion(ver);
+	const auto [loadedMajor, loadedMinor] = extractVersion(func());
+
+	if (loadedMajor != std::get<0>(expected))
+		return false;
+
+	return loadedMinor >= std::get<1>(expected);
+}
+
 namespace nav::ffmpeg
 {
 
@@ -386,81 +416,124 @@ FFmpegState::FFmpegState(FFmpegBackend *backend, UniqueAVFormatContext &formatCo
 		nav_streaminfo_t sinfo = {NAV_STREAMTYPE_UNKNOWN};
 		AVStream *stream = formatContext->streams[i];
 		const AVCodec *codec = nullptr;
-		// UniqueAVCodecContext codecContext(nullptr, {avcodec_free_context});
 		AVCodecContext *codecContext = nullptr;
 		SwsContext *rescaler = nullptr;
 		SwrContext *resampler = nullptr;
+		bool good = true;
 
 		switch (stream->codecpar->codec_type)
 		{
 			case AVMEDIA_TYPE_AUDIO:
 			case AVMEDIA_TYPE_VIDEO:
 			{
-				codec = avcodec_find_decoder(stream->codecpar->codec_id);
-				if (!codec)
-				{
-					stream->discard = AVDISCARD_ALL;
-					break;
-				}
+				codec = f->avcodec_find_decoder(stream->codecpar->codec_id);
+				good = codec != nullptr;
 
-				codecContext = avcodec_alloc_context3(codec);
-				if (!codecContext)
+				if (good)
 				{
-					stream->discard = AVDISCARD_ALL;
-					break;
+					codecContext = f->avcodec_alloc_context3(codec);
+					good = codecContext;
 				}
 
-				if (avcodec_parameters_to_context(codecContext, stream->codecpar) < 0)
-				{
-					avcodec_free_context(&codecContext);
-					stream->discard = AVDISCARD_ALL;
-					break;
-				}
+				if (good)
+					good = avcodec_parameters_to_context(codecContext, stream->codecpar) >= 0;
 
-				if (!avcodec_open2(codecContext, codec, nullptr))
-				{
-					avcodec_free_context(&codecContext);
-					stream->discard = AVDISCARD_ALL;
-					break;
-				}
+				if (good)
+					good = f->avcodec_open2(codecContext, codec, nullptr) >= 0;
 
-				if (stream->codecpar->codec_type == AVMEDIA_TYPE_AUDIO)
-				{
-					// Audio stream
-					sinfo.audio.format = audioFormatFromAVSampleFormat(
-						getPackedFormatOf((AVSampleFormat) stream->codecpar->format)
-					);
-					sinfo.audio.sample_rate = stream->codecpar->sample_rate;
-					sinfo.audio.nchannels = stream->codecpar->ch_layout.nb_channels;
-					sinfo.type = NAV_STREAMTYPE_AUDIO;
-				}
-				else
+				if (good)
 				{
-					AVPixelFormat originalFormat = (AVPixelFormat) stream->codecpar->format;
-					AVPixelFormat rescaleFormat = originalFormat;
-					std::tie(sinfo.video.format, rescaleFormat) = getBestPixelFormat(originalFormat);
-
-					if (originalFormat != rescaleFormat)
+					if (stream->codecpar->codec_type == AVMEDIA_TYPE_AUDIO)
 					{
-						// Need to rescale
+						AVSampleFormat originalFormat = (AVSampleFormat) stream->codecpar->format;
+						AVSampleFormat packedFormat = getPackedFormatOf(originalFormat);
+						if (packedFormat != originalFormat)
+						{
+							// Need to resample
+							good = f->swr_alloc_set_opts2(
+								&resampler,
+								&stream->codecpar->ch_layout,
+								packedFormat,
+								stream->codecpar->sample_rate,
+								&stream->codecpar->ch_layout,
+								originalFormat,
+								stream->codecpar->sample_rate,
+								0, nullptr
+							) >= 0;
+						}
+
+						if (good)
+						{
+							// Audio stream
+							sinfo.audio.format = audioFormatFromAVSampleFormat(packedFormat);
+							sinfo.audio.sample_rate = stream->codecpar->sample_rate;
+							sinfo.audio.nchannels = stream->codecpar->ch_layout.nb_channels;
+							sinfo.type = NAV_STREAMTYPE_AUDIO;
+						}
+					}
+					else
+					{
+						AVPixelFormat originalFormat = (AVPixelFormat) stream->codecpar->format;
+						AVPixelFormat rescaleFormat = originalFormat;
+						std::tie(sinfo.video.format, rescaleFormat) = getBestPixelFormat(originalFormat);
+
+						if (originalFormat != rescaleFormat)
+						{
+							// Need to rescale
+							rescaler = f->sws_getContext(
+								stream->codecpar->width,
+								stream->codecpar->height,
+								originalFormat,
+								stream->codecpar->width,
+								stream->codecpar->height,
+								rescaleFormat,
+								SWS_BICUBIC, nullptr, nullptr, nullptr
+							);
+							good = rescaler != nullptr;
+						}
+
+						if (good)
+						{
+							// Video stream
+							sinfo.type = NAV_STREAMTYPE_VIDEO;
+							sinfo.video.width = (uint32_t) stream->codecpar->width;
+							sinfo.video.height = (uint32_t) stream->codecpar->height;
+							sinfo.video.fps = derationalize(stream->avg_frame_rate);
+							// sinfo.video.format is already set
+						}
 					}
-
-					// Video stream
-					sinfo.type = NAV_STREAMTYPE_VIDEO;
 				}
 			}
 			default:
-				stream->discard = AVDISCARD_ALL;
+				good = false;
 				break;
 		}
 
+		if (!good)
+		{
+			stream->discard = AVDISCARD_ALL;
+			f->avcodec_free_context(&codecContext);
+			f->swr_free(&resampler);
+			f->sws_freeContext(rescaler); rescaler = nullptr;
+		}
+
 		streamInfo.push_back(sinfo);
 		decoders.push_back(codecContext);
 		resamplers.push_back(resampler);
 		rescalers.push_back(rescaler);
 	}
 }
 
+/**
+ * Release the per-stream objects collected by the constructor: codec
+ * contexts first, then audio resamplers, then video rescalers.
+ * Entries may be null (the constructor pushes nullptr for streams that have
+ * no resampler/rescaler). NOTE(review): this relies on the FFmpeg free
+ * functions tolerating null arguments -- confirm against the FFmpeg docs.
+ */
+FFmpegState::~FFmpegState()
+{
+	for (auto &codecContext: decoders)
+	{
+		f->avcodec_free_context(&codecContext);
+	}
+
+	for (auto &swr: resamplers)
+	{
+		f->swr_free(&swr);
+	}
+
+	for (auto *sws: rescalers)
+	{
+		f->sws_freeContext(sws);
+	}
+}
+
 size_t FFmpegState::getStreamCount() noexcept
 {
 	return formatContext->nb_streams;
@@ -470,17 +543,30 @@ FFmpegBackend::FFmpegBackend()
 : avutil(getLibName("avutil", LIBAVUTIL_VERSION_MAJOR))
 , avcodec(getLibName("avcodec", LIBAVCODEC_VERSION_MAJOR))
 , avformat(getLibName("avformat", LIBAVFORMAT_VERSION_MAJOR))
+, swresample(getLibName("swresample", LIBSWRESAMPLE_VERSION_MAJOR))
+, swscale(getLibName("swscale", LIBSWSCALE_VERSION_MAJOR))
+#define _NAV_PROXY_FUNCTION_POINTER_FFMPEG(lib, n) , n(nullptr)
+#include "nav_backend_ffmpeg_funcptr.h"
+#undef _NAV_PROXY_FUNCTION_POINTER_FFMPEG
 {
 	if (
-		!avformat.get("avformat_alloc_context", &avformat_alloc_context) ||
-		!avformat.get("avformat_find_stream_info", &avformat_find_stream_info) ||
-		!avformat.get("avformat_free_context", &avformat_free_context) ||
-		!avformat.get("avformat_open_input", &avformat_open_input) ||
-		!avformat.get("avio_context_free", &avio_context_free) ||
-		!avutil.get("av_malloc", &av_malloc) ||
-		!avutil.get("av_strerror", &av_strerror)
+#define _NAV_PROXY_FUNCTION_POINTER_FFMPEG(lib, n) !lib.get(#n, &n) ||
+#include "nav_backend_ffmpeg_funcptr.h"
+#undef _NAV_PROXY_FUNCTION_POINTER_FFMPEG
+		!true // needed to fix the preprocessor stuff
 	)
 		throw std::runtime_error("Cannot load FFmpeg function pointer");
+
+	if (!isVersionCompatible<LIBAVCODEC_VERSION_INT>(avcodec_version))
+		throw std::runtime_error("avcodec version mismatch");
+	if (!isVersionCompatible<LIBAVFORMAT_VERSION_INT>(avformat_version))
+		throw std::runtime_error("avformat version mismatch");
+	if (!isVersionCompatible<LIBAVUTIL_VERSION_INT>(avutil_version))
+		throw std::runtime_error("avutil version mismatch");
+	if (!isVersionCompatible<LIBSWRESAMPLE_VERSION_INT>(swresample_version))
+		throw std::runtime_error("swresample version mismatch");
+	if (!isVersionCompatible<LIBSWSCALE_VERSION_INT>(swscale_version))
+		throw std::runtime_error("swscale version mismatch");
 }
 
 FFmpegBackend::~FFmpegBackend()

diff --git a/src/nav_backend_ffmpeg_funcptr.h b/src/nav_backend_ffmpeg_funcptr.h
@@ -0,0 +1,21 @@
+// X-macro list of the FFmpeg functions used by the backend.
+// Each includer defines _NAV_PROXY_FUNCTION_POINTER_FFMPEG(lib, n) before
+// including this file and #undefs it afterwards. `lib` is the DynLib member
+// the symbol is looked up in and `n` is the function name. The file is
+// included several times with different macro definitions (member
+// declaration, nullptr initialisation, symbol loading), so it must not
+// carry an include guard.
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avutil, av_malloc)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avutil, av_strerror)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avutil, avutil_version)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_alloc_context3)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_find_decoder)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_free_context)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_open2)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_parameters_to_context)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avcodec, avcodec_version)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avformat_alloc_context)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avformat_find_stream_info)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avformat_free_context)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avformat_open_input)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avio_context_free)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(avformat, avformat_version)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swresample, swr_alloc_set_opts2)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swresample, swr_free)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swresample, swresample_version)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swscale, sws_getContext)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swscale, sws_freeContext)
+_NAV_PROXY_FUNCTION_POINTER_FFMPEG(swscale, swscale_version)
diff --git a/src/nav_backend_ffmpeg_internal.hpp b/src/nav_backend_ffmpeg_internal.hpp
@@ -73,19 +73,11 @@ class FFmpegBackend: public Backend
 private:
 	friend class FFmpegState;
 
-	DynLib avutil, avcodec, avformat;
-
-#define _NAV_PROXY_FUNCTION_POINTER(n) decltype(n) *n
-	// avformat
-	_NAV_PROXY_FUNCTION_POINTER(avformat_alloc_context);
-	_NAV_PROXY_FUNCTION_POINTER(avformat_find_stream_info);
-	_NAV_PROXY_FUNCTION_POINTER(avformat_free_context);
-	_NAV_PROXY_FUNCTION_POINTER(avformat_open_input);
-	_NAV_PROXY_FUNCTION_POINTER(avio_context_free);
-	// avutil
-	_NAV_PROXY_FUNCTION_POINTER(av_malloc);
-	_NAV_PROXY_FUNCTION_POINTER(av_strerror);
-#undef _NAV_PROXY_FUNCTION_POINTER
+	DynLib avutil, avcodec, avformat, swscale, swresample;
+
+#define _NAV_PROXY_FUNCTION_POINTER_FFMPEG(lib, n) decltype(n) *n;
+#include "nav_backend_ffmpeg_funcptr.h"
+#undef _NAV_PROXY_FUNCTION_POINTER_FFMPEG
 };
 
 }