10#include <QtCore/qloggingcategory.h>
11#include <QtCore/qoperatingsystemversion.h>
12#include <QtCore/private/qexpected_p.h>
15#include "libavutil/display.h"
16#include "libavutil/pixdesc.h"
21namespace ranges = QtMultimediaPrivate::ranges;
22using namespace Qt::Literals;
30AVCodecID avCodecID(
const QMediaEncoderSettings &settings)
32 const QMediaFormat::VideoCodec qVideoCodec = settings.videoCodec();
33 return QFFmpegMediaFormatInfo::codecIdForVideoCodec(qVideoCodec);
38VideoFrameEncoderUPtr
VideoFrameEncoder::create(
const QMediaEncoderSettings &encoderSettings,
40 AVFormatContext *formatContext)
42 Q_ASSERT(isSwPixelFormat(sourceParams.swFormat));
43 Q_ASSERT(isHwPixelFormat(sourceParams.format) || sourceParams.swFormat == sourceParams.format);
45 AVStream *stream = createStream(sourceParams, formatContext);
50 CreationResult result;
52 auto findAndOpenAVEncoder = [&](
const auto &scoresGetter,
const auto &creator) {
53 auto createWithTargetFormatFallback = [&](
const Codec &codec) {
54 result = creator(codec, AVPixelFormatSet{});
58 if (!result.encoder) {
59 const auto targetFormatDesc = av_pix_fmt_desc_get(result.targetFormat);
60 const bool is420TargetFormat = targetFormatDesc
61 && targetFormatDesc->log2_chroma_h == 1
62 && targetFormatDesc->log2_chroma_w == 1;
63 if (is420TargetFormat && result.targetFormat != AV_PIX_FMT_NV12)
64 result = creator(codec, AVPixelFormatSet{ result.targetFormat });
67 return result.encoder !=
nullptr;
69 return QFFmpeg::findAndOpenAVEncoder(avCodecID(encoderSettings), scoresGetter,
70 createWithTargetFormatFallback);
74 const auto &deviceTypes = HWAccel::encodingDeviceTypes();
76 auto findDeviceType = [&](
const Codec &codec) {
77 std::optional<AVPixelFormat> pixelFormat = findAVPixelFormat(codec, &isHwPixelFormat);
79 return deviceTypes.end();
82 if (QOperatingSystemVersion::current() < QOperatingSystemVersion::MacOSSequoia
83 && codec.name() ==
"hevc_videotoolbox"_L1) {
84 return ranges::find_if(deviceTypes, [&](AVHWDeviceType deviceType) {
85 return pixelFormatForHwDevice(deviceType) == pixelFormat;
90 const AVCodecHWConfig *cfg = codec.hwConfigForPixelFormat(*pixelFormat);
92 return deviceTypes.end();
94 bool supportsHwDeviceContext =
95 (cfg->methods & AV_CODEC_HW_CONFIG_METHOD_HW_DEVICE_CTX) != 0;
96 if (!supportsHwDeviceContext)
97 return deviceTypes.end();
99 return ranges::find_if(deviceTypes, [&](AVHWDeviceType deviceType) {
100 return pixelFormatForHwDevice(deviceType) == pixelFormat;
104 findAndOpenAVEncoder(
105 [&](
const Codec &codec) {
106 const auto found = findDeviceType(codec);
107 if (found == deviceTypes.end())
108 return NotSuitableAVScore;
110 return DefaultAVScore -
static_cast<AVScore>(found - deviceTypes.begin());
112 [&](
const Codec &codec,
const AVPixelFormatSet &prohibitedTargetFormats) {
113 HWAccelUPtr hwAccel = HWAccel::create(*findDeviceType(codec));
115 return CreationResult{};
116 if (!hwAccel->matchesSizeContraints(encoderSettings.videoResolution()))
117 return CreationResult{};
118 return create(stream, codec, std::move(hwAccel), sourceParams, encoderSettings,
119 prohibitedTargetFormats);
123 if (!result.encoder) {
124 findAndOpenAVEncoder(
125 [&](
const Codec &codec) {
126 return findSWFormatScores(codec, sourceParams.swFormat);
128 [&](
const Codec &codec,
const AVPixelFormatSet &prohibitedTargetFormats) {
129 return create(stream, codec,
nullptr, sourceParams, encoderSettings,
130 prohibitedTargetFormats);
134 if (
auto &encoder = result.encoder)
135 qCDebug(qLcVideoFrameEncoder)
136 <<
"found" << (encoder->m_accel ?
"hw" :
"sw") <<
"encoder"
137 << encoder->m_codec.name() <<
"for id" << encoder->m_codec.id();
139 qCWarning(qLcVideoFrameEncoder) <<
"No valid video codecs found";
141 return std::move(result.encoder);
146 const QMediaEncoderSettings &encoderSettings)
147 : m_settings(encoderSettings),
150 m_accel(std::move(hwAccel)),
151 m_sourceSize(sourceParams.size),
152 m_sourceFormat(sourceParams.format),
153 m_sourceSWFormat(sourceParams.swFormat)
158 AVFormatContext *formatContext)
160 AVStream *stream = avformat_new_stream(formatContext,
nullptr);
165 stream->id = formatContext->nb_streams - 1;
166 stream->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
168 stream->codecpar->color_trc = sourceParams.colorTransfer;
169 stream->codecpar->color_space = sourceParams.colorSpace;
170 stream->codecpar->color_range = sourceParams.colorRange;
172 if (sourceParams.transform.rotation != QtVideo::Rotation::None || sourceParams.transform.mirroredHorizontallyAfterRotation) {
173 constexpr auto displayMatrixSize =
sizeof(int32_t) * 9;
174 AVPacketSideData sideData = {
reinterpret_cast<uint8_t *>(av_malloc(displayMatrixSize)),
175 displayMatrixSize, AV_PKT_DATA_DISPLAYMATRIX };
176 int32_t *matrix =
reinterpret_cast<int32_t *>(sideData.data);
177 av_display_rotation_set(matrix,
static_cast<
double>(sourceParams.transform.rotation));
178 if (sourceParams.transform.mirroredHorizontallyAfterRotation)
179 av_display_matrix_flip(matrix, sourceParams.transform.mirroredHorizontallyAfterRotation,
false);
181 addStreamSideData(stream, sideData);
190 const QMediaEncoderSettings &encoderSettings,
191 const AVPixelFormatSet &prohibitedTargetFormats)
194 sourceParams, encoderSettings));
195 frameEncoder->initTargetSize();
197 frameEncoder->initCodecFrameRate();
199 if (!frameEncoder->initTargetFormats(prohibitedTargetFormats))
202 frameEncoder->initStream();
204 const AVPixelFormat targetFormat = frameEncoder->m_targetFormat;
206 if (!frameEncoder->initCodecContext())
207 return {
nullptr, targetFormat };
209 if (!frameEncoder->open())
210 return {
nullptr, targetFormat };
212 frameEncoder->updateConversions();
214 return {
std::move(frameEncoder), targetFormat };
219 m_targetSize = adjustVideoResolution(m_codec, m_settings.videoResolution());
223 if (m_codec.name() == u"h264_mf") {
224 auto makeEven = [](
int size) {
return size & ~1; };
225 const QSize fixedSize(makeEven(m_targetSize.width()), makeEven(m_targetSize.height()));
226 if (fixedSize != m_targetSize) {
227 qCDebug(qLcVideoFrameEncoder) <<
"Fix odd video resolution for codec" << m_codec.name()
228 <<
":" << m_targetSize <<
"->" << fixedSize;
229 m_targetSize = fixedSize;
237 const auto frameRates = m_codec.frameRates();
238 if (qLcVideoFrameEncoder().isEnabled(QtDebugMsg))
239 for (AVRational rate : frameRates)
240 qCDebug(qLcVideoFrameEncoder) <<
"supported frame rate:" << rate;
242 m_codecFrameRate = adjustFrameRate(frameRates, m_settings.videoFrameRate());
243 qCDebug(qLcVideoFrameEncoder) <<
"Adjusted frame rate:" << m_codecFrameRate;
246bool VideoFrameEncoder::initTargetFormats(
const AVPixelFormatSet &prohibitedTargetFormats)
248 const auto format = findTargetFormat(m_sourceFormat, m_sourceSWFormat, m_codec, m_accel.get(),
249 prohibitedTargetFormats);
252 qWarning() <<
"Could not find target format for codecId" << m_codec.id();
256 m_targetFormat = *format;
258 if (isHwPixelFormat(m_targetFormat)) {
263 const auto swFormat = findTargetSWFormat(m_sourceSWFormat, m_codec, *m_accel);
265 qWarning() <<
"Cannot find software target format. sourceSWFormat:" << m_sourceSWFormat
266 <<
"targetFormat:" << m_targetFormat;
270 m_targetSWFormat = *swFormat;
272 m_accel->createFramesContext(m_targetSWFormat, m_targetSize);
273 if (!m_accel->hwFramesContextAsBuffer())
276 m_targetSWFormat = m_targetFormat;
286 m_stream->codecpar->codec_id = m_codec.id();
290 if (m_codec.id() == AV_CODEC_ID_HEVC)
291 m_stream->codecpar->codec_tag = MKTAG(
'h',
'v',
'c',
'1');
293 m_stream->codecpar->codec_tag = 0;
296 m_stream->codecpar->format = m_targetFormat;
297 m_stream->codecpar->width = m_targetSize.width();
298 m_stream->codecpar->height = m_targetSize.height();
299 m_stream->codecpar->sample_aspect_ratio = AVRational{ 1, 1 };
300#if QT_CODEC_PARAMETERS_HAVE_FRAMERATE
301 m_stream->codecpar->framerate = m_codecFrameRate;
304 const auto frameRates = m_codec.frameRates();
305 m_stream->time_base = adjustFrameTimeBase(frameRates, m_codecFrameRate);
310 Q_ASSERT(m_stream->codecpar->codec_id);
312 m_codecContext.reset(avcodec_alloc_context3(m_codec.get()));
313 if (!m_codecContext) {
314 qWarning() <<
"Could not allocate codec context";
319 avcodec_parameters_to_context(m_codecContext.get(), m_stream->codecpar);
320#if !QT_CODEC_PARAMETERS_HAVE_FRAMERATE
321 m_codecContext->framerate = m_codecFrameRate;
323 m_codecContext->time_base = m_stream->time_base;
324 qCDebug(qLcVideoFrameEncoder) <<
"codecContext time base" << m_codecContext->time_base.num
325 << m_codecContext->time_base.den;
328 auto deviceContext = m_accel->hwDeviceContextAsBuffer();
329 Q_ASSERT(deviceContext);
330 m_codecContext->hw_device_ctx = av_buffer_ref(deviceContext);
332 if (
auto framesContext = m_accel->hwFramesContextAsBuffer())
333 m_codecContext->hw_frames_ctx = av_buffer_ref(framesContext);
336 avcodec_parameters_from_context(m_stream->codecpar, m_codecContext.get());
343 Q_ASSERT(m_codecContext);
345 AVDictionaryHolder opts;
346 applyVideoEncoderOptions(m_settings, m_codec.name(), m_codecContext.get(), opts);
347 applyExperimentalCodecOptions(m_codec, opts);
349 qCDebug(qLcVideoFrameEncoder) <<
"Opening encoder" << m_codec.name() <<
"with" << opts;
351 const int res = avcodec_open2(m_codecContext.get(), m_codec.get(), opts);
353 qCWarning(qLcVideoFrameEncoder)
354 <<
"Couldn't open video encoder" << m_codec.name() <<
"; result:" << AVError(res);
357 qCDebug(qLcVideoFrameEncoder) <<
"video codec opened" << res <<
"time base"
358 << m_codecContext->time_base;
364 return m_codecFrameRate.den ? qreal(m_codecFrameRate.num) / m_codecFrameRate.den : 0.;
369 qint64 div = 1'000'000 * m_stream->time_base.num;
370 return div != 0 ? (us * m_stream->time_base.den + div / 2) / div : 0;
375 return m_stream->time_base;
381 FrameConverter(AVFrameUPtr inputFrame) : m_inputFrame{ std::move(inputFrame) } { }
385 AVFrameUPtr cpuFrame = makeAVFrame();
387 int err = av_hwframe_transfer_data(cpuFrame.get(), currentFrame(), 0);
389 qCDebug(qLcVideoFrameEncoder)
390 <<
"Error transferring frame data to surface." << AVError(err);
394 setFrame(std::move(cpuFrame));
398 void convert(SwsContext *scaleContext, AVPixelFormat format,
const QSize &size)
400 AVFrameUPtr scaledFrame = makeAVFrame();
402 scaledFrame->format = format;
403 scaledFrame->width = size.width();
404 scaledFrame->height = size.height();
406 av_frame_get_buffer(scaledFrame.get(), 0);
408 const AVFrame *srcFrame = currentFrame();
410 const auto scaledHeight =
411 sws_scale(scaleContext, srcFrame->data, srcFrame->linesize, 0, srcFrame->height,
412 scaledFrame->data, scaledFrame->linesize);
414 if (scaledHeight != scaledFrame->height)
415 qCWarning(qLcVideoFrameEncoder)
416 <<
"Scaled height" << scaledHeight <<
"!=" << scaledFrame->height;
418 setFrame(std::move(scaledFrame));
421 int uploadToHw(HWAccel *accel)
423 auto *hwFramesContext = accel->hwFramesContextAsBuffer();
424 Q_ASSERT(hwFramesContext);
425 AVFrameUPtr hwFrame = makeAVFrame();
427 return AVERROR(ENOMEM);
429 int err = av_hwframe_get_buffer(hwFramesContext, hwFrame.get(), 0);
431 qCDebug(qLcVideoFrameEncoder) <<
"Error getting HW buffer" << AVError(err);
434 qCDebug(qLcVideoFrameEncoder) <<
"got HW buffer";
436 if (!hwFrame->hw_frames_ctx) {
437 qCDebug(qLcVideoFrameEncoder) <<
"no hw frames context";
438 return AVERROR(ENOMEM);
440 err = av_hwframe_transfer_data(hwFrame.get(), currentFrame(), 0);
442 qCDebug(qLcVideoFrameEncoder)
443 <<
"Error transferring frame data to surface." << AVError(err);
447 setFrame(std::move(hwFrame));
452 q23::expected<AVFrameUPtr,
int> takeResultFrame()
455 AVFrameUPtr converted =
std::move(m_convertedFrame);
456 AVFrameUPtr input =
std::move(m_inputFrame);
462 const int status = av_frame_copy_props(converted.get(), input.get());
464 return q23::unexpected{ status };
470 void setFrame(AVFrameUPtr frame) { m_convertedFrame = std::move(frame); }
472 AVFrame *currentFrame()
const
474 if (m_convertedFrame)
475 return m_convertedFrame.get();
476 return m_inputFrame.get();
479 AVFrameUPtr m_inputFrame;
480 AVFrameUPtr m_convertedFrame;
486 if (!m_codecContext) {
487 qWarning() <<
"codec context is not initialized!";
488 return AVERROR(EINVAL);
492 return avcodec_send_frame(m_codecContext.get(),
nullptr);
494 if (!updateSourceFormatAndSize(inputFrame.get()))
495 return AVERROR(EINVAL);
498 inputFrame->quality = m_codecContext->global_quality;
500 FrameConverter converter{
std::move(inputFrame) };
502 if (m_downloadFromHW) {
503 const int status = converter.downloadFromHw();
509 converter.convert(m_scaleContext.get(), m_targetSWFormat, m_targetSize);
512 const int status = converter.uploadToHw(m_accel.get());
517 const q23::expected<AVFrameUPtr,
int> resultFrame = converter.takeResultFrame();
519 return resultFrame.error();
521 AVRational timeBase{};
523 getAVFrameTime(*resultFrame.value(), pts, timeBase);
524 qCDebug(qLcVideoFrameEncoder) <<
"sending frame" << pts <<
"*" << timeBase;
526 return avcodec_send_frame(m_codecContext.get(), resultFrame.value().get());
529qint64
VideoFrameEncoder::estimateDuration(
const AVPacket &packet,
bool isFirstPacket)
537 const AVRational frameDuration = av_inv_q(m_codecContext->framerate);
538 duration = av_rescale_q(1, frameDuration, m_stream->time_base);
541 duration = packet.pts - m_lastPacketTime;
552 auto getPacket = [&]() {
553 AVPacketUPtr packet(av_packet_alloc());
554 const int ret = avcodec_receive_packet(m_codecContext.get(), packet.get());
556 if (ret != AVERROR(EOF) && ret != AVERROR(EAGAIN) && ret != AVERROR_EOF)
557 qCDebug(qLcVideoFrameEncoder) <<
"Error receiving packet" << ret << AVError(ret);
558 return AVPacketUPtr{};
560 auto ts = timeStampMs(packet->pts, m_stream->time_base);
562 qCDebug(qLcVideoFrameEncoder)
563 <<
"got a packet" << packet->pts << packet->dts << (ts ? *ts : 0);
565 packet->stream_index = m_stream->id;
567 if (packet->duration == 0) {
568 const bool firstFrame = m_lastPacketTime == AV_NOPTS_VALUE;
569 packet->duration = estimateDuration(*packet, firstFrame);
572 m_lastPacketTime = packet->pts;
577 auto fixPacketDts = [&](AVPacket &packet) {
581 if (packet.dts == AV_NOPTS_VALUE)
584 packet.dts -= m_packetDtsOffset;
586 if (packet.pts != AV_NOPTS_VALUE && packet.pts < packet.dts) {
587 m_packetDtsOffset += packet.dts - packet.pts;
588 packet.dts = packet.pts;
590 if (m_prevPacketDts != AV_NOPTS_VALUE && packet.dts < m_prevPacketDts) {
591 qCWarning(qLcVideoFrameEncoder)
592 <<
"Skip packet; failed to fix dts:" << packet.dts << m_prevPacketDts;
597 m_prevPacketDts = packet.dts;
602 while (
auto packet = getPacket()) {
603 if (fixPacketDts(*packet))
614 const QSize frameSize(frame->width, frame->height);
615 const AVPixelFormat frameFormat =
static_cast<AVPixelFormat>(frame->format);
617 if (frameSize == m_sourceSize && frameFormat == m_sourceFormat)
620 auto applySourceFormatAndSize = [&](AVPixelFormat swFormat) {
621 m_sourceSize = frameSize;
622 m_sourceFormat = frameFormat;
623 m_sourceSWFormat = swFormat;
628 if (frameFormat == m_sourceFormat)
629 return applySourceFormatAndSize(m_sourceSWFormat);
631 if (frameFormat == AV_PIX_FMT_NONE) {
632 qWarning() <<
"Got a frame with invalid pixel format";
636 if (isSwPixelFormat(frameFormat))
637 return applySourceFormatAndSize(frameFormat);
639 auto framesCtx =
reinterpret_cast<
const AVHWFramesContext *>(frame->hw_frames_ctx->data);
640 if (!framesCtx || framesCtx->sw_format == AV_PIX_FMT_NONE) {
641 qWarning() <<
"Cannot update conversions as hw frame has invalid framesCtx" << framesCtx;
645 return applySourceFormatAndSize(framesCtx->sw_format);
650 const bool needToScale = m_sourceSize != m_targetSize;
651 const bool zeroCopy = m_sourceFormat == m_targetFormat && !needToScale;
653 m_scaleContext.reset();
656 m_downloadFromHW =
false;
657 m_uploadToHW =
false;
659 qCDebug(qLcVideoFrameEncoder) <<
"zero copy encoding, format" << m_targetFormat;
664 m_downloadFromHW = m_sourceFormat != m_sourceSWFormat;
665 m_uploadToHW = m_targetFormat != m_targetSWFormat;
667 if (m_sourceSWFormat != m_targetSWFormat || needToScale) {
668 qCDebug(qLcVideoFrameEncoder)
669 <<
"video source and encoder use different formats:" << m_sourceSWFormat
670 << m_targetSWFormat <<
"or sizes:" << m_sourceSize << m_targetSize;
672 const SwsFlags conversionType = getScaleConversionType(m_sourceSize, m_targetSize);
674 m_scaleContext = createSwsContext(m_sourceSize, m_sourceSWFormat, m_targetSize,
675 m_targetSWFormat, conversionType);
678 qCDebug(qLcVideoFrameEncoder) <<
"VideoFrameEncoder conversions initialized:"
679 <<
"sourceFormat:" << m_sourceFormat
680 << (isHwPixelFormat(m_sourceFormat) ?
"(hw)" :
"(sw)")
681 <<
"targetFormat:" << m_targetFormat
682 << (isHwPixelFormat(m_targetFormat) ?
"(hw)" :
"(sw)")
683 <<
"sourceSWFormat:" << m_sourceSWFormat
684 <<
"targetSWFormat:" << m_targetSWFormat
685 <<
"scaleContext:" << m_scaleContext.get();
const AVRational & getTimeBase() const
qint64 getPts(qint64 ms) const
int sendFrame(AVFrameUPtr inputFrame)
AVPacketUPtr retrievePacket()
qreal codecFrameRate() const
QT_MANGLE_NAMESPACE(QMacScreenCaptureStreamDelegate) QMacScreenCaptureStreamDelegate
QT_BEGIN_NAMESPACE Q_STATIC_LOGGING_CATEGORY(lcSynthesizedIterableAccess, "qt.iterable.synthesized", QtWarningMsg)