File: mux.cpp

package info (click to toggle)
nageru 2.3.2-1
links: PTS
area: main
in suites: forky, sid
size: 3,120 kB
sloc: cpp: 39,131; perl: 94; sh: 18; makefile: 4
file content (332 lines) | stat: -rw-r--r-- 10,430 bytes
parent folder | download | duplicates (2)
#include "shared/mux.h"

#include <algorithm>
#include <assert.h>
#include <mutex>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <string>
#include <utility>
#include <vector>

extern "C" {
#include <libavformat/avio.h>
#include <libavutil/avutil.h>
#include <libavutil/dict.h>
#include <libavutil/mathematics.h>
#include <libavutil/mem.h>
#include <libavutil/pixfmt.h>
#include <libavutil/rational.h>
}

#include "shared/metrics.h"
#include "shared/shared_defs.h"
#include "shared/timebase.h"

using namespace std;

struct PacketBefore {
	PacketBefore(const AVFormatContext *ctx) : ctx(ctx) {}

	bool operator() (const Mux::QueuedPacket &a_qp, const Mux::QueuedPacket &b_qp) const {
		const AVPacket *a = a_qp.pkt;
		const AVPacket *b = b_qp.pkt;
		int64_t a_dts = (a->dts == AV_NOPTS_VALUE ? a->pts : a->dts);
		int64_t b_dts = (b->dts == AV_NOPTS_VALUE ? b->pts : b->dts);
		AVRational a_timebase = ctx->streams[a->stream_index]->time_base;
		AVRational b_timebase = ctx->streams[b->stream_index]->time_base;
		if (av_compare_ts(a_dts, a_timebase, b_dts, b_timebase) != 0) {
			return av_compare_ts(a_dts, a_timebase, b_dts, b_timebase) < 0;
		} else {
			return av_compare_ts(a->pts, a_timebase, b->pts, b_timebase) < 0;
		}
	}

	const AVFormatContext * const ctx;
};

Mux::Mux(AVFormatContext *avctx, int width, int height, Codec video_codec, const string &video_extradata, const AVCodecParameters *audio_codecpar, AVColorSpace color_space, int time_base, function<void(int64_t)> write_callback, WriteStrategy write_strategy, const vector<MuxMetrics *> &metrics, WithSubtitles with_subtitles)
	: write_strategy(write_strategy), avctx(avctx), write_callback(write_callback), metrics(metrics)
{
	// MPEG-TS ostensibly needs some conversions (e.g. for differing start codes),
	// so let FFmpeg insert them as needed in case we are muxing to that.
	// Curiously enough, things actually seem to go quite fine without
	// (and it also seems FFmpeg's MPEG-TS muxer automatically does stuff like
	// repeat PPS/SPS before keyframes for us), but it can't hurt.
	avctx->flags |= AVFMT_FLAG_AUTO_BSF;

	AVStream *avstream_video = avformat_new_stream(avctx, nullptr);
	if (avstream_video == nullptr) {
		fprintf(stderr, "avformat_new_stream() failed\n");
		abort();
	}
	avstream_video->time_base = AVRational{1, time_base};
	avstream_video->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
	if (video_codec == CODEC_H264) {
		avstream_video->codecpar->codec_id = AV_CODEC_ID_H264;
	} else if (video_codec == CODEC_AV1) {
		avstream_video->codecpar->codec_id = AV_CODEC_ID_AV1;
	} else {
		assert(video_codec == CODEC_MJPEG);
		avstream_video->codecpar->codec_id = AV_CODEC_ID_MJPEG;
	}
	avstream_video->codecpar->width = width;
	avstream_video->codecpar->height = height;

	// Colorspace details. Closely correspond to settings in EffectChain_finalize,
	// as noted in each comment.
	// Note that the H.264 stream also contains this information and depending on the
	// mux, this might simply get ignored. See sps_rbsp().
	// Note that there's no way to change this per-frame as the H.264 stream
	// would like to be able to.
	avstream_video->codecpar->color_primaries = AVCOL_PRI_BT709;  // RGB colorspace (inout_format.color_space).
	avstream_video->codecpar->color_trc = AVCOL_TRC_IEC61966_2_1;  // Gamma curve (inout_format.gamma_curve).
	// YUV colorspace (output_ycbcr_format.luma_coefficients).
	avstream_video->codecpar->color_space = color_space;
	avstream_video->codecpar->color_range = AVCOL_RANGE_MPEG;  // Full vs. limited range (output_ycbcr_format.full_range).
	avstream_video->codecpar->chroma_location = AVCHROMA_LOC_LEFT;  // Chroma sample location. See chroma_offset_0[] in Mixer::subsample_chroma().
	avstream_video->codecpar->field_order = AV_FIELD_PROGRESSIVE;

	if (!video_extradata.empty()) {
		avstream_video->codecpar->extradata = (uint8_t *)av_malloc(video_extradata.size() + AV_INPUT_BUFFER_PADDING_SIZE);
		avstream_video->codecpar->extradata_size = video_extradata.size();
		memcpy(avstream_video->codecpar->extradata, video_extradata.data(), video_extradata.size());
	}
	streams.push_back(avstream_video);

	if (audio_codecpar != nullptr) {
		AVStream *avstream_audio = avformat_new_stream(avctx, nullptr);
		if (avstream_audio == nullptr) {
			fprintf(stderr, "avformat_new_stream() failed\n");
			abort();
		}
		avstream_audio->time_base = AVRational{1, time_base};
		if (avcodec_parameters_copy(avstream_audio->codecpar, audio_codecpar) < 0) {
			fprintf(stderr, "avcodec_parameters_copy() failed\n");
			abort();
		}
		streams.push_back(avstream_audio);
	}

	if (with_subtitles == WITH_SUBTITLES) {
		AVStream *avstream_subtitles = avformat_new_stream(avctx, nullptr);
		if (avstream_subtitles == nullptr) {
			fprintf(stderr, "avformat_new_stream() failed\n");
			abort();
		}
		avstream_subtitles->time_base = AVRational{1, time_base};
		avstream_subtitles->codecpar->codec_type = AVMEDIA_TYPE_SUBTITLE;
		avstream_subtitles->codecpar->codec_id = AV_CODEC_ID_WEBVTT;
		avstream_subtitles->disposition = AV_DISPOSITION_METADATA;
		streams.push_back(avstream_subtitles);
		subtitle_stream_idx = streams.size() - 1;
	}

	if (write_strategy == WRITE_BACKGROUND) {
		writer_thread = thread(&Mux::thread_func, this);
	} else {
		write_header();
	}
}

Mux::~Mux()
{
	assert(plug_count == 0);
	if (write_strategy == WRITE_BACKGROUND) {
		writer_thread_should_quit = true;
		packet_queue_ready.notify_all();
		writer_thread.join();
	}
	int64_t old_pos = avctx->pb->pos;
	av_write_trailer(avctx);
	for (MuxMetrics *metric : metrics) {
		metric->metric_written_bytes += avctx->pb->pos - old_pos;
	}

	if (!(avctx->oformat->flags & AVFMT_NOFILE) &&
	    !(avctx->flags & AVFMT_FLAG_CUSTOM_IO)) {
		avio_closep(&avctx->pb);
	}
	avformat_free_context(avctx);
}

void Mux::add_packet(const AVPacket &pkt, int64_t pts, int64_t dts, AVRational timebase, int stream_index_override)
{
	assert(pts >= dts);

	AVPacket pkt_copy;
	if (av_packet_ref(&pkt_copy, &pkt) < 0) {
		fprintf(stderr, "av_copy_packet() failed\n");
		abort();
	}
	if (stream_index_override != -1) {
		pkt_copy.stream_index = stream_index_override;
	}
	assert(size_t(pkt_copy.stream_index) < streams.size());
	AVRational time_base = streams[pkt_copy.stream_index]->time_base;
	pkt_copy.pts = av_rescale_q(pts, timebase, time_base);
	pkt_copy.dts = av_rescale_q(dts, timebase, time_base);
	pkt_copy.duration = av_rescale_q(pkt.duration, timebase, time_base);

	{
		lock_guard<mutex> lock(mu);
		if (drained) {
			// Just drop the packet on the floor.
		} else if (write_strategy == WriteStrategy::WRITE_BACKGROUND) {
			packet_queue.push_back(QueuedPacket{ av_packet_clone(&pkt_copy), pts });
			if (plug_count == 0)
				packet_queue_ready.notify_all();
		} else if (plug_count > 0) {
			packet_queue.push_back(QueuedPacket{ av_packet_clone(&pkt_copy), pts });
		} else {
			write_packet_or_die(pkt_copy, pts);
		}
	}

	av_packet_unref(&pkt_copy);
}

void Mux::write_packet_or_die(const AVPacket &pkt, int64_t unscaled_pts)
{
	for (MuxMetrics *metric : metrics) {
		if (pkt.stream_index == 0) {
			metric->metric_video_bytes += pkt.size;
		} else if (pkt.stream_index == 1) {
			metric->metric_audio_bytes += pkt.size;
		} else {
			assert(false);
		}
	}
	int64_t old_pos = avctx->pb->pos;
	int err = av_interleaved_write_frame(avctx, const_cast<AVPacket *>(&pkt));
	if (err < 0) {
		char errbuf[AV_ERROR_MAX_STRING_SIZE];
		av_strerror(err, errbuf, sizeof(errbuf));
		fprintf(stderr, "av_interleaved_write_frame() failed: %s\n", errbuf);
		exit(EXIT_FAILURE);
	}
	avio_flush(avctx->pb);
	for (MuxMetrics *metric : metrics) {
		metric->metric_written_bytes += avctx->pb->pos - old_pos;
	}

	if (pkt.stream_index == 0 && write_callback != nullptr) {
		write_callback(unscaled_pts);
	}
}

void Mux::plug()
{
	lock_guard<mutex> lock(mu);
	assert(!drained);
	++plug_count;
}

void Mux::unplug()
{
	lock_guard<mutex> lock(mu);
	if (--plug_count > 0) {
		return;
	}
	assert(plug_count >= 0);

	sort(packet_queue.begin(), packet_queue.end(), PacketBefore(avctx));

	if (write_strategy == WRITE_BACKGROUND) {
		packet_queue_ready.notify_all();
	} else {
		for (QueuedPacket &qp : packet_queue) {
			write_packet_or_die(*qp.pkt, qp.unscaled_pts);
			av_packet_free(&qp.pkt);
		}
		packet_queue.clear();
	}
}

void Mux::drain()
{
	lock_guard<mutex> lock(mu);
	assert(!drained);
	assert(plug_count == 0);
	for (QueuedPacket &qp : packet_queue) {
		av_packet_free(&qp.pkt);
	}
	packet_queue.clear();
	drained = true;
}

void Mux::undrain()
{
	lock_guard<mutex> lock(mu);
	assert(drained);
	drained = false;
}

void Mux::thread_func()
{
	pthread_setname_np(pthread_self(), "Mux");

	write_header();

	unique_lock<mutex> lock(mu);
	for ( ;; ) {
		packet_queue_ready.wait(lock, [this]() {
			return writer_thread_should_quit || (!packet_queue.empty() && plug_count == 0);
		});
		if (writer_thread_should_quit && packet_queue.empty()) {
			// All done.
			break;
		}

		assert(!packet_queue.empty() && plug_count == 0);
		vector<QueuedPacket> packets;
		swap(packets, packet_queue);

		lock.unlock();
		for (QueuedPacket &qp : packets) {
			write_packet_or_die(*qp.pkt, qp.unscaled_pts);
			av_packet_free(&qp.pkt);
		}
		lock.lock();
	}
}

void Mux::write_header()
{
	AVDictionary *options = NULL;
	vector<pair<string, string>> opts = MUX_OPTS;
	for (pair<string, string> opt : opts) {
		av_dict_set(&options, opt.first.c_str(), opt.second.c_str(), 0);
	}

	int err = avformat_write_header(avctx, &options);
	if (err < 0) {
		char errbuf[AV_ERROR_MAX_STRING_SIZE];
		av_strerror(err, errbuf, sizeof(errbuf));
		fprintf(stderr, "avformat_write_header() failed: %s\n", errbuf);
		exit(EXIT_FAILURE);
	}
	for (MuxMetrics *metric : metrics) {
		metric->metric_written_bytes += avctx->pb->pos;
	}

	// Make sure the header is written before the constructor exits
	// (assuming we are in WRITE_FOREGROUND mode).
	avio_flush(avctx->pb);

}

void MuxMetrics::init(const vector<pair<string, string>> &labels)
{
	vector<pair<string, string>> labels_video = labels;
	labels_video.emplace_back("stream", "video");
	global_metrics.add("mux_stream_bytes", labels_video, &metric_video_bytes);

	vector<pair<string, string>> labels_audio = labels;
	labels_audio.emplace_back("stream", "audio");
	global_metrics.add("mux_stream_bytes", labels_audio, &metric_audio_bytes);

	global_metrics.add("mux_written_bytes", labels, &metric_written_bytes);
}