// // Created by loki on 6/6/19. // #include #include extern "C" { #include } #include "platform/common.h" #include "thread_pool.h" #include "round_robin.h" #include "config.h" #include "video.h" #include "main.h" namespace video { using namespace std::literals; void free_ctx(AVCodecContext *ctx) { avcodec_free_context(&ctx); } void free_frame(AVFrame *frame) { av_frame_free(&frame); } void free_buffer(AVBufferRef *ref) { av_buffer_unref(&ref); } void free_packet(AVPacket *packet) { av_packet_free(&packet); } using ctx_t = util::safe_ptr; using codec_t = util::safe_ptr_v2; using frame_t = util::safe_ptr; using buffer_t = util::safe_ptr; using sws_t = util::safe_ptr; using img_event_t = std::shared_ptr>>; void sw_img_to_frame(sws_t &sws, platf::img_t &img, frame_t &frame); struct encoder_t { struct option_t { std::string name; util::Either value; }; struct { int h264_high; int hevc_main; int hevc_main_10; } profile; AVHWDeviceType dev_type; AVPixelFormat pix_fmt; struct { std::vector options; std::string name; } hevc, h264; bool system_memory; std::function img_to_frame; }; struct session_t { buffer_t hwdevice; ctx_t ctx; codec_t codec_handle; frame_t frame; int sws_color_format; }; static encoder_t nvenc { { 2, 0, 1 }, AV_HWDEVICE_TYPE_D3D11VA, AV_PIX_FMT_D3D11, { { {"force-idr"s, 1} }, "nvenc_hevc"s }, { { {"force-idr"s, 1} }, "nvenc_h264"s }, false, nullptr // D3D11Device }; static encoder_t software { { FF_PROFILE_H264_HIGH, FF_PROFILE_HEVC_MAIN, FF_PROFILE_HEVC_MAIN_10 }, AV_HWDEVICE_TYPE_NONE, AV_PIX_FMT_NONE, { // x265's Info SEI is so long that it causes the IDR picture data to be // kicked to the 2nd packet in the frame, breaking Moonlight's parsing logic. // It also looks like gop_size isn't passed on to x265, so we have to set // 'keyint=-1' in the parameters ourselves. {{ "x265-params"s, "info=0:keyint=-1"s }}, "libx265"s }, { {{}}, "libx264"s }, true, sw_img_to_frame // nullptr }; static std::vector encoders { nvenc, software }; struct capture_ctx_t { img_event_t images; std::chrono::nanoseconds delay; }; struct capture_thread_ctx_t { std::shared_ptr> capture_ctx_queue; std::thread capture_thread; }; [[nodiscard]] codec_t open_codec(ctx_t &ctx, AVCodec *codec, AVDictionary **options) { avcodec_open2(ctx.get(), codec, options); return codec_t { ctx.get() }; } void captureThread(std::shared_ptr> capture_ctx_queue) { std::vector capture_ctxs; auto fg = util::fail_guard([&]() { capture_ctx_queue->stop(); // Stop all sessions listening to this thread for(auto &capture_ctx : capture_ctxs) { capture_ctx.images->stop(); } for(auto &capture_ctx : capture_ctx_queue->unsafe()) { capture_ctx.images->stop(); } }); std::chrono::nanoseconds delay = 1s; auto disp = platf::display(); if(!disp) { return; } std::vector> imgs(12); auto round_robin = util::make_round_robin>(std::begin(imgs), std::end(imgs)); for(auto &img : imgs) { img = disp->alloc_img(); if(!img) { BOOST_LOG(error) << "Couldn't initialize an image"sv; return; } } auto next_frame = std::chrono::steady_clock::now(); while(capture_ctx_queue->running()) { while(capture_ctx_queue->peek()) { capture_ctxs.emplace_back(std::move(*capture_ctx_queue->pop())); delay = std::min(delay, capture_ctxs.back().delay); } auto now = std::chrono::steady_clock::now(); if(next_frame > now) { std::this_thread::sleep_until(next_frame); } next_frame += delay; auto &img = *round_robin++; auto status = disp->snapshot(img.get(), display_cursor); switch (status) { case platf::capture_e::reinit: { // Some classes of images contain references to the display --> display won't delete unless img is deleted for(auto &img : imgs) { img.reset(); } while(disp.use_count() > 1) { std::this_thread::sleep_for(100ms); } // We try this twice, in case we still get an error on reinitialization for(int x = 0; x < 2; ++x) { // Some classes of display cannot have multiple instances at once disp.reset(); disp = platf::display(); if(disp) { break; } std::this_thread::sleep_for(200ms); } if(!disp) { return; } // Re-allocate images for(auto &img : imgs) { img = disp->alloc_img(); if(!img) { BOOST_LOG(error) << "Couldn't initialize an image"sv; return; } } continue; } case platf::capture_e::error: return; case platf::capture_e::timeout: continue; case platf::capture_e::ok: break; default: BOOST_LOG(error) << "Unrecognized capture status ["sv << (int)status << ']'; return; } KITTY_WHILE_LOOP(auto capture_ctx = std::begin(capture_ctxs), capture_ctx != std::end(capture_ctxs), { if(!capture_ctx->images->running()) { auto tmp_delay = capture_ctx->delay; capture_ctx = capture_ctxs.erase(capture_ctx); if(tmp_delay == delay) { delay = std::min_element(std::begin(capture_ctxs), std::end(capture_ctxs), [](const auto &l, const auto &r) { return l.delay < r.delay; })->delay; } continue; } capture_ctx->images->raise(img); ++capture_ctx; }) } } util::Either hwdevice_ctx(AVHWDeviceType type) { buffer_t ctx; AVBufferRef *ref; auto err = av_hwdevice_ctx_create(&ref, type, nullptr, nullptr, 0); // auto err = av_hwdevice_ctx_create(&ref, type, "/dev/dri/renderD129", nullptr, 0); ctx.reset(ref); if(err < 0) { return err; } return ctx; } int hwframe_ctx(ctx_t &ctx, buffer_t &hwdevice, AVPixelFormat format) { buffer_t frame_ref { av_hwframe_ctx_alloc(hwdevice.get())}; auto frame_ctx = (AVHWFramesContext*)frame_ref->data; frame_ctx->format = ctx->pix_fmt; frame_ctx->sw_format = format; frame_ctx->height = ctx->height; frame_ctx->width = ctx->width; frame_ctx->initial_pool_size = 20; if(auto err = av_hwframe_ctx_init(frame_ref.get()); err < 0) { return err; } ctx->hw_frames_ctx = av_buffer_ref(frame_ref.get()); return 0; } void sw_img_to_frame(sws_t &sws, platf::img_t &img, frame_t &frame) { av_frame_make_writable(frame.get()); const int linesizes[2] { img.row_pitch, 0 }; int ret = sws_scale(sws.get(), (std::uint8_t*const*)&img.data, linesizes, 0, img.height, frame->data, frame->linesize); if(ret <= 0) { BOOST_LOG(fatal) << "Couldn't convert image to required format and/or size"sv; log_flush(); std::abort(); } } void encode(int64_t frame_nr, ctx_t &ctx, frame_t &frame, packet_queue_t &packets, void *channel_data) { frame->pts = frame_nr; /* send the frame to the encoder */ auto ret = avcodec_send_frame(ctx.get(), frame.get()); if (ret < 0) { BOOST_LOG(fatal) << "Could not send a frame for encoding"sv; log_flush(); std::abort(); } while (ret >= 0) { auto packet = std::make_unique(nullptr); ret = avcodec_receive_packet(ctx.get(), packet.get()); if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) { return; } else if (ret < 0) { BOOST_LOG(fatal) << "Could not encode video packet"sv; log_flush(); std::abort(); } packet->channel_data = channel_data; packets->raise(std::move(packet)); } } int start_capture(capture_thread_ctx_t &capture_thread_ctx) { capture_thread_ctx.capture_ctx_queue = std::make_shared>(); capture_thread_ctx.capture_thread = std::thread { captureThread, capture_thread_ctx.capture_ctx_queue }; return 0; } void end_capture(capture_thread_ctx_t &capture_thread_ctx) { capture_thread_ctx.capture_ctx_queue->stop(); capture_thread_ctx.capture_thread.join(); } std::optional make_session(const encoder_t &encoder, const config_t &config, void *device_ctx) { bool hardware = device_ctx; auto &video_format = config.videoFormat == 0 ? encoder.h264 : encoder.hevc; auto codec = avcodec_find_encoder_by_name(video_format.name.c_str()); if(!codec) { BOOST_LOG(error) << "Couldn't open ["sv << video_format.name << ']'; return std::nullopt; } buffer_t hwdevice; if(hardware) { auto buf_or_error = hwdevice_ctx(encoder.dev_type); if(buf_or_error.has_right()) { auto err = buf_or_error.right(); char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Failed to create FFMpeg "sv << video_format.name << ": "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, err); return std::nullopt;; } hwdevice = std::move(buf_or_error.left()); } ctx_t ctx {avcodec_alloc_context3(codec) }; ctx->width = config.width; ctx->height = config.height; ctx->time_base = AVRational{1, config.framerate}; ctx->framerate = AVRational{config.framerate, 1}; if(config.videoFormat == 0) { ctx->profile = encoder.profile.h264_high; } else if(config.dynamicRange == 0) { ctx->profile = encoder.profile.hevc_main; } else { ctx->profile = encoder.profile.hevc_main_10; } // B-frames delay decoder output, so never use them ctx->max_b_frames = 0; // Use an infinite GOP length since I-frames are generated on demand ctx->gop_size = std::numeric_limits::max(); ctx->keyint_min = ctx->gop_size; // Some client decoders have limits on the number of reference frames ctx->refs = config.numRefFrames; ctx->flags |= (AV_CODEC_FLAG_CLOSED_GOP | AV_CODEC_FLAG_LOW_DELAY); ctx->flags2 |= AV_CODEC_FLAG2_FAST; ctx->color_range = (config.encoderCscMode & 0x1) ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG; int sws_color_space; switch (config.encoderCscMode >> 1) { case 0: default: // Rec. 601 ctx->color_primaries = AVCOL_PRI_SMPTE170M; ctx->color_trc = AVCOL_TRC_SMPTE170M; ctx->colorspace = AVCOL_SPC_SMPTE170M; sws_color_space = SWS_CS_SMPTE170M; break; case 1: // Rec. 709 ctx->color_primaries = AVCOL_PRI_BT709; ctx->color_trc = AVCOL_TRC_BT709; ctx->colorspace = AVCOL_SPC_BT709; sws_color_space = SWS_CS_ITU709; break; case 2: // Rec. 2020 ctx->color_primaries = AVCOL_PRI_BT2020; ctx->color_trc = AVCOL_TRC_BT2020_10; ctx->colorspace = AVCOL_SPC_BT2020_NCL; sws_color_space = SWS_CS_BT2020; break; } AVPixelFormat src_fmt; if(config.dynamicRange == 0) { src_fmt = AV_PIX_FMT_YUV420P; } else { src_fmt = AV_PIX_FMT_YUV420P10; } if(hardware) { ctx->pix_fmt = encoder.pix_fmt; ((AVHWFramesContext *)ctx->hw_frames_ctx->data)->device_ctx = (AVHWDeviceContext*)device_ctx; if(auto err = hwframe_ctx(ctx, hwdevice, src_fmt); err < 0) { char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Failed to initialize hardware frame: "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, err) << std::endl; return std::nullopt; } } else /* software */ { ctx->pix_fmt = src_fmt; // Clients will request for the fewest slices per frame to get the // most efficient encode, but we may want to provide more slices than // requested to ensure we have enough parallelism for good performance. ctx->slices = std::max(config.slicesPerFrame, config::video.min_threads); ctx->thread_type = FF_THREAD_SLICE; ctx->thread_count = ctx->slices; } AVDictionary *options {nullptr}; for(auto &option : video_format.options) { if(option.value.has_left()) { av_dict_set_int(&options, option.name.c_str(), option.value.left(), 0); } else { av_dict_set(&options, option.name.c_str(), option.value.right().c_str(), 0); } } if(config.bitrate > 500) { auto bitrate = config.bitrate * 1000; ctx->rc_max_rate = bitrate; ctx->rc_buffer_size = bitrate / 100; ctx->bit_rate = bitrate; ctx->rc_min_rate = bitrate; } else if(config::video.crf != 0) { av_dict_set_int(&options, "crf", config::video.crf, 0); } else { av_dict_set_int(&options, "qp", config::video.qp, 0); } av_dict_set(&options, "preset", config::video.preset.c_str(), 0); av_dict_set(&options, "tune", config::video.tune.c_str(), 0); auto codec_handle = open_codec(ctx, codec, &options); frame_t frame {av_frame_alloc() }; frame->format = ctx->pix_fmt; frame->width = ctx->width; frame->height = ctx->height; if(config.videoFormat == 1) { auto err = av_hwframe_get_buffer(ctx->hw_frames_ctx, frame.get(), 0); if(err < 0) { char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Coudn't create hardware frame: "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, err) << std::endl; return std::nullopt; } } else { av_frame_get_buffer(frame.get(), 0); } return std::make_optional(session_t { std::move(hwdevice), std::move(ctx), std::move(codec_handle), std::move(frame), sws_color_space }); } void capture( safe::signal_t *shutdown_event, packet_queue_t packets, idr_event_t idr_events, config_t config, void *channel_data) { auto session = make_session(software, config, nullptr); if(!session) { return; } int framerate = config.framerate; auto images = std::make_shared(); // Temporary image to ensure something is send to Moonlight even if no frame has been captured yet. int dummy_data = 0; { auto img = std::make_shared(); img->row_pitch = 4; img->height = 1; img->width = 1; img->pixel_pitch = 4; img->data = (std::uint8_t*)&dummy_data; images->raise(std::move(img)); } // Keep a reference counter to ensure the capture thread only runs when other threads have a reference to the capture thread static auto capture_thread = safe::make_shared(start_capture, end_capture); auto ref = capture_thread.ref(); if(!ref) { return; } auto delay = std::chrono::floor(1s) / framerate; ref->capture_ctx_queue->raise(capture_ctx_t { images, delay }); if(!ref->capture_ctx_queue->running()) { return; } int64_t frame_nr = 1; int64_t key_frame_nr = 1; auto img_width = 0; auto img_height = 0; // Initiate scaling context with correct height and width sws_t sws; auto next_frame = std::chrono::steady_clock::now(); while(true) { if(shutdown_event->peek() || !images->running()) { break; } if(idr_events->peek()) { session->frame->pict_type = AV_PICTURE_TYPE_I; auto event = idr_events->pop(); TUPLE_2D_REF(_, end, *event); frame_nr = end; key_frame_nr = end + config.framerate; } else if(frame_nr == key_frame_nr) { session->frame->pict_type = AV_PICTURE_TYPE_I; } std::this_thread::sleep_until(next_frame); next_frame += delay; // When Moonlight request an IDR frame, send frames even if there is no new captured frame if(frame_nr > (key_frame_nr + config.framerate) || images->peek()) { if(auto img = images->pop(delay)) { if(software.system_memory) { auto new_width = img->width; auto new_height = img->height; if(img_width != new_width || img_height != new_height) { img_width = new_width; img_height = new_height; sws.reset( sws_getContext( img_width, img_height, AV_PIX_FMT_BGR0, session->ctx->width, session->ctx->height, session->ctx->pix_fmt, SWS_LANCZOS | SWS_ACCURATE_RND, nullptr, nullptr, nullptr)); sws_setColorspaceDetails(sws.get(), sws_getCoefficients(SWS_CS_DEFAULT), 0, sws_getCoefficients(session->sws_color_format), config.encoderCscMode & 0x1, 0, 1 << 16, 1 << 16); } } software.img_to_frame(sws, *img, session->frame); } else if(images->running()) { continue; } else { break; } } encode(frame_nr++, session->ctx, session->frame, packets, channel_data); session->frame->pict_type = AV_PICTURE_TYPE_NONE; } images->stop(); } }