// // Created by loki on 6/6/19. // #include #include #include extern "C" { #include } #include "platform/common.h" #include "round_robin.h" #include "sync.h" #include "config.h" #include "video.h" #include "main.h" #ifdef _WIN32 extern "C" { #include } #endif namespace video { using namespace std::literals; void free_ctx(AVCodecContext *ctx) { avcodec_free_context(&ctx); } void free_frame(AVFrame *frame) { av_frame_free(&frame); } void free_buffer(AVBufferRef *ref) { av_buffer_unref(&ref); } void free_packet(AVPacket *packet) { av_packet_free(&packet); } namespace nv { enum class profile_h264_e : int { baseline, main, high, high_444p, }; enum class profile_hevc_e : int { main, main_10, rext, }; } namespace amd { enum class profile_h264_e : int { main, high, constrained_baseline, constrained_high, }; enum class profile_hevc_e : int { main, }; } using ctx_t = util::safe_ptr; using frame_t = util::safe_ptr; using buffer_t = util::safe_ptr; using sws_t = util::safe_ptr; using img_event_t = std::shared_ptr>>; platf::dev_type_e map_dev_type(AVHWDeviceType type); platf::pix_fmt_e map_pix_fmt(AVPixelFormat fmt); void sw_img_to_frame(const platf::img_t &img, frame_t &frame); void nv_d3d_img_to_frame(const platf::img_t &img, frame_t &frame); util::Either nv_d3d_make_hwdevice_ctx(platf::hwdevice_t *hwdevice_ctx); void amd_d3d_img_to_frame(const platf::img_t &img, frame_t &frame); util::Either amd_d3d_make_hwdevice_ctx(platf::hwdevice_t *hwdevice_ctx); util::Either make_hwdevice_ctx(AVHWDeviceType type, void *hwdevice_ctx); int hwframe_ctx(ctx_t &ctx, buffer_t &hwdevice, AVPixelFormat format); class swdevice_t : public platf::hwdevice_t { public: int convert(platf::img_t &img) override { auto frame = (AVFrame *)data; av_frame_make_writable(frame); const int linesizes[2] { img.row_pitch, 0 }; int ret = sws_scale(sws.get(), (std::uint8_t*const*)&img.data, linesizes, 0, img.height, frame->data, frame->linesize); if(ret <= 0) { BOOST_LOG(fatal) << "Couldn't convert image to required format and/or size"sv; return -1; } return 0; } virtual void set_colorspace(std::uint32_t colorspace, std::uint32_t color_range) { sws_setColorspaceDetails(sws.get(), sws_getCoefficients(SWS_CS_DEFAULT), 0, sws_getCoefficients(colorspace), color_range -1, 0, 1 << 16, 1 << 16 ); } int init(int in_width, int in_height, int out_width, int out_height, AVFrame *frame, AVPixelFormat format) { sws.reset(sws_getContext( in_width, in_height, AV_PIX_FMT_BGR0, out_width, out_height, format, SWS_LANCZOS | SWS_ACCURATE_RND, nullptr, nullptr, nullptr )); data = frame; return sws ? 0 : -1; } ~swdevice_t() override {} sws_t sws; }; struct encoder_t { std::string_view name; enum flag_e { PASSED, // Is supported REF_FRAMES_RESTRICT, // Set maximum reference frames REF_FRAMES_AUTOSELECT, // Allow encoder to select maximum reference frames (If !REF_FRAMES_RESTRICT --> REF_FRAMES_AUTOSELECT) DYNAMIC_RANGE, MAX_FLAGS }; struct option_t { KITTY_DEFAULT_CONSTR(option_t) option_t(const option_t &) = default; std::string name; std::variant*, std::string, std::string*> value; option_t(std::string &&name, decltype(value) &&value) : name { std::move(name) }, value { std::move(value) } {} }; struct { int h264_high; int hevc_main; int hevc_main_10; } profile; AVHWDeviceType dev_type; AVPixelFormat dev_pix_fmt; AVPixelFormat static_pix_fmt; AVPixelFormat dynamic_pix_fmt; struct { std::vector options; std::optional crf, qp; std::string name; std::bitset capabilities; bool operator[](flag_e flag) const { return capabilities[(std::size_t)flag]; } std::bitset::reference operator[](flag_e flag) { return capabilities[(std::size_t)flag]; } } hevc, h264; bool system_memory; bool hevc_mode; std::function img_to_frame; std::function(platf::hwdevice_t *hwdevice)> make_hwdevice_ctx; }; class session_t { public: session_t() = default; session_t(ctx_t &&ctx, frame_t &&frame, util::wrap_ptr &&device) : ctx { std::move(ctx) }, frame { std::move(frame) }, device { std::move(device) } {} session_t(session_t &&other) : ctx { std::move(other.ctx) }, frame { std::move(other.frame) }, device { std::move(other.device) } {} // Ensure objects are destroyed in the correct order session_t &operator=(session_t &&other) { device = std::move(other.device); frame = std::move(other.frame); ctx = std::move(other.ctx); return *this; } ctx_t ctx; frame_t frame; util::wrap_ptr device; }; struct sync_session_ctx_t { safe::signal_t *shutdown_event; safe::signal_t *join_event; packet_queue_t packets; idr_event_t idr_events; config_t config; int frame_nr; int key_frame_nr; void *channel_data; }; struct sync_session_t { sync_session_ctx_t *ctx; std::chrono::steady_clock::time_point next_frame; std::chrono::nanoseconds delay; platf::img_t *img_tmp; std::shared_ptr hwdevice; session_t session; }; using encode_session_ctx_queue_t = safe::queue_t; using encode_e = platf::capture_e; struct capture_ctx_t { img_event_t images; std::chrono::nanoseconds delay; }; struct capture_thread_async_ctx_t { std::shared_ptr> capture_ctx_queue; std::thread capture_thread; safe::signal_t reinit_event; const encoder_t *encoder_p; util::sync_t> display_wp; }; struct capture_thread_sync_ctx_t { encode_session_ctx_queue_t encode_session_ctx_queue { 30 }; }; int start_capture_sync(capture_thread_sync_ctx_t &ctx); void end_capture_sync(capture_thread_sync_ctx_t &ctx); int start_capture_async(capture_thread_async_ctx_t &ctx); void end_capture_async(capture_thread_async_ctx_t &ctx); // Keep a reference counter to ensure the capture thread only runs when other threads have a reference to the capture thread auto capture_thread_async = safe::make_shared(start_capture_async, end_capture_async); auto capture_thread_sync = safe::make_shared(start_capture_sync, end_capture_sync); #ifdef _WIN32 static encoder_t nvenc { "nvenc"sv, { (int)nv::profile_h264_e::high, (int)nv::profile_hevc_e::main, (int)nv::profile_hevc_e::main_10 }, AV_HWDEVICE_TYPE_D3D11VA, AV_PIX_FMT_D3D11, AV_PIX_FMT_NV12, AV_PIX_FMT_P010, { { { "forced-idr"s, 1 }, { "zerolatency"s, 1 }, { "preset"s, &config::video.nv.preset }, { "rc"s, &config::video.nv.rc } }, std::nullopt, std::nullopt, "hevc_nvenc"s, }, { { { "forced-idr"s, 1 }, { "zerolatency"s, 1 }, { "preset"s, &config::video.nv.preset }, { "rc"s, &config::video.nv.rc }, { "coder"s, &config::video.nv.coder } }, std::nullopt, std::make_optional({"qp"s, &config::video.qp}), "h264_nvenc"s }, false, true, nv_d3d_img_to_frame, nv_d3d_make_hwdevice_ctx }; static encoder_t amdvce { "amdvce"sv, { (int)amd::profile_h264_e::high, (int)amd::profile_hevc_e::main }, AV_HWDEVICE_TYPE_D3D11VA, AV_PIX_FMT_D3D11, AV_PIX_FMT_NV12, AV_PIX_FMT_YUV420P, { { { "header_insertion_mode"s, "idr"s }, { "gops_per_idr"s, 30 }, { "usage"s, "ultralowlatency"s }, { "quality"s, &config::video.amd.quality }, { "rc"s, &config::video.amd.rc } }, std::nullopt, std::make_optional({"qp"s, &config::video.qp}), "hevc_amf"s, }, { { { "usage"s, "ultralowlatency"s }, { "quality"s, &config::video.amd.quality }, { "rc"s, &config::video.amd.rc }, {"log_to_dbg"s,"1"s}, }, std::nullopt, std::make_optional({"qp"s, &config::video.qp}), "h264_amf"s }, false, true, amd_d3d_img_to_frame, amd_d3d_make_hwdevice_ctx }; #endif static encoder_t software { "software"sv, { FF_PROFILE_H264_HIGH, FF_PROFILE_HEVC_MAIN, FF_PROFILE_HEVC_MAIN_10 }, AV_HWDEVICE_TYPE_NONE, AV_PIX_FMT_NONE, AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV420P10, { // x265's Info SEI is so long that it causes the IDR picture data to be // kicked to the 2nd packet in the frame, breaking Moonlight's parsing logic. // It also looks like gop_size isn't passed on to x265, so we have to set // 'keyint=-1' in the parameters ourselves. { { "x265-params"s, "info=0:keyint=-1"s }, { "preset"s, &config::video.sw.preset }, { "tune"s, &config::video.sw.tune } }, std::make_optional("crf"s, &config::video.crf), std::make_optional("qp"s, &config::video.qp), "libx265"s }, { { { "preset"s, &config::video.sw.preset }, { "tune"s, &config::video.sw.tune } }, std::make_optional("crf"s, &config::video.crf), std::make_optional("qp"s, &config::video.qp), "libx264"s }, true, false, sw_img_to_frame, nullptr }; static std::vector encoders { #ifdef _WIN32 nvenc, #endif software, #ifdef _WIN32 amdvce, #endif }; void reset_display(std::shared_ptr &disp, AVHWDeviceType type) { // We try this twice, in case we still get an error on reinitialization for(int x = 0; x < 2; ++x) { disp.reset(); disp = platf::display(map_dev_type(type)); if(disp) { break; } std::this_thread::sleep_for(200ms); } } void captureThread( std::shared_ptr> capture_ctx_queue, util::sync_t> &display_wp, safe::signal_t &reinit_event, const encoder_t &encoder ) { std::vector capture_ctxs; auto fg = util::fail_guard([&]() { capture_ctx_queue->stop(); // Stop all sessions listening to this thread for(auto &capture_ctx : capture_ctxs) { capture_ctx.images->stop(); } for(auto &capture_ctx : capture_ctx_queue->unsafe()) { capture_ctx.images->stop(); } }); std::chrono::nanoseconds delay = 1s; auto disp = platf::display(map_dev_type(encoder.dev_type)); if(!disp) { return; } display_wp = disp; std::vector> imgs(12); auto round_robin = util::make_round_robin>(std::begin(imgs), std::end(imgs)); for(auto &img : imgs) { img = disp->alloc_img(); if(!img) { BOOST_LOG(error) << "Couldn't initialize an image"sv; return; } } if(auto capture_ctx = capture_ctx_queue->pop()) { capture_ctxs.emplace_back(std::move(*capture_ctx)); delay = capture_ctxs.back().delay; } auto next_frame = std::chrono::steady_clock::now(); while(capture_ctx_queue->running()) { while(capture_ctx_queue->peek()) { capture_ctxs.emplace_back(std::move(*capture_ctx_queue->pop())); delay = std::min(delay, capture_ctxs.back().delay); } auto now = std::chrono::steady_clock::now(); auto &img = *round_robin++; while(img.use_count() > 1) {} auto status = disp->snapshot(img.get(), 1000ms, display_cursor); switch (status) { case platf::capture_e::reinit: { reinit_event.raise(true); // Some classes of images contain references to the display --> display won't delete unless img is deleted for(auto &img : imgs) { img.reset(); } // Some classes of display cannot have multiple instances at once disp.reset(); // display_wp is modified in this thread only while(!display_wp->expired()) { std::this_thread::sleep_for(100ms); } while(capture_ctx_queue->running()) { reset_display(disp, encoder.dev_type); if(disp) { break; } std::this_thread::sleep_for(200ms); } if(!disp) { return; } display_wp = disp; // Re-allocate images for(auto &img : imgs) { img = disp->alloc_img(); if(!img) { BOOST_LOG(error) << "Couldn't initialize an image"sv; return; } } reinit_event.reset(); continue; } case platf::capture_e::error: return; case platf::capture_e::timeout: std::this_thread::sleep_for(1ms); continue; case platf::capture_e::ok: break; default: BOOST_LOG(error) << "Unrecognized capture status ["sv << (int)status << ']'; return; } KITTY_WHILE_LOOP(auto capture_ctx = std::begin(capture_ctxs), capture_ctx != std::end(capture_ctxs), { if(!capture_ctx->images->running()) { auto tmp_delay = capture_ctx->delay; capture_ctx = capture_ctxs.erase(capture_ctx); if(tmp_delay == delay) { delay = std::min_element(std::begin(capture_ctxs), std::end(capture_ctxs), [](const auto &l, const auto &r) { return l.delay < r.delay; })->delay; } continue; } capture_ctx->images->raise(img); ++capture_ctx; }) if(next_frame > now) { std::this_thread::sleep_until(next_frame); } next_frame += delay; } } int encode(int64_t frame_nr, ctx_t &ctx, frame_t &frame, packet_queue_t &packets, void *channel_data) { frame->pts = frame_nr; /* send the frame to the encoder */ auto ret = avcodec_send_frame(ctx.get(), frame.get()); if (ret < 0) { char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Could not send a frame for encoding: "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, ret); return -1; } while (ret >= 0) { auto packet = std::make_unique(nullptr); ret = avcodec_receive_packet(ctx.get(), packet.get()); if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) { return 0; } else if (ret < 0) { return ret; } packet->channel_data = channel_data; packets->raise(std::move(packet)); } return 0; } std::optional make_session(const encoder_t &encoder, const config_t &config, int width, int height, platf::hwdevice_t *hwdevice) { bool hardware = encoder.dev_type != AV_HWDEVICE_TYPE_NONE; auto &video_format = config.videoFormat == 0 ? encoder.h264 : encoder.hevc; if(!video_format[encoder_t::PASSED]) { BOOST_LOG(error) << encoder.name << ": "sv << video_format.name << " mode not supported"sv; return std::nullopt; } if(config.dynamicRange && !video_format[encoder_t::DYNAMIC_RANGE]) { BOOST_LOG(error) << video_format.name << ": dynamic range not supported"sv; return std::nullopt; } auto codec = avcodec_find_encoder_by_name(video_format.name.c_str()); if(!codec) { BOOST_LOG(error) << "Couldn't open ["sv << video_format.name << ']'; return std::nullopt; } ctx_t ctx { avcodec_alloc_context3(codec) }; ctx->width = config.width; ctx->height = config.height; ctx->time_base = AVRational{1, config.framerate}; ctx->framerate = AVRational{config.framerate, 1}; if(config.videoFormat == 0) { ctx->profile = encoder.profile.h264_high; } else if(config.dynamicRange == 0) { ctx->profile = encoder.profile.hevc_main; } else { ctx->profile = encoder.profile.hevc_main_10; } // B-frames delay decoder output, so never use them ctx->max_b_frames = 0; // Use an infinite GOP length since I-frames are generated on demand ctx->gop_size = std::numeric_limits::max(); ctx->keyint_min = ctx->gop_size; if(config.numRefFrames == 0) { ctx->refs = video_format[encoder_t::REF_FRAMES_AUTOSELECT] ? 0 : 16; } else { // Some client decoders have limits on the number of reference frames ctx->refs = video_format[encoder_t::REF_FRAMES_RESTRICT] ? config.numRefFrames : 0; } ctx->flags |= (AV_CODEC_FLAG_CLOSED_GOP | AV_CODEC_FLAG_LOW_DELAY); ctx->flags2 |= AV_CODEC_FLAG2_FAST; ctx->color_range = (config.encoderCscMode & 0x1) ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG; int sws_color_space; switch (config.encoderCscMode >> 1) { case 0: default: // Rec. 601 BOOST_LOG(info) << "Color coding [Rec. 601]"sv; ctx->color_primaries = AVCOL_PRI_SMPTE170M; ctx->color_trc = AVCOL_TRC_SMPTE170M; ctx->colorspace = AVCOL_SPC_SMPTE170M; sws_color_space = SWS_CS_SMPTE170M; break; case 1: // Rec. 709 BOOST_LOG(info) << "Color coding [Rec. 709]"sv; ctx->color_primaries = AVCOL_PRI_BT709; ctx->color_trc = AVCOL_TRC_BT709; ctx->colorspace = AVCOL_SPC_BT709; sws_color_space = SWS_CS_ITU709; break; case 2: // Rec. 2020 BOOST_LOG(info) << "Color coding [Rec. 2020]"sv; ctx->color_primaries = AVCOL_PRI_BT2020; ctx->color_trc = AVCOL_TRC_BT2020_10; ctx->colorspace = AVCOL_SPC_BT2020_NCL; sws_color_space = SWS_CS_BT2020; break; } BOOST_LOG(info) << "Color range: ["sv << ((config.encoderCscMode & 0x1) ? "JPEG"sv : "MPEG"sv) << ']'; AVPixelFormat sw_fmt; if(config.dynamicRange == 0) { sw_fmt = encoder.static_pix_fmt; } else { sw_fmt = encoder.dynamic_pix_fmt; } buffer_t hwdevice_ctx; if(hardware) { ctx->pix_fmt = encoder.dev_pix_fmt; auto buf_or_error = encoder.make_hwdevice_ctx(hwdevice); if(buf_or_error.has_right()) { return std::nullopt; } hwdevice_ctx = std::move(buf_or_error.left()); if(hwframe_ctx(ctx, hwdevice_ctx, sw_fmt)) { return std::nullopt; } ctx->slices = config.slicesPerFrame; } else /* software */ { ctx->pix_fmt = sw_fmt; // Clients will request for the fewest slices per frame to get the // most efficient encode, but we may want to provide more slices than // requested to ensure we have enough parallelism for good performance. ctx->slices = std::max(config.slicesPerFrame, config::video.min_threads); } ctx->thread_type = FF_THREAD_SLICE; ctx->thread_count = ctx->slices; AVDictionary *options {nullptr}; auto handle_option = [&options](const encoder_t::option_t &option) { std::visit(util::overloaded { [&](int v) { av_dict_set_int(&options, option.name.c_str(), v, 0); }, [&](int *v) { av_dict_set_int(&options, option.name.c_str(), *v, 0); }, [&](std::optional *v) { if(*v) av_dict_set_int(&options, option.name.c_str(), **v, 0); }, [&](const std::string &v) { av_dict_set(&options, option.name.c_str(), v.c_str(), 0); }, [&](std::string *v) { if(!v->empty()) av_dict_set(&options, option.name.c_str(), v->c_str(), 0); } }, option.value); }; for(auto &option : video_format.options) { handle_option(option); } if(config.bitrate > 500) { auto bitrate = config.bitrate * 1000; ctx->rc_max_rate = bitrate; ctx->rc_buffer_size = bitrate / config.framerate; ctx->bit_rate = bitrate; ctx->rc_min_rate = bitrate; } else if(video_format.crf && config::video.crf != 0) { handle_option(*video_format.crf); } else if(video_format.qp) { handle_option(*video_format.qp); } else { BOOST_LOG(error) << "Couldn't set video quality: encoder "sv << encoder.name << " doesn't support either crf or qp"sv; return std::nullopt; } avcodec_open2(ctx.get(), codec, &options); frame_t frame {av_frame_alloc() }; frame->format = ctx->pix_fmt; frame->width = ctx->width; frame->height = ctx->height; if(hardware) { frame->hw_frames_ctx = av_buffer_ref(ctx->hw_frames_ctx); } else /* software */ { av_frame_get_buffer(frame.get(), 0); } util::wrap_ptr device; if(!hwdevice->data) { auto device_tmp = std::make_unique(); if(device_tmp->init(width, height, config.width, config.height, frame.get(), sw_fmt)) { return std::nullopt; } device = std::move(device_tmp); } else { device = hwdevice; } device->set_colorspace(sws_color_space, ctx->color_range); return std::make_optional(session_t { std::move(ctx), std::move(frame), std::move(device) }); } void encode_run( int &frame_nr, int &key_frame_nr, // Store progress of the frame number safe::signal_t* shutdown_event, // Signal for shutdown event of the session packet_queue_t packets, idr_event_t idr_events, img_event_t images, config_t config, int width, int height, platf::hwdevice_t *hwdevice, safe::signal_t &reinit_event, const encoder_t &encoder, void *channel_data) { auto session = make_session(encoder, config, width, height, hwdevice); if(!session) { return; } auto delay = std::chrono::floor(1s) / config.framerate; auto next_frame = std::chrono::steady_clock::now(); while(true) { if(shutdown_event->peek() || reinit_event.peek() || !images->running()) { break; } if(idr_events->peek()) { session->frame->pict_type = AV_PICTURE_TYPE_I; session->frame->key_frame = 1; auto event = idr_events->pop(); if(!event) { return; } auto end = event->second; frame_nr = end; key_frame_nr = end + config.framerate; } else if(frame_nr == key_frame_nr) { session->frame->pict_type = AV_PICTURE_TYPE_I; session->frame->key_frame = 1; } std::this_thread::sleep_until(next_frame); next_frame += delay; // When Moonlight request an IDR frame, send frames even if there is no new captured frame if(frame_nr > (key_frame_nr + config.framerate) || images->peek()) { if(auto img = images->pop(delay)) { session->device->convert(*img); encoder.img_to_frame(*session->device->img, session->frame); } else if(images->running()) { continue; } else { break; } } if(encode(frame_nr++, session->ctx, session->frame, packets, channel_data)) { BOOST_LOG(error) << "Could not encode video packet"sv; return; } session->frame->pict_type = AV_PICTURE_TYPE_NONE; session->frame->key_frame = 0; } } std::optional make_synced_session(platf::display_t *disp, const encoder_t &encoder, platf::img_t &img, sync_session_ctx_t &ctx) { sync_session_t encode_session; encode_session.ctx = &ctx; encode_session.next_frame = std::chrono::steady_clock::now(); encode_session.delay = std::chrono::nanoseconds { 1s } / ctx.config.framerate; auto pix_fmt = ctx.config.dynamicRange == 0 ? map_pix_fmt(encoder.static_pix_fmt) : map_pix_fmt(encoder.dynamic_pix_fmt); auto hwdevice = disp->make_hwdevice(ctx.config.width, ctx.config.height, pix_fmt); if(!hwdevice) { return std::nullopt; } auto session = make_session(encoder, ctx.config, img.width, img.height, hwdevice.get()); if(!session) { return std::nullopt; } encode_session.img_tmp = &img; encode_session.hwdevice = std::move(hwdevice); encode_session.session = std::move(*session); return std::move(encode_session); } encode_e encode_run_sync(std::vector> &synced_session_ctxs, encode_session_ctx_queue_t &encode_session_ctx_queue) { const auto &encoder = encoders.front(); std::shared_ptr disp; while(encode_session_ctx_queue.running()) { reset_display(disp, encoder.dev_type); if(disp) { break; } std::this_thread::sleep_for(200ms); } if(!disp) { return encode_e::error; } auto img = disp->alloc_img(); auto img_tmp = img.get(); if(disp->dummy_img(img_tmp)) { return encode_e::error; } std::vector synced_sessions; for(auto &ctx : synced_session_ctxs) { auto synced_session = make_synced_session(disp.get(), encoder, *img, *ctx); if(!synced_session) { return encode_e::error; } synced_sessions.emplace_back(std::move(*synced_session)); } auto next_frame = std::chrono::steady_clock::now(); while(encode_session_ctx_queue.running()) { while(encode_session_ctx_queue.peek()) { auto encode_session_ctx = encode_session_ctx_queue.pop(); if(!encode_session_ctx) { return encode_e::ok; } synced_session_ctxs.emplace_back(std::make_unique(std::move(*encode_session_ctx))); auto encode_session = make_synced_session(disp.get(), encoder, *img, *synced_session_ctxs.back()); if(!encode_session) { return encode_e::error; } synced_sessions.emplace_back(std::move(*encode_session)); next_frame = std::chrono::steady_clock::now(); } auto delay = std::max(0ms, std::chrono::duration_cast(next_frame - std::chrono::steady_clock::now())); auto status = disp->snapshot(img.get(), delay, display_cursor); switch(status) { case platf::capture_e::reinit: case platf::capture_e::error: return status; case platf::capture_e::timeout: break; case platf::capture_e::ok: img_tmp = img.get(); break; } auto now = std::chrono::steady_clock::now(); next_frame = now + 1s; KITTY_WHILE_LOOP(auto pos = std::begin(synced_sessions), pos != std::end(synced_sessions), { auto ctx = pos->ctx; if(ctx->shutdown_event->peek()) { // Let waiting thread know it can delete shutdown_event ctx->join_event->raise(true); pos = synced_sessions.erase(pos); synced_session_ctxs.erase(std::find_if(std::begin(synced_session_ctxs), std::end(synced_session_ctxs), [&ctx_p=ctx](auto &ctx) { return ctx.get() == ctx_p; })); if(synced_sessions.empty()) { return encode_e::ok; } continue; } if(ctx->idr_events->peek()) { pos->session.frame->pict_type = AV_PICTURE_TYPE_I; pos->session.frame->key_frame = 1; auto event = ctx->idr_events->pop(); auto end = event->second; ctx->frame_nr = end; ctx->key_frame_nr = end + ctx->config.framerate; } else if(ctx->frame_nr == ctx->key_frame_nr) { pos->session.frame->pict_type = AV_PICTURE_TYPE_I; pos->session.frame->key_frame = 1; } if(img_tmp) { pos->img_tmp = img_tmp; } auto timeout = now > pos->next_frame; if(timeout) { pos->next_frame += pos->delay; } next_frame = std::min(next_frame, pos->next_frame); if(!timeout) { ++pos; continue; } if(pos->img_tmp) { if(pos->hwdevice->convert(*pos->img_tmp)) { BOOST_LOG(error) << "Could not convert image"sv; ctx->shutdown_event->raise(true); continue; } pos->img_tmp = nullptr; encoder.img_to_frame(*pos->hwdevice->img, pos->session.frame); } if(encode(ctx->frame_nr++, pos->session.ctx, pos->session.frame, ctx->packets, ctx->channel_data)) { BOOST_LOG(error) << "Could not encode video packet"sv; ctx->shutdown_event->raise(true); continue; } pos->session.frame->pict_type = AV_PICTURE_TYPE_NONE; pos->session.frame->key_frame = 0; ++pos; }) img_tmp = nullptr; } return encode_e::ok; } void captureThreadSync() { auto ref = capture_thread_sync.ref(); std::vector> synced_session_ctxs; auto &ctx = ref->encode_session_ctx_queue; auto lg = util::fail_guard([&]() { ctx.stop(); for(auto &ctx : synced_session_ctxs) { ctx->shutdown_event->raise(true); ctx->join_event->raise(true); } for(auto &ctx : ctx.unsafe()) { ctx.shutdown_event->raise(true); ctx.join_event->raise(true); } }); while(encode_run_sync(synced_session_ctxs, ctx) == encode_e::reinit); } void capture_async( safe::signal_t *shutdown_event, packet_queue_t &packets, idr_event_t &idr_events, config_t &config, void *channel_data) { auto images = std::make_shared(); auto lg = util::fail_guard([&]() { images->stop(); shutdown_event->raise(true); }); auto ref = capture_thread_async.ref(); if(!ref) { return; } auto delay = std::chrono::floor(1s) / config.framerate; ref->capture_ctx_queue->raise(capture_ctx_t { images, delay }); if(!ref->capture_ctx_queue->running()) { return; } int frame_nr = 1; int key_frame_nr = 1; while(!shutdown_event->peek() && images->running()) { // Wait for the main capture event when the display is being reinitialized if(ref->reinit_event.peek()) { std::this_thread::sleep_for(100ms); continue; } // Wait for the display to be ready std::shared_ptr display; { auto lg = ref->display_wp.lock(); if(ref->display_wp->expired()) { continue; } display = ref->display_wp->lock(); } auto pix_fmt = config.dynamicRange == 0 ? platf::pix_fmt_e::yuv420p : platf::pix_fmt_e::yuv420p10; auto hwdevice = display->make_hwdevice(config.width, config.height, pix_fmt); if(!hwdevice) { return; } auto dummy_img = display->alloc_img(); if(display->dummy_img(dummy_img.get())) { return; } images->raise(std::move(dummy_img)); encode_run( frame_nr, key_frame_nr, shutdown_event, packets, idr_events, images, config, display->width, display->height, hwdevice.get(), ref->reinit_event, *ref->encoder_p, channel_data); } } void capture( safe::signal_t *shutdown_event, packet_queue_t packets, idr_event_t idr_events, config_t config, void *channel_data) { idr_events->raise(std::make_pair(0, 1)); if(encoders.front().system_memory) { capture_async(shutdown_event, packets, idr_events, config, channel_data); } else { safe::signal_t join_event; auto ref = capture_thread_sync.ref(); ref->encode_session_ctx_queue.raise(sync_session_ctx_t { shutdown_event, &join_event, packets, idr_events, config, 1, 1, channel_data }); // Wait for join signal join_event.view(); } } bool validate_config(std::shared_ptr &disp, const encoder_t &encoder, const config_t &config) { reset_display(disp, encoder.dev_type); if(!disp) { return false; } auto pix_fmt = config.dynamicRange == 0 ? map_pix_fmt(encoder.static_pix_fmt) : map_pix_fmt(encoder.dynamic_pix_fmt); auto hwdevice = disp->make_hwdevice(config.width, config.height, pix_fmt); if(!hwdevice) { return false; } auto session = make_session(encoder, config, disp->width, disp->height, hwdevice.get()); if(!session) { return false; } auto img = disp->alloc_img(); if(disp->dummy_img(img.get())) { return false; } if(session->device->convert(*img)) { return false; } encoder.img_to_frame(*hwdevice->img, session->frame); session->frame->pict_type = AV_PICTURE_TYPE_I; auto packets = std::make_shared(30); if(encode(1, session->ctx, session->frame, packets, nullptr)) { return false; } return true; } bool validate_encoder(encoder_t &encoder) { std::shared_ptr disp; auto force_hevc = config::video.hevc_mode >= 2; auto test_hevc = force_hevc || (config::video.hevc_mode == 0 && encoder.hevc_mode); encoder.h264.capabilities.set(); encoder.hevc.capabilities.set(); // First, test encoder viability config_t config_max_ref_frames { 1920, 1080, 60, 1000, 1, 1, 1, 0, 0 }; config_t config_autoselect { 1920, 1080, 60, 1000, 1, 0, 1, 0, 0 }; auto max_ref_frames_h264 = validate_config(disp, encoder, config_max_ref_frames); auto autoselect_h264 = validate_config(disp, encoder, config_autoselect); if(!max_ref_frames_h264 && !autoselect_h264) { return false; } encoder.h264[encoder_t::REF_FRAMES_RESTRICT] = max_ref_frames_h264; encoder.h264[encoder_t::REF_FRAMES_AUTOSELECT] = autoselect_h264; encoder.h264[encoder_t::PASSED] = true; if(test_hevc) { config_max_ref_frames.videoFormat = 1; config_autoselect.videoFormat = 1; auto max_ref_frames_hevc = validate_config(disp, encoder, config_max_ref_frames); auto autoselect_hevc = validate_config(disp, encoder, config_autoselect); // If HEVC must be supported, but it is not supported if(force_hevc && !max_ref_frames_hevc && !autoselect_hevc) { return false; } encoder.hevc[encoder_t::REF_FRAMES_RESTRICT] = max_ref_frames_hevc; encoder.hevc[encoder_t::REF_FRAMES_AUTOSELECT] = autoselect_hevc; } encoder.hevc[encoder_t::PASSED] = test_hevc; std::vector> configs { { encoder_t::DYNAMIC_RANGE, { 1920, 1080, 60, 1000, 1, 0, 1, 1, 1 } } }; for(auto &[flag, config] : configs) { auto h264 = config; auto hevc = config; h264.videoFormat = 0; hevc.videoFormat = 1; encoder.h264[flag] = validate_config(disp, encoder, h264); if(test_hevc && encoder.hevc[encoder_t::PASSED]) { encoder.hevc[flag] = validate_config(disp, encoder, hevc); } } return true; } int init() { KITTY_WHILE_LOOP(auto pos = std::begin(encoders), pos != std::end(encoders), { if( (!config::video.encoder.empty() && pos->name != config::video.encoder) || !validate_encoder(*pos) || (config::video.hevc_mode == 3 && !pos->hevc[encoder_t::DYNAMIC_RANGE]) ) { pos = encoders.erase(pos); continue; } break; }) if(encoders.empty()) { if(config::video.encoder.empty()) { BOOST_LOG(fatal) << "Couldn't find any encoder"sv; } else { BOOST_LOG(fatal) << "Couldn't find any encoder matching ["sv << config::video.encoder << ']'; } return -1; } auto &encoder = encoders.front(); if(encoder.hevc[encoder_t::PASSED]) { BOOST_LOG(info) << "Found encoder "sv << encoder.name << ": ["sv << encoder.h264.name << ", "sv << encoder.hevc.name << ']'; } else { BOOST_LOG(info) << "Found encoder "sv << encoder.name << ": ["sv << encoder.h264.name << ']'; } if(config::video.hevc_mode == 0) { config::video.hevc_mode = encoder.hevc[encoder_t::PASSED] ? (encoder.hevc[encoder_t::DYNAMIC_RANGE] ? 3 : 2) : 1; } return 0; } util::Either make_hwdevice_ctx(AVHWDeviceType type, void *hwdevice) { buffer_t ctx; int err; if(hwdevice) { ctx.reset(av_hwdevice_ctx_alloc(type)); ((AVHWDeviceContext*)ctx.get())->hwctx = hwdevice; err = av_hwdevice_ctx_init(ctx.get()); } else { AVBufferRef *ref {}; err = av_hwdevice_ctx_create(&ref, type, nullptr, nullptr, 0); ctx.reset(ref); } if(err < 0) { return err; } return ctx; } int hwframe_ctx(ctx_t &ctx, buffer_t &hwdevice, AVPixelFormat format) { buffer_t frame_ref { av_hwframe_ctx_alloc(hwdevice.get())}; auto frame_ctx = (AVHWFramesContext*)frame_ref->data; frame_ctx->format = ctx->pix_fmt; frame_ctx->sw_format = format; frame_ctx->height = ctx->height; frame_ctx->width = ctx->width; frame_ctx->initial_pool_size = 0; if(auto err = av_hwframe_ctx_init(frame_ref.get()); err < 0) { return err; } ctx->hw_frames_ctx = av_buffer_ref(frame_ref.get()); return 0; } void sw_img_to_frame(const platf::img_t &img, frame_t &frame) {} #ifdef _WIN32 void nv_d3d_img_to_frame(const platf::img_t &img, frame_t &frame) { if(img.data == frame->data[0]) { return; } // Need to have something refcounted if(!frame->buf[0]) { frame->buf[0] = av_buffer_allocz(sizeof(AVD3D11FrameDescriptor)); } auto desc = (AVD3D11FrameDescriptor*)frame->buf[0]->data; desc->texture = (ID3D11Texture2D*)img.data; desc->index = 0; frame->data[0] = img.data; frame->data[1] = 0; frame->linesize[0] = img.row_pitch; frame->height = img.height; frame->width = img.width; } void amd_d3d_img_to_frame(const platf::img_t &img, frame_t &frame) { if(img.data == frame->data[0]) { return; } // Need to have something refcounted if(!frame->buf[0]) { frame->buf[0] = av_buffer_allocz(sizeof(AVD3D11FrameDescriptor)); } auto desc = (AVD3D11FrameDescriptor*)frame->buf[0]->data; desc->texture = (ID3D11Texture2D*)img.data; desc->index = 0; frame->data[0] = img.data; frame->data[1] = 0; frame->linesize[0] = img.row_pitch; frame->height = img.height; frame->width = img.width; } util::Either nv_d3d_make_hwdevice_ctx(platf::hwdevice_t *hwdevice_ctx) { buffer_t ctx_buf { av_hwdevice_ctx_alloc(AV_HWDEVICE_TYPE_D3D11VA) }; auto ctx = (AVD3D11VADeviceContext*)((AVHWDeviceContext*)ctx_buf->data)->hwctx; std::fill_n((std::uint8_t*)ctx, sizeof(AVD3D11VADeviceContext), 0); auto device = (ID3D11Device*)hwdevice_ctx->data; device->AddRef(); ctx->device = device; auto err = av_hwdevice_ctx_init(ctx_buf.get()); if(err) { char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Failed to create FFMpeg nvenc: "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, err); return err; } return ctx_buf; } util::Either amd_d3d_make_hwdevice_ctx(platf::hwdevice_t *hwdevice_ctx) { buffer_t ctx_buf { av_hwdevice_ctx_alloc(AV_HWDEVICE_TYPE_D3D11VA) }; auto ctx = (AVD3D11VADeviceContext*)((AVHWDeviceContext*)ctx_buf->data)->hwctx; std::fill_n((std::uint8_t*)ctx, sizeof(AVD3D11VADeviceContext), 0); auto device = (ID3D11Device*)hwdevice_ctx->data; device->AddRef(); ctx->device = device; auto err = av_hwdevice_ctx_init(ctx_buf.get()); if(err) { char err_str[AV_ERROR_MAX_STRING_SIZE] {0}; BOOST_LOG(error) << "Failed to create FFMpeg amddech: "sv << av_make_error_string(err_str, AV_ERROR_MAX_STRING_SIZE, err); return err; } return ctx_buf; } #endif int start_capture_async(capture_thread_async_ctx_t &capture_thread_ctx) { capture_thread_ctx.encoder_p = &encoders.front(); capture_thread_ctx.reinit_event.reset(); capture_thread_ctx.capture_ctx_queue = std::make_shared>(30); capture_thread_ctx.capture_thread = std::thread { captureThread, capture_thread_ctx.capture_ctx_queue, std::ref(capture_thread_ctx.display_wp), std::ref(capture_thread_ctx.reinit_event), std::ref(*capture_thread_ctx.encoder_p) }; return 0; } void end_capture_async(capture_thread_async_ctx_t &capture_thread_ctx) { capture_thread_ctx.capture_ctx_queue->stop(); capture_thread_ctx.capture_thread.join(); } int start_capture_sync(capture_thread_sync_ctx_t &ctx) { std::thread { &captureThreadSync }.detach(); return 0; } void end_capture_sync(capture_thread_sync_ctx_t &ctx) {} platf::dev_type_e map_dev_type(AVHWDeviceType type) { switch(type) { case AV_HWDEVICE_TYPE_D3D11VA: return platf::dev_type_e::dxgi; case AV_PICTURE_TYPE_NONE: return platf::dev_type_e::none; default: return platf::dev_type_e::unknown; } return platf::dev_type_e::unknown; } platf::pix_fmt_e map_pix_fmt(AVPixelFormat fmt) { switch(fmt) { case AV_PIX_FMT_YUV420P10: return platf::pix_fmt_e::yuv420p10; case AV_PIX_FMT_YUV420P: return platf::pix_fmt_e::yuv420p; case AV_PIX_FMT_NV12: return platf::pix_fmt_e::nv12; case AV_PIX_FMT_P010: return platf::pix_fmt_e::p010; default: return platf::pix_fmt_e::unknown; } return platf::pix_fmt_e::unknown; } }