#include "audio/aframe.h" #include "audio/chmap_sel.h" #include "audio/format.h" #include "common/common.h" #include "common/msg.h" #include "video/hwdec.h" #include "video/mp_image.h" #include "video/mp_image_pool.h" #include "f_autoconvert.h" #include "f_hwtransfer.h" #include "f_swresample.h" #include "f_swscale.h" #include "f_utils.h" #include "filter.h" #include "filter_internal.h" struct priv { struct mp_log *log; struct mp_subfilter sub; bool force_update; int *imgfmts; int *subfmts; int num_imgfmts; struct mp_image_params imgparams; bool imgparams_set; // Enable special conversion for the final stage before the VO. bool vo_convert; // sws state int in_imgfmt, in_subfmt; int *afmts; int num_afmts; int *srates; int num_srates; struct mp_chmap_sel chmaps; int in_afmt, in_srate; struct mp_chmap in_chmap; double audio_speed; bool resampling_forced; bool format_change_blocked; bool format_change_cont; struct mp_autoconvert public; }; // Dummy filter for bundling sub-conversion filters. static const struct mp_filter_info convert_filter = { .name = "convert", }; void mp_autoconvert_clear(struct mp_autoconvert *c) { struct priv *p = c->f->priv; p->num_imgfmts = 0; p->imgparams_set = false; p->num_afmts = 0; p->num_srates = 0; p->chmaps = (struct mp_chmap_sel){0}; p->force_update = true; } void mp_autoconvert_add_imgfmt(struct mp_autoconvert *c, int imgfmt, int subfmt) { struct priv *p = c->f->priv; MP_TARRAY_GROW(p, p->imgfmts, p->num_imgfmts); MP_TARRAY_GROW(p, p->subfmts, p->num_imgfmts); p->imgfmts[p->num_imgfmts] = imgfmt; p->subfmts[p->num_imgfmts] = subfmt; p->num_imgfmts += 1; p->force_update = true; } void mp_autoconvert_set_target_image_params(struct mp_autoconvert *c, struct mp_image_params *par) { struct priv *p = c->f->priv; if (p->imgparams_set && mp_image_params_equal(&p->imgparams, par) && p->num_imgfmts == 1 && p->imgfmts[0] == par->imgfmt && p->subfmts[0] == par->hw_subfmt) return; p->imgparams = *par; p->imgparams_set = true; p->num_imgfmts = 0; mp_autoconvert_add_imgfmt(c, par->imgfmt, par->hw_subfmt); } void mp_autoconvert_add_all_sw_imgfmts(struct mp_autoconvert *c) { for (int n = IMGFMT_START; n < IMGFMT_END; n++) { if (!IMGFMT_IS_HWACCEL(n)) mp_autoconvert_add_imgfmt(c, n, 0); } } void mp_autoconvert_add_afmt(struct mp_autoconvert *c, int afmt) { struct priv *p = c->f->priv; MP_TARRAY_APPEND(p, p->afmts, p->num_afmts, afmt); p->force_update = true; } void mp_autoconvert_add_chmap(struct mp_autoconvert *c, struct mp_chmap *chmap) { struct priv *p = c->f->priv; mp_chmap_sel_add_map(&p->chmaps, chmap); p->force_update = true; } void mp_autoconvert_add_srate(struct mp_autoconvert *c, int rate) { struct priv *p = c->f->priv; MP_TARRAY_APPEND(p, p->srates, p->num_srates, rate); // Some other API we call expects a 0-terminated sample rates array. MP_TARRAY_GROW(p, p->srates, p->num_srates); p->srates[p->num_srates] = 0; p->force_update = true; } // If this returns true, and *out==NULL, no conversion is necessary. static bool build_image_converter(struct mp_autoconvert *c, struct mp_log *log, struct mp_image *img, struct mp_filter **f_out) { struct mp_filter *f = c->f; struct priv *p = f->priv; *f_out = NULL; if (!p->num_imgfmts) return true; for (int n = 0; n < p->num_imgfmts; n++) { bool samefmt = img->params.imgfmt == p->imgfmts[n]; bool samesubffmt = img->params.hw_subfmt == p->subfmts[n]; /* * In practice, `p->subfmts` is not usually populated today, in which * case we must actively probe formats below to establish if the VO can * accept the subfmt being used by the hwdec. */ if (samefmt && samesubffmt) { if (p->imgparams_set) { if (!mp_image_params_static_equal(&p->imgparams, &img->params)) break; } return true; } } struct mp_filter *conv = mp_filter_create(f, &convert_filter); if (!conv) return false; mp_filter_add_pin(conv, MP_PIN_IN, "in"); mp_filter_add_pin(conv, MP_PIN_OUT, "out"); // 0: hw->sw download // 1: swscale // 2: sw->hw upload struct mp_filter *filters[3] = {0}; bool need_sws = true; bool force_sws_params = false; struct mp_image_params imgpar = img->params; int *fmts = p->imgfmts; int num_fmts = p->num_imgfmts; int hwupload_fmt = 0; bool imgfmt_is_sw = !IMGFMT_IS_HWACCEL(img->imgfmt); // This should not happen. But not enough guarantee to make it an assert(). if (imgfmt_is_sw != !img->hwctx) mp_warn(log, "Unexpected AVFrame/imgfmt hardware context mismatch.\n"); bool dst_all_hw = true; bool dst_have_sw = false; bool has_src_hw_fmt = false; for (int n = 0; n < num_fmts; n++) { bool is_hw = IMGFMT_IS_HWACCEL(fmts[n]); dst_all_hw &= is_hw; dst_have_sw |= !is_hw; has_src_hw_fmt |= is_hw && fmts[n] == imgpar.imgfmt; } // Source is hw, some targets are sw -> try to download. bool hw_to_sw = !imgfmt_is_sw && dst_have_sw; if (has_src_hw_fmt) { int src_fmt = img->params.hw_subfmt; /* * If the source format is a hardware format, and our output supports * that hardware format, we prioritize preserving the use of that * hardware format. In most cases, the sub format will also be supported * and no conversion will be required, but in some cases, the hwdec * may be able to output formats that the VO cannot display, and * hardware format conversion becomes necessary. */ struct mp_hwupload upload = mp_hwupload_create(conv, imgpar.imgfmt, src_fmt, true); if (upload.successful_init) { if (upload.f) { mp_info(log, "Converting %s[%s] -> %s[%s]\n", mp_imgfmt_to_name(imgpar.imgfmt), mp_imgfmt_to_name(src_fmt), mp_imgfmt_to_name(imgpar.imgfmt), mp_imgfmt_to_name(upload.selected_sw_imgfmt)); filters[2] = upload.f; } hw_to_sw = false; need_sws = false; } else { mp_err(log, "Failed to create HW uploader for format %s\n", mp_imgfmt_to_name(src_fmt)); } } else if (dst_all_hw && num_fmts > 0) { bool upload_created = false; int sw_fmt = imgfmt_is_sw ? img->imgfmt : img->params.hw_subfmt; for (int i = 0; i < num_fmts; i++) { // We can probably use this! Very lazy and very approximate. struct mp_hwupload upload = mp_hwupload_create(conv, fmts[i], sw_fmt, false); if (upload.successful_init) { mp_info(log, "HW-uploading to %s\n", mp_imgfmt_to_name(fmts[i])); filters[2] = upload.f; hwupload_fmt = upload.selected_sw_imgfmt; fmts = &hwupload_fmt; num_fmts = hwupload_fmt ? 1 : 0; hw_to_sw = false; // We cannot do format conversions when transferring between // two hardware devices, so reject this format if that would be // required. if (!imgfmt_is_sw && hwupload_fmt != sw_fmt) { mp_err(log, "Format %s is not supported by %s\n", mp_imgfmt_to_name(sw_fmt), mp_imgfmt_to_name(p->imgfmts[i])); continue; } upload_created = true; break; } } if (!upload_created) { mp_err(log, "Failed to create HW uploader for format %s\n", mp_imgfmt_to_name(sw_fmt)); } } int src_fmt = img->imgfmt; if (hw_to_sw) { mp_info(log, "HW-downloading from %s\n", mp_imgfmt_to_name(img->imgfmt)); int res_fmt = mp_image_hw_download_get_sw_format(img); if (!res_fmt) { mp_err(log, "cannot copy surface of this format to CPU memory\n"); goto fail; } struct mp_hwdownload *hwd = mp_hwdownload_create(conv); if (hwd) { filters[0] = hwd->f; src_fmt = res_fmt; // Downloading from hw will obviously change the parameters. We // stupidly don't know the result parameters, but if it's // sufficiently sane, it will only do the following. imgpar.imgfmt = src_fmt; imgpar.hw_subfmt = 0; // Try to compensate for in-sane cases. mp_image_params_guess_csp(&imgpar); } } if (p->imgparams_set) { force_sws_params |= !mp_image_params_equal(&imgpar, &p->imgparams); need_sws |= force_sws_params; } if (!imgfmt_is_sw && dst_all_hw) { // This is a hw -> hw upload, so the sw format must already be // mutually understood. No conversion can be done. need_sws = false; } if (need_sws) { // Create a new conversion filter. struct mp_sws_filter *sws = mp_sws_filter_create(conv); if (!sws) { mp_err(log, "error creating conversion filter\n"); goto fail; } sws->force_scaler = c->force_scaler; int out = mp_sws_find_best_out_format(sws, src_fmt, fmts, num_fmts); if (!out) { mp_err(log, "can't find video conversion for %s\n", mp_imgfmt_to_name(src_fmt)); goto fail; } if (out == src_fmt && !force_sws_params) { // Can happen if hwupload goes to same format. talloc_free(sws->f); } else { sws->out_format = out; sws->out_params = p->imgparams; sws->use_out_params = force_sws_params; mp_info(log, "Converting %s -> %s\n", mp_imgfmt_to_name(src_fmt), mp_imgfmt_to_name(sws->out_format)); filters[1] = sws->f; } } mp_chain_filters(conv->ppins[0], conv->ppins[1], filters, 3); *f_out = conv; return true; fail: talloc_free(conv); return false; } bool mp_autoconvert_probe_input_video(struct mp_autoconvert *c, struct mp_image *img) { struct mp_filter *conv = NULL; bool res = build_image_converter(c, mp_null_log, img, &conv); talloc_free(conv); return res; } static void handle_video_frame(struct mp_filter *f) { struct priv *p = f->priv; struct mp_image *img = p->sub.frame.data; if (p->force_update) p->in_imgfmt = p->in_subfmt = 0; if (img->imgfmt == p->in_imgfmt && img->params.hw_subfmt == p->in_subfmt) { mp_subfilter_continue(&p->sub); return; } if (!mp_subfilter_drain_destroy(&p->sub)) { MP_VERBOSE(f, "Sub-filter requires draining but we must destroy it now.\n"); mp_subfilter_destroy(&p->sub); } p->in_imgfmt = img->params.imgfmt; p->in_subfmt = img->params.hw_subfmt; p->force_update = false; struct mp_filter *conv = NULL; if (build_image_converter(&p->public, p->log, img, &conv)) { p->sub.filter = conv; mp_subfilter_continue(&p->sub); } else { mp_filter_internal_mark_failed(f); } } static void handle_audio_frame(struct mp_filter *f) { struct priv *p = f->priv; struct mp_aframe *aframe = p->sub.frame.data; int afmt = mp_aframe_get_format(aframe); int srate = mp_aframe_get_rate(aframe); struct mp_chmap chmap = {0}; mp_aframe_get_chmap(aframe, &chmap); if (p->resampling_forced && !af_fmt_is_pcm(afmt)) { MP_WARN(p, "ignoring request to resample non-PCM audio for speed change\n"); p->resampling_forced = false; } bool format_change = afmt != p->in_afmt || srate != p->in_srate || !mp_chmap_equals(&chmap, &p->in_chmap) || p->force_update; if (!format_change && (!p->resampling_forced || p->sub.filter)) goto cont; if (!mp_subfilter_drain_destroy(&p->sub)) return; if (format_change && p->public.on_audio_format_change) { if (p->format_change_blocked) return; if (!p->format_change_cont) { p->format_change_blocked = true; p->public. on_audio_format_change(p->public.on_audio_format_change_opaque); return; } p->format_change_cont = false; } p->in_afmt = afmt; p->in_srate = srate; p->in_chmap = chmap; p->force_update = false; int out_afmt = 0; int best_score = 0; for (int n = 0; n < p->num_afmts; n++) { int score = af_format_conversion_score(p->afmts[n], afmt); if (!out_afmt || score > best_score) { best_score = score; out_afmt = p->afmts[n]; } } if (!out_afmt) out_afmt = afmt; // (The p->srates array is 0-terminated already.) int out_srate = af_select_best_samplerate(srate, p->srates); if (out_srate <= 0) out_srate = p->num_srates ? p->srates[0] : srate; struct mp_chmap out_chmap = chmap; if (p->chmaps.num_chmaps) { if (!mp_chmap_sel_adjust(&p->chmaps, &out_chmap)) out_chmap = p->chmaps.chmaps[0]; // violently force fallback } if (out_afmt == p->in_afmt && out_srate == p->in_srate && mp_chmap_equals(&out_chmap, &p->in_chmap) && !p->resampling_forced) { goto cont; } MP_VERBOSE(p, "inserting resampler\n"); struct mp_swresample *s = mp_swresample_create(f, NULL); if (!s) abort(); s->out_format = out_afmt; s->out_rate = out_srate; s->out_channels = out_chmap; p->sub.filter = s->f; cont: if (p->sub.filter) { struct mp_filter_command cmd = { .type = MP_FILTER_COMMAND_SET_SPEED_RESAMPLE, .speed = p->audio_speed, }; mp_filter_command(p->sub.filter, &cmd); } mp_subfilter_continue(&p->sub); } static void autoconvert_process(struct mp_filter *f) { struct priv *p = f->priv; if (!mp_subfilter_read(&p->sub)) return; if (p->sub.frame.type == MP_FRAME_VIDEO) { handle_video_frame(f); return; } if (p->sub.frame.type == MP_FRAME_AUDIO) { handle_audio_frame(f); return; } mp_subfilter_continue(&p->sub); } void mp_autoconvert_format_change_continue(struct mp_autoconvert *c) { struct priv *p = c->f->priv; if (p->format_change_blocked) { p->format_change_cont = true; p->format_change_blocked = false; mp_filter_wakeup(c->f); } } static bool autoconvert_command(struct mp_filter *f, struct mp_filter_command *cmd) { struct priv *p = f->priv; if (cmd->type == MP_FILTER_COMMAND_SET_SPEED_RESAMPLE) { p->audio_speed = cmd->speed; // If we needed resampling once, keep forcing resampling, as it might be // quickly changing between 1.0 and other values for A/V compensation. if (p->audio_speed != 1.0) p->resampling_forced = true; return true; } if (cmd->type == MP_FILTER_COMMAND_IS_ACTIVE) { cmd->is_active = !!p->sub.filter; return true; } return false; } static void autoconvert_reset(struct mp_filter *f) { struct priv *p = f->priv; mp_subfilter_reset(&p->sub); p->format_change_cont = false; p->format_change_blocked = false; } static void autoconvert_destroy(struct mp_filter *f) { struct priv *p = f->priv; mp_subfilter_reset(&p->sub); TA_FREEP(&p->sub.filter); } static const struct mp_filter_info autoconvert_filter = { .name = "autoconvert", .priv_size = sizeof(struct priv), .process = autoconvert_process, .command = autoconvert_command, .reset = autoconvert_reset, .destroy = autoconvert_destroy, }; struct mp_autoconvert *mp_autoconvert_create(struct mp_filter *parent) { struct mp_filter *f = mp_filter_create(parent, &autoconvert_filter); if (!f) return NULL; mp_filter_add_pin(f, MP_PIN_IN, "in"); mp_filter_add_pin(f, MP_PIN_OUT, "out"); struct priv *p = f->priv; p->public.f = f; p->log = f->log; p->audio_speed = 1.0; p->sub.in = f->ppins[0]; p->sub.out = f->ppins[1]; return &p->public; }