/* * This file is part of mpv. * * With some chunks from original MPlayer VAAPI patch: * Copyright (C) 2008-2009 Splitted-Desktop Systems * * mpv is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * mpv is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with mpv. If not, see <http://www.gnu.org/licenses/>. */ #include #include #include #include #include #include "lavc.h" #include "mpvcore/mp_common.h" #include "mpvcore/av_common.h" #include "video/fmt-conversion.h" #include "video/vaapi.h" #include "video/decode/dec_video.h" #include "video/filter/vf.h" /* * The VAAPI decoder can work only with surfaces passed to the decoder at * creation time. This means all surfaces have to be created in advance. * So, in addition to the maximum number of reference frames, we need * surfaces for: * - 1 decode frame * - decoding 1 frame ahead (done by generic playback code) * - keeping the reference to the previous frame (done by vo_vaapi.c) * Note that redundant additional surfaces also might allow for some * buffering (i.e. not trying to reuse a surface while it's busy). */ #define ADDTIONAL_SURFACES 3 // Magic number taken from original MPlayer vaapi patch.
#define MAX_DECODER_SURFACES 21 #define MAX_SURFACES (MAX_DECODER_SURFACES + ADDTIONAL_SURFACES) struct priv { struct mp_vaapi_ctx *ctx; VADisplay display; // libavcodec shared struct struct vaapi_context *va_context; struct vaapi_context va_context_storage; int format, w, h; VASurfaceID surfaces[MAX_SURFACES]; struct va_surface_pool *pool; int rt_format; }; struct profile_entry { enum AVCodecID av_codec; int maxrefs; const VAProfile *va_profiles; }; #define RP(...) __VA_ARGS__ #define PE(av_codec_id, maxrefs, ...) \ {AV_CODEC_ID_ ## av_codec_id, \ maxrefs, (const VAProfile[]) {RP __VA_ARGS__, -1}} static const struct profile_entry profiles[] = { PE(MPEG2VIDEO, 2, (VAProfileMPEG2Main, VAProfileMPEG2Simple)), PE(H264, 16, (VAProfileH264High, VAProfileH264Main, VAProfileH264Baseline)), PE(WMV3, 2, (VAProfileVC1Main, VAProfileVC1Simple)), PE(VC1, 2, (VAProfileVC1Advanced)), PE(MPEG4, 2, (VAProfileMPEG4Main, VAProfileMPEG4AdvancedSimple, VAProfileMPEG4Simple)), }; static const struct profile_entry *find_codec(enum AVCodecID id) { for (int n = 0; n < MP_ARRAY_SIZE(profiles); n++) { if (profiles[n].av_codec == id) return &profiles[n]; } return NULL; } static const char *str_va_profile(VAProfile profile) { switch (profile) { #define PROFILE(profile) \ case VAProfile##profile: return "VAProfile" #profile PROFILE(MPEG2Simple); PROFILE(MPEG2Main); PROFILE(MPEG4Simple); PROFILE(MPEG4AdvancedSimple); PROFILE(MPEG4Main); PROFILE(H264Baseline); PROFILE(H264Main); PROFILE(H264High); PROFILE(VC1Simple); PROFILE(VC1Main); PROFILE(VC1Advanced); #undef PROFILE } return ""; } static int find_entrypoint(int format, VAEntrypoint *ep, int num_ep) { int entrypoint = -1; switch (format) { case IMGFMT_VAAPI: entrypoint = VAEntrypointVLD; break; case IMGFMT_VAAPI_MPEG2_IDCT: entrypoint = VAEntrypointIDCT; break; case IMGFMT_VAAPI_MPEG2_MOCO: entrypoint = VAEntrypointMoComp; break; } for (int n = 0; n < num_ep; n++) { if (ep[n] == entrypoint) return entrypoint; } return -1; } static int 
is_direct_mapping(VADisplay display) { VADisplayAttribute attr; VAStatus status; #if VA_CHECK_VERSION(0,34,0) attr.type = VADisplayAttribRenderMode; attr.flags = VA_DISPLAY_ATTRIB_GETTABLE; status = vaGetDisplayAttributes(display, &attr, 1); if (status == VA_STATUS_SUCCESS) return !(attr.value & (VA_RENDER_MODE_LOCAL_OVERLAY| VA_RENDER_MODE_EXTERNAL_OVERLAY)); #else /* If the driver doesn't make a copy of the VA surface for display, then we have to retain it until it's no longer the visible surface. In other words, if the driver is using DirectSurface mode, we don't want to decode the new surface into the previous one that was used for display. */ attr.type = VADisplayAttribDirectSurface; attr.flags = VA_DISPLAY_ATTRIB_GETTABLE; status = vaGetDisplayAttributes(display, &attr, 1); if (status == VA_STATUS_SUCCESS) return !attr.value; #endif return 0; } // We must allocate only surfaces that were passed to the decoder on creation. // We achieve this by reserving surfaces in the pool as needed. // Releasing surfaces is necessary after filling the surface id list so // that reserved surfaces can be reused for decoding. 
static bool preallocate_surfaces(struct lavc_ctx *ctx, int num) { struct priv *p = ctx->hwdec_priv; if (!va_surface_pool_reserve(p->pool, num, p->w, p->h)) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Could not allocate surfaces.\n"); return false; } for (int i = 0; i < num; i++) { struct va_surface *s = va_surface_pool_get(p->pool, p->w, p->h); p->surfaces[i] = s->id; va_surface_release(s); } return true; } static void destroy_decoder(struct lavc_ctx *ctx) { struct priv *p = ctx->hwdec_priv; if (p->va_context->context_id != VA_INVALID_ID) { vaDestroyContext(p->display, p->va_context->context_id); p->va_context->context_id = VA_INVALID_ID; } if (p->va_context->config_id != VA_INVALID_ID) { vaDestroyConfig(p->display, p->va_context->config_id); p->va_context->config_id = VA_INVALID_ID; } for (int n = 0; n < MAX_SURFACES; n++) p->surfaces[n] = VA_INVALID_ID; } static bool has_profile(VAProfile *va_profiles, int num_profiles, VAProfile p) { for (int i = 0; i < num_profiles; i++) { if (va_profiles[i] == p) return true; } return false; } static int create_decoder(struct lavc_ctx *ctx) { void *tmp = talloc_new(NULL); struct priv *p = ctx->hwdec_priv; VAStatus status; int res = -1; assert(IMGFMT_IS_VAAPI(p->format)); destroy_decoder(ctx); const struct profile_entry *pe = find_codec(ctx->avctx->codec_id); if (!pe) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Unknown codec!\n"); goto error; } int num_profiles = vaMaxNumProfiles(p->display); VAProfile *va_profiles = talloc_zero_array(tmp, VAProfile, num_profiles); status = vaQueryConfigProfiles(p->display, va_profiles, &num_profiles); if (!check_va_status(status, "vaQueryConfigProfiles()")) goto error; mp_msg(MSGT_VO, MSGL_DBG2, "[vaapi] %d profiles available:\n", num_profiles); for (int i = 0; i < num_profiles; i++) mp_msg(MSGT_VO, MSGL_DBG2, " %s\n", str_va_profile(va_profiles[i])); VAProfile va_profile = -1; for (int n = 0; ; n++) { if (pe->va_profiles[n] == -1) break; if (has_profile(va_profiles, num_profiles, pe->va_profiles[n])) { 
va_profile = pe->va_profiles[n]; break; } } if (va_profile == -1) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] No decoder profile available.\n"); goto error; } mp_msg(MSGT_VO, MSGL_V, "[vaapi] Using profile '%s'.\n", str_va_profile(va_profile)); int num_surfaces = pe->maxrefs; if (!is_direct_mapping(p->display)) { mp_msg(MSGT_VO, MSGL_V, "[vaapi] No direct mapping.\n"); // Note: not sure why it has to be *=2 rather than +=1. num_surfaces *= 2; } num_surfaces = MPMIN(num_surfaces, MAX_DECODER_SURFACES) + ADDTIONAL_SURFACES; if (num_surfaces > MAX_SURFACES) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Internal error: too many surfaces.\n"); goto error; } if (!preallocate_surfaces(ctx, num_surfaces)) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Could not allocate surfaces.\n"); goto error; } int num_ep = vaMaxNumEntrypoints(p->display); VAEntrypoint *ep = talloc_zero_array(tmp, VAEntrypoint, num_ep); status = vaQueryConfigEntrypoints(p->display, va_profile, ep, &num_ep); if (!check_va_status(status, "vaQueryConfigEntrypoints()")) goto error; VAEntrypoint entrypoint = find_entrypoint(p->format, ep, num_ep); if (entrypoint < 0) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Could not find VA entrypoint.\n"); goto error; } VAConfigAttrib attrib = { .type = VAConfigAttribRTFormat, }; status = vaGetConfigAttributes(p->display, va_profile, entrypoint, &attrib, 1); if (!check_va_status(status, "vaGetConfigAttributes()")) goto error; if ((attrib.value & p->rt_format) == 0) { mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Chroma format not supported.\n"); goto error; } status = vaCreateConfig(p->display, va_profile, entrypoint, &attrib, 1, &p->va_context->config_id); if (!check_va_status(status, "vaCreateConfig()")) goto error; status = vaCreateContext(p->display, p->va_context->config_id, p->w, p->h, VA_PROGRESSIVE, p->surfaces, num_surfaces, &p->va_context->context_id); if (!check_va_status(status, "vaCreateContext()")) goto error; res = 0; error: talloc_free(tmp); return res; } static struct mp_image 
*allocate_image(struct lavc_ctx *ctx, int format, int w, int h) { struct priv *p = ctx->hwdec_priv; if (!IMGFMT_IS_VAAPI(format)) return NULL; if (format != p->format || w != p->w || h != p->h || p->va_context->context_id == VA_INVALID_ID) { p->format = format; p->w = w; p->h = h; if (create_decoder(ctx) < 0) return NULL; } struct va_surface *s = va_surface_pool_get(p->pool, p->w, p->h); if (s) { for (int n = 0; n < MAX_SURFACES; n++) { if (p->surfaces[n] == s->id) return va_surface_wrap(s); } va_surface_release(s); } mp_msg(MSGT_VO, MSGL_ERR, "[vaapi] Insufficient number of surfaces.\n"); return NULL; } static void uninit(struct lavc_ctx *ctx) { struct priv *p = ctx->hwdec_priv; if (!p) return; destroy_decoder(ctx); va_surface_pool_release(p->pool); talloc_free(p); ctx->hwdec_priv = NULL; } static int init(struct lavc_ctx *ctx) { struct priv *p = talloc_ptrtype(NULL, p); *p = (struct priv) { .ctx = ctx->hwdec_info->vaapi_ctx, .va_context = &p->va_context_storage, .rt_format = VA_RT_FORMAT_YUV420 }; p->display = p->ctx->display; p->pool = va_surface_pool_alloc(p->display, p->rt_format); p->va_context->display = p->display; p->va_context->config_id = VA_INVALID_ID; p->va_context->context_id = VA_INVALID_ID; ctx->avctx->hwaccel_context = p->va_context; ctx->hwdec_priv = p; return 0; } static int probe(struct vd_lavc_hwdec *hwdec, struct mp_hwdec_info *info, const char *decoder) { if (!info || !info->vaapi_ctx) return HWDEC_ERR_NO_CTX; if (!find_codec(mp_codec_to_av_codec_id(decoder))) return HWDEC_ERR_NO_CODEC; return 0; } const struct vd_lavc_hwdec mp_vd_lavc_vaapi = { .type = HWDEC_VAAPI, .image_formats = (const int[]) {IMGFMT_VAAPI, IMGFMT_VAAPI_MPEG2_IDCT, IMGFMT_VAAPI_MPEG2_MOCO, 0}, .probe = probe, .init = init, .uninit = uninit, .allocate_image = allocate_image, };