| /* |
| * This file is part of FFmpeg. |
| * |
| * FFmpeg is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Lesser General Public |
| * License as published by the Free Software Foundation; either |
| * version 2.1 of the License, or (at your option) any later version. |
| * |
| * FFmpeg is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Lesser General Public License for more details. |
| * |
| * You should have received a copy of the GNU Lesser General Public |
| * License along with FFmpeg; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| */ |
| |
| #define CL_USE_DEPRECATED_OPENCL_1_2_APIS |
| |
| #include <string.h> |
| |
| #include "config.h" |
| |
| #include "avassert.h" |
| #include "avstring.h" |
| #include "common.h" |
| #include "hwcontext.h" |
| #include "hwcontext_internal.h" |
| #include "hwcontext_opencl.h" |
| #include "mem.h" |
| #include "pixdesc.h" |
| |
| #if HAVE_OPENCL_VAAPI_BEIGNET |
| #include <unistd.h> |
| #include <va/va.h> |
| #include <va/va_drmcommon.h> |
| #include <CL/cl_intel.h> |
| #include "hwcontext_vaapi.h" |
| #endif |
| |
| #if HAVE_OPENCL_DRM_BEIGNET |
| #include <unistd.h> |
| #include <CL/cl_intel.h> |
| #include "hwcontext_drm.h" |
| #endif |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| #if CONFIG_LIBMFX |
| #include <mfx/mfxstructures.h> |
| #endif |
| #include <va/va.h> |
| #include <CL/cl_va_api_media_sharing_intel.h> |
| #include "hwcontext_vaapi.h" |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| #define COBJMACROS |
| #include <CL/cl_dx9_media_sharing.h> |
| #include <dxva2api.h> |
| #include "hwcontext_dxva2.h" |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| #include <CL/cl_d3d11.h> |
| #include "hwcontext_d3d11va.h" |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| #include <CL/cl_ext.h> |
| #include <drm_fourcc.h> |
| #include "hwcontext_drm.h" |
| #endif |
| |
| |
| typedef struct OpenCLDeviceContext { |
| // Default command queue to use for transfer/mapping operations on |
| // the device. If the user supplies one, this is a reference to it. |
| // Otherwise, it is newly-created. |
| cl_command_queue command_queue; |
| |
| // The platform the context exists on. This is needed to query and |
| // retrieve extension functions. |
| cl_platform_id platform_id; |
| |
| // Platform/device-specific functions. |
| #if HAVE_OPENCL_DRM_BEIGNET |
| int beignet_drm_mapping_usable; |
| clCreateImageFromFdINTEL_fn clCreateImageFromFdINTEL; |
| #endif |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| int qsv_mapping_usable; |
| clCreateFromVA_APIMediaSurfaceINTEL_fn |
| clCreateFromVA_APIMediaSurfaceINTEL; |
| clEnqueueAcquireVA_APIMediaSurfacesINTEL_fn |
| clEnqueueAcquireVA_APIMediaSurfacesINTEL; |
| clEnqueueReleaseVA_APIMediaSurfacesINTEL_fn |
| clEnqueueReleaseVA_APIMediaSurfacesINTEL; |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| int dxva2_mapping_usable; |
| cl_dx9_media_adapter_type_khr dx9_media_adapter_type; |
| |
| clCreateFromDX9MediaSurfaceKHR_fn |
| clCreateFromDX9MediaSurfaceKHR; |
| clEnqueueAcquireDX9MediaSurfacesKHR_fn |
| clEnqueueAcquireDX9MediaSurfacesKHR; |
| clEnqueueReleaseDX9MediaSurfacesKHR_fn |
| clEnqueueReleaseDX9MediaSurfacesKHR; |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| int d3d11_mapping_usable; |
| clCreateFromD3D11Texture2DKHR_fn |
| clCreateFromD3D11Texture2DKHR; |
| clEnqueueAcquireD3D11ObjectsKHR_fn |
| clEnqueueAcquireD3D11ObjectsKHR; |
| clEnqueueReleaseD3D11ObjectsKHR_fn |
| clEnqueueReleaseD3D11ObjectsKHR; |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| int drm_arm_mapping_usable; |
| #endif |
| } OpenCLDeviceContext; |
| |
| typedef struct OpenCLFramesContext { |
| // Command queue used for transfer/mapping operations on this frames |
| // context. If the user supplies one, this is a reference to it. |
| // Otherwise, it is a reference to the default command queue for the |
| // device. |
| cl_command_queue command_queue; |
| |
| #if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
| // For mapping APIs which have separate creation and acquire/release |
| // steps, this stores the OpenCL memory objects corresponding to each |
| // frame. |
| int nb_mapped_frames; |
| AVOpenCLFrameDescriptor *mapped_frames; |
| #endif |
| } OpenCLFramesContext; |
| |
| |
| static void CL_CALLBACK opencl_error_callback(const char *errinfo, |
| const void *private_info, |
| size_t cb, |
| void *user_data) |
| { |
| AVHWDeviceContext *ctx = user_data; |
| av_log(ctx, AV_LOG_ERROR, "OpenCL error: %s\n", errinfo); |
| } |
| |
| static void opencl_device_free(AVHWDeviceContext *hwdev) |
| { |
| AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
| cl_int cle; |
| |
| cle = clReleaseContext(hwctx->context); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to release OpenCL " |
| "context: %d.\n", cle); |
| } |
| } |
| |
| static struct { |
| const char *key; |
| cl_platform_info name; |
| } opencl_platform_params[] = { |
| { "platform_profile", CL_PLATFORM_PROFILE }, |
| { "platform_version", CL_PLATFORM_VERSION }, |
| { "platform_name", CL_PLATFORM_NAME }, |
| { "platform_vendor", CL_PLATFORM_VENDOR }, |
| { "platform_extensions", CL_PLATFORM_EXTENSIONS }, |
| }; |
| |
| static struct { |
| const char *key; |
| cl_device_info name; |
| } opencl_device_params[] = { |
| { "device_name", CL_DEVICE_NAME }, |
| { "device_vendor", CL_DEVICE_VENDOR }, |
| { "driver_version", CL_DRIVER_VERSION }, |
| { "device_version", CL_DEVICE_VERSION }, |
| { "device_profile", CL_DEVICE_PROFILE }, |
| { "device_extensions", CL_DEVICE_EXTENSIONS }, |
| }; |
| |
| static struct { |
| const char *key; |
| cl_device_type type; |
| } opencl_device_types[] = { |
| { "cpu", CL_DEVICE_TYPE_CPU }, |
| { "gpu", CL_DEVICE_TYPE_GPU }, |
| { "accelerator", CL_DEVICE_TYPE_ACCELERATOR }, |
| { "custom", CL_DEVICE_TYPE_CUSTOM }, |
| { "default", CL_DEVICE_TYPE_DEFAULT }, |
| { "all", CL_DEVICE_TYPE_ALL }, |
| }; |
| |
| static char *opencl_get_platform_string(cl_platform_id platform_id, |
| cl_platform_info key) |
| { |
| char *str; |
| size_t size; |
| cl_int cle; |
| cle = clGetPlatformInfo(platform_id, key, 0, NULL, &size); |
| if (cle != CL_SUCCESS) |
| return NULL; |
| str = av_malloc(size); |
| if (!str) |
| return NULL; |
| cle = clGetPlatformInfo(platform_id, key, size, str, &size); |
| if (cle != CL_SUCCESS) { |
| av_free(str); |
| return NULL; |
| } |
| av_assert0(strlen(str) + 1 == size); |
| return str; |
| } |
| |
| static char *opencl_get_device_string(cl_device_id device_id, |
| cl_device_info key) |
| { |
| char *str; |
| size_t size; |
| cl_int cle; |
| cle = clGetDeviceInfo(device_id, key, 0, NULL, &size); |
| if (cle != CL_SUCCESS) |
| return NULL; |
| str = av_malloc(size); |
| if (!str) |
| return NULL; |
| cle = clGetDeviceInfo(device_id, key, size, str, &size); |
| if (cle != CL_SUCCESS) { |
| av_free(str); |
| return NULL; |
| } |
| av_assert0(strlen(str) + 1== size); |
| return str; |
| } |
| |
| static int opencl_check_platform_extension(cl_platform_id platform_id, |
| const char *name) |
| { |
| char *str; |
| int found = 0; |
| str = opencl_get_platform_string(platform_id, |
| CL_PLATFORM_EXTENSIONS); |
| if (str && strstr(str, name)) |
| found = 1; |
| av_free(str); |
| return found; |
| } |
| |
| static int opencl_check_device_extension(cl_device_id device_id, |
| const char *name) |
| { |
| char *str; |
| int found = 0; |
| str = opencl_get_device_string(device_id, |
| CL_DEVICE_EXTENSIONS); |
| if (str && strstr(str, name)) |
| found = 1; |
| av_free(str); |
| return found; |
| } |
| |
| static av_unused int opencl_check_extension(AVHWDeviceContext *hwdev, |
| const char *name) |
| { |
| AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
| OpenCLDeviceContext *priv = hwdev->internal->priv; |
| |
| if (opencl_check_platform_extension(priv->platform_id, name)) { |
| av_log(hwdev, AV_LOG_DEBUG, |
| "%s found as platform extension.\n", name); |
| return 1; |
| } |
| |
| if (opencl_check_device_extension(hwctx->device_id, name)) { |
| av_log(hwdev, AV_LOG_DEBUG, |
| "%s found as device extension.\n", name); |
| return 1; |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_enumerate_platforms(AVHWDeviceContext *hwdev, |
| cl_uint *nb_platforms, |
| cl_platform_id **platforms, |
| void *context) |
| { |
| cl_int cle; |
| |
| cle = clGetPlatformIDs(0, NULL, nb_platforms); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get number of " |
| "OpenCL platforms: %d.\n", cle); |
| return AVERROR(ENODEV); |
| } |
| av_log(hwdev, AV_LOG_DEBUG, "%u OpenCL platforms found.\n", |
| *nb_platforms); |
| |
| *platforms = av_malloc_array(*nb_platforms, sizeof(**platforms)); |
| if (!*platforms) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetPlatformIDs(*nb_platforms, *platforms, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get list of OpenCL " |
| "platforms: %d.\n", cle); |
| av_freep(platforms); |
| return AVERROR(ENODEV); |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_filter_platform(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context) |
| { |
| AVDictionary *opts = context; |
| const AVDictionaryEntry *param; |
| char *str; |
| int i, ret = 0; |
| |
| for (i = 0; i < FF_ARRAY_ELEMS(opencl_platform_params); i++) { |
| param = av_dict_get(opts, opencl_platform_params[i].key, |
| NULL, 0); |
| if (!param) |
| continue; |
| |
| str = opencl_get_platform_string(platform_id, |
| opencl_platform_params[i].name); |
| if (!str) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query %s " |
| "of platform \"%s\".\n", |
| opencl_platform_params[i].key, platform_name); |
| return AVERROR_UNKNOWN; |
| } |
| if (!av_stristr(str, param->value)) { |
| av_log(hwdev, AV_LOG_DEBUG, "%s does not match (\"%s\").\n", |
| param->key, str); |
| ret = 1; |
| } |
| av_free(str); |
| } |
| |
| return ret; |
| } |
| |
| static int opencl_enumerate_devices(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| cl_uint *nb_devices, |
| cl_device_id **devices, |
| void *context) |
| { |
| cl_int cle; |
| |
| cle = clGetDeviceIDs(platform_id, CL_DEVICE_TYPE_ALL, |
| 0, NULL, nb_devices); |
| if (cle == CL_DEVICE_NOT_FOUND) { |
| av_log(hwdev, AV_LOG_DEBUG, "No devices found " |
| "on platform \"%s\".\n", platform_name); |
| *nb_devices = 0; |
| return 0; |
| } else if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
| "on platform \"%s\": %d.\n", platform_name, cle); |
| return AVERROR(ENODEV); |
| } |
| av_log(hwdev, AV_LOG_DEBUG, "%u OpenCL devices found on " |
| "platform \"%s\".\n", *nb_devices, platform_name); |
| |
| *devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
| if (!*devices) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetDeviceIDs(platform_id, CL_DEVICE_TYPE_ALL, |
| *nb_devices, *devices, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get list of devices " |
| "on platform \"%s\": %d.\n", platform_name, cle); |
| av_freep(devices); |
| return AVERROR(ENODEV); |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_filter_device(AVHWDeviceContext *hwdev, |
| cl_device_id device_id, |
| const char *device_name, |
| void *context) |
| { |
| AVDictionary *opts = context; |
| const AVDictionaryEntry *param; |
| char *str; |
| int i, ret = 0; |
| |
| param = av_dict_get(opts, "device_type", NULL, 0); |
| if (param) { |
| cl_device_type match_type = 0, device_type; |
| cl_int cle; |
| |
| for (i = 0; i < FF_ARRAY_ELEMS(opencl_device_types); i++) { |
| if (!strcmp(opencl_device_types[i].key, param->value)) { |
| match_type = opencl_device_types[i].type; |
| break; |
| } |
| } |
| if (!match_type) { |
| av_log(hwdev, AV_LOG_ERROR, "Unknown device type %s.\n", |
| param->value); |
| return AVERROR(EINVAL); |
| } |
| |
| cle = clGetDeviceInfo(device_id, CL_DEVICE_TYPE, |
| sizeof(device_type), &device_type, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query device type " |
| "of device \"%s\".\n", device_name); |
| return AVERROR_UNKNOWN; |
| } |
| |
| if (!(device_type & match_type)) { |
| av_log(hwdev, AV_LOG_DEBUG, "device_type does not match.\n"); |
| return 1; |
| } |
| } |
| |
| for (i = 0; i < FF_ARRAY_ELEMS(opencl_device_params); i++) { |
| param = av_dict_get(opts, opencl_device_params[i].key, |
| NULL, 0); |
| if (!param) |
| continue; |
| |
| str = opencl_get_device_string(device_id, |
| opencl_device_params[i].name); |
| if (!str) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query %s " |
| "of device \"%s\".\n", |
| opencl_device_params[i].key, device_name); |
| return AVERROR_UNKNOWN; |
| } |
| if (!av_stristr(str, param->value)) { |
| av_log(hwdev, AV_LOG_DEBUG, "%s does not match (\"%s\").\n", |
| param->key, str); |
| ret = 1; |
| } |
| av_free(str); |
| } |
| |
| return ret; |
| } |
| |
| typedef struct OpenCLDeviceSelector { |
| int platform_index; |
| int device_index; |
| void *context; |
| int (*enumerate_platforms)(AVHWDeviceContext *hwdev, |
| cl_uint *nb_platforms, |
| cl_platform_id **platforms, |
| void *context); |
| int (*filter_platform) (AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context); |
| int (*enumerate_devices) (AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| cl_uint *nb_devices, |
| cl_device_id **devices, |
| void *context); |
| int (*filter_device) (AVHWDeviceContext *hwdev, |
| cl_device_id device_id, |
| const char *device_name, |
| void *context); |
| } OpenCLDeviceSelector; |
| |
| static int opencl_device_create_internal(AVHWDeviceContext *hwdev, |
| const OpenCLDeviceSelector *selector, |
| cl_context_properties *props) |
| { |
| cl_uint nb_platforms; |
| cl_platform_id *platforms = NULL; |
| cl_platform_id platform_id; |
| cl_uint nb_devices; |
| cl_device_id *devices = NULL; |
| AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
| cl_int cle; |
| cl_context_properties default_props[3]; |
| char *platform_name_src = NULL, |
| *device_name_src = NULL; |
| int err, found, p, d; |
| |
| av_assert0(selector->enumerate_platforms && |
| selector->enumerate_devices); |
| |
| err = selector->enumerate_platforms(hwdev, &nb_platforms, &platforms, |
| selector->context); |
| if (err) |
| return err; |
| |
| found = 0; |
| for (p = 0; p < nb_platforms; p++) { |
| const char *platform_name; |
| |
| if (selector->platform_index >= 0 && |
| selector->platform_index != p) |
| continue; |
| |
| av_freep(&platform_name_src); |
| platform_name_src = opencl_get_platform_string(platforms[p], |
| CL_PLATFORM_NAME); |
| if (platform_name_src) |
| platform_name = platform_name_src; |
| else |
| platform_name = "Unknown Platform"; |
| |
| if (selector->filter_platform) { |
| err = selector->filter_platform(hwdev, platforms[p], |
| platform_name, |
| selector->context); |
| if (err < 0) |
| goto fail; |
| if (err > 0) |
| continue; |
| } |
| |
| err = selector->enumerate_devices(hwdev, platforms[p], platform_name, |
| &nb_devices, &devices, |
| selector->context); |
| if (err < 0) |
| continue; |
| |
| for (d = 0; d < nb_devices; d++) { |
| const char *device_name; |
| |
| if (selector->device_index >= 0 && |
| selector->device_index != d) |
| continue; |
| |
| av_freep(&device_name_src); |
| device_name_src = opencl_get_device_string(devices[d], |
| CL_DEVICE_NAME); |
| if (device_name_src) |
| device_name = device_name_src; |
| else |
| device_name = "Unknown Device"; |
| |
| if (selector->filter_device) { |
| err = selector->filter_device(hwdev, devices[d], |
| device_name, |
| selector->context); |
| if (err < 0) |
| goto fail; |
| if (err > 0) |
| continue; |
| } |
| |
| av_log(hwdev, AV_LOG_VERBOSE, "%d.%d: %s / %s\n", p, d, |
| platform_name, device_name); |
| |
| ++found; |
| platform_id = platforms[p]; |
| hwctx->device_id = devices[d]; |
| } |
| |
| av_freep(&devices); |
| } |
| |
| if (found == 0) { |
| av_log(hwdev, AV_LOG_ERROR, "No matching devices found.\n"); |
| err = AVERROR(ENODEV); |
| goto fail; |
| } |
| if (found > 1) { |
| av_log(hwdev, AV_LOG_ERROR, "More than one matching device found.\n"); |
| err = AVERROR(ENODEV); |
| goto fail; |
| } |
| |
| if (!props) { |
| props = default_props; |
| default_props[0] = CL_CONTEXT_PLATFORM; |
| default_props[1] = (intptr_t)platform_id; |
| default_props[2] = 0; |
| } else { |
| if (props[0] == CL_CONTEXT_PLATFORM && props[1] == 0) |
| props[1] = (intptr_t)platform_id; |
| } |
| |
| hwctx->context = clCreateContext(props, 1, &hwctx->device_id, |
| &opencl_error_callback, hwdev, &cle); |
| if (!hwctx->context) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to create OpenCL context: " |
| "%d.\n", cle); |
| err = AVERROR(ENODEV); |
| goto fail; |
| } |
| |
| hwdev->free = &opencl_device_free; |
| |
| err = 0; |
| fail: |
| av_freep(&platform_name_src); |
| av_freep(&device_name_src); |
| av_freep(&platforms); |
| av_freep(&devices); |
| return err; |
| } |
| |
| static int opencl_device_create(AVHWDeviceContext *hwdev, const char *device, |
| AVDictionary *opts, int flags) |
| { |
| OpenCLDeviceSelector selector = { |
| .context = opts, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_platform, |
| .enumerate_devices = &opencl_enumerate_devices, |
| .filter_device = &opencl_filter_device, |
| }; |
| |
| if (device && device[0]) { |
| // Match one or both indices for platform and device. |
| int d = -1, p = -1, ret; |
| if (device[0] == '.') |
| ret = sscanf(device, ".%d", &d); |
| else |
| ret = sscanf(device, "%d.%d", &p, &d); |
| if (ret < 1) { |
| av_log(hwdev, AV_LOG_ERROR, "Invalid OpenCL platform/device " |
| "index specification \"%s\".\n", device); |
| return AVERROR(EINVAL); |
| } |
| selector.platform_index = p; |
| selector.device_index = d; |
| } else { |
| selector.platform_index = -1; |
| selector.device_index = -1; |
| } |
| |
| return opencl_device_create_internal(hwdev, &selector, NULL); |
| } |
| |
| static int opencl_device_init(AVHWDeviceContext *hwdev) |
| { |
| AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
| OpenCLDeviceContext *priv = hwdev->internal->priv; |
| cl_int cle; |
| |
| if (hwctx->command_queue) { |
| cle = clRetainCommandQueue(hwctx->command_queue); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to retain external " |
| "command queue: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| priv->command_queue = hwctx->command_queue; |
| } else { |
| priv->command_queue = clCreateCommandQueue(hwctx->context, |
| hwctx->device_id, |
| 0, &cle); |
| if (!priv->command_queue) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to create internal " |
| "command queue: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| } |
| |
| cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_PLATFORM, |
| sizeof(priv->platform_id), &priv->platform_id, |
| NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to determine the OpenCL " |
| "platform containing the device.\n"); |
| return AVERROR(EIO); |
| } |
| |
| #define CL_FUNC(name, desc) do { \ |
| if (fail) \ |
| break; \ |
| priv->name = clGetExtensionFunctionAddressForPlatform( \ |
| priv->platform_id, #name); \ |
| if (!priv->name) { \ |
| av_log(hwdev, AV_LOG_VERBOSE, \ |
| desc " function not found (%s).\n", #name); \ |
| fail = 1; \ |
| } else { \ |
| av_log(hwdev, AV_LOG_VERBOSE, \ |
| desc " function found (%s).\n", #name); \ |
| } \ |
| } while (0) |
| |
| #if HAVE_OPENCL_DRM_BEIGNET |
| { |
| int fail = 0; |
| |
| CL_FUNC(clCreateImageFromFdINTEL, |
| "Beignet DRM to OpenCL image mapping"); |
| |
| if (fail) { |
| av_log(hwdev, AV_LOG_WARNING, "Beignet DRM to OpenCL " |
| "mapping not usable.\n"); |
| priv->beignet_drm_mapping_usable = 0; |
| } else { |
| priv->beignet_drm_mapping_usable = 1; |
| } |
| } |
| #endif |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| { |
| size_t props_size; |
| cl_context_properties *props = NULL; |
| VADisplay va_display; |
| const char *va_ext = "cl_intel_va_api_media_sharing"; |
| int i, fail = 0; |
| |
| if (!opencl_check_extension(hwdev, va_ext)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
| "required for QSV to OpenCL mapping.\n", va_ext); |
| goto no_qsv; |
| } |
| |
| cle = clGetContextInfo(hwctx->context, CL_CONTEXT_PROPERTIES, |
| 0, NULL, &props_size); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_VERBOSE, "Failed to get context " |
| "properties: %d.\n", cle); |
| goto no_qsv; |
| } |
| if (props_size == 0) { |
| av_log(hwdev, AV_LOG_VERBOSE, "Media sharing must be " |
| "enabled on context creation to use QSV to " |
| "OpenCL mapping.\n"); |
| goto no_qsv; |
| } |
| |
| props = av_malloc(props_size); |
| if (!props) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetContextInfo(hwctx->context, CL_CONTEXT_PROPERTIES, |
| props_size, props, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_VERBOSE, "Failed to get context " |
| "properties: %d.\n", cle); |
| goto no_qsv; |
| } |
| |
| va_display = NULL; |
| for (i = 0; i < (props_size / sizeof(*props) - 1); i++) { |
| if (props[i] == CL_CONTEXT_VA_API_DISPLAY_INTEL) { |
| va_display = (VADisplay)(intptr_t)props[i+1]; |
| break; |
| } |
| } |
| if (!va_display) { |
| av_log(hwdev, AV_LOG_VERBOSE, "Media sharing must be " |
| "enabled on context creation to use QSV to " |
| "OpenCL mapping.\n"); |
| goto no_qsv; |
| } |
| if (!vaDisplayIsValid(va_display)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "A valid VADisplay is " |
| "required on context creation to use QSV to " |
| "OpenCL mapping.\n"); |
| goto no_qsv; |
| } |
| |
| CL_FUNC(clCreateFromVA_APIMediaSurfaceINTEL, |
| "Intel QSV to OpenCL mapping"); |
| CL_FUNC(clEnqueueAcquireVA_APIMediaSurfacesINTEL, |
| "Intel QSV in OpenCL acquire"); |
| CL_FUNC(clEnqueueReleaseVA_APIMediaSurfacesINTEL, |
| "Intel QSV in OpenCL release"); |
| |
| if (fail) { |
| no_qsv: |
| av_log(hwdev, AV_LOG_WARNING, "QSV to OpenCL mapping " |
| "not usable.\n"); |
| priv->qsv_mapping_usable = 0; |
| } else { |
| priv->qsv_mapping_usable = 1; |
| } |
| av_free(props); |
| } |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| { |
| int fail = 0; |
| |
| CL_FUNC(clCreateFromDX9MediaSurfaceKHR, |
| "DXVA2 to OpenCL mapping"); |
| CL_FUNC(clEnqueueAcquireDX9MediaSurfacesKHR, |
| "DXVA2 in OpenCL acquire"); |
| CL_FUNC(clEnqueueReleaseDX9MediaSurfacesKHR, |
| "DXVA2 in OpenCL release"); |
| |
| if (fail) { |
| av_log(hwdev, AV_LOG_WARNING, "DXVA2 to OpenCL mapping " |
| "not usable.\n"); |
| priv->dxva2_mapping_usable = 0; |
| } else { |
| priv->dx9_media_adapter_type = CL_ADAPTER_D3D9EX_KHR; |
| priv->dxva2_mapping_usable = 1; |
| } |
| } |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| { |
| const char *d3d11_ext = "cl_khr_d3d11_sharing"; |
| const char *nv12_ext = "cl_intel_d3d11_nv12_media_sharing"; |
| int fail = 0; |
| |
| if (!opencl_check_extension(hwdev, d3d11_ext)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
| "required for D3D11 to OpenCL mapping.\n", d3d11_ext); |
| fail = 1; |
| } else if (!opencl_check_extension(hwdev, nv12_ext)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "The %s extension may be " |
| "required for D3D11 to OpenCL mapping.\n", nv12_ext); |
| // Not fatal. |
| } |
| |
| CL_FUNC(clCreateFromD3D11Texture2DKHR, |
| "D3D11 to OpenCL mapping"); |
| CL_FUNC(clEnqueueAcquireD3D11ObjectsKHR, |
| "D3D11 in OpenCL acquire"); |
| CL_FUNC(clEnqueueReleaseD3D11ObjectsKHR, |
| "D3D11 in OpenCL release"); |
| |
| if (fail) { |
| av_log(hwdev, AV_LOG_WARNING, "D3D11 to OpenCL mapping " |
| "not usable.\n"); |
| priv->d3d11_mapping_usable = 0; |
| } else { |
| priv->d3d11_mapping_usable = 1; |
| } |
| } |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| { |
| const char *drm_arm_ext = "cl_arm_import_memory"; |
| const char *image_ext = "cl_khr_image2d_from_buffer"; |
| int fail = 0; |
| |
| if (!opencl_check_extension(hwdev, drm_arm_ext)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
| "required for DRM to OpenCL mapping on ARM.\n", |
| drm_arm_ext); |
| fail = 1; |
| } |
| if (!opencl_check_extension(hwdev, image_ext)) { |
| av_log(hwdev, AV_LOG_VERBOSE, "The %s extension is " |
| "required for DRM to OpenCL mapping on ARM.\n", |
| image_ext); |
| fail = 1; |
| } |
| |
| // clImportMemoryARM() is linked statically. |
| |
| if (fail) { |
| av_log(hwdev, AV_LOG_WARNING, "DRM to OpenCL mapping on ARM " |
| "not usable.\n"); |
| priv->drm_arm_mapping_usable = 0; |
| } else { |
| priv->drm_arm_mapping_usable = 1; |
| } |
| } |
| #endif |
| |
| #undef CL_FUNC |
| |
| return 0; |
| } |
| |
| static void opencl_device_uninit(AVHWDeviceContext *hwdev) |
| { |
| OpenCLDeviceContext *priv = hwdev->internal->priv; |
| cl_int cle; |
| |
| if (priv->command_queue) { |
| cle = clReleaseCommandQueue(priv->command_queue); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to release internal " |
| "command queue reference: %d.\n", cle); |
| } |
| priv->command_queue = NULL; |
| } |
| } |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| static int opencl_filter_intel_media_vaapi_platform(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context) |
| { |
| // This doesn't exist as a platform extension, so just test whether |
| // the function we will use for device enumeration exists. |
| |
| if (!clGetExtensionFunctionAddressForPlatform(platform_id, |
| "clGetDeviceIDsFromVA_APIMediaAdapterINTEL")) { |
| av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not export the " |
| "VAAPI device enumeration function.\n", platform_name); |
| return 1; |
| } else { |
| return 0; |
| } |
| } |
| |
| static int opencl_enumerate_intel_media_vaapi_devices(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| cl_uint *nb_devices, |
| cl_device_id **devices, |
| void *context) |
| { |
| VADisplay va_display = context; |
| clGetDeviceIDsFromVA_APIMediaAdapterINTEL_fn |
| clGetDeviceIDsFromVA_APIMediaAdapterINTEL; |
| cl_int cle; |
| |
| clGetDeviceIDsFromVA_APIMediaAdapterINTEL = |
| clGetExtensionFunctionAddressForPlatform(platform_id, |
| "clGetDeviceIDsFromVA_APIMediaAdapterINTEL"); |
| if (!clGetDeviceIDsFromVA_APIMediaAdapterINTEL) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
| "clGetDeviceIDsFromVA_APIMediaAdapterINTEL().\n"); |
| return AVERROR_UNKNOWN; |
| } |
| |
| cle = clGetDeviceIDsFromVA_APIMediaAdapterINTEL( |
| platform_id, CL_VA_API_DISPLAY_INTEL, va_display, |
| CL_PREFERRED_DEVICES_FOR_VA_API_INTEL, 0, NULL, nb_devices); |
| if (cle == CL_DEVICE_NOT_FOUND) { |
| av_log(hwdev, AV_LOG_DEBUG, "No VAAPI-supporting devices found " |
| "on platform \"%s\".\n", platform_name); |
| *nb_devices = 0; |
| return 0; |
| } else if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
| "on platform \"%s\": %d.\n", platform_name, cle); |
| return AVERROR_UNKNOWN; |
| } |
| |
| *devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
| if (!*devices) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetDeviceIDsFromVA_APIMediaAdapterINTEL( |
| platform_id, CL_VA_API_DISPLAY_INTEL, va_display, |
| CL_PREFERRED_DEVICES_FOR_VA_API_INTEL, *nb_devices, *devices, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get list of VAAPI-supporting " |
| "devices on platform \"%s\": %d.\n", platform_name, cle); |
| av_freep(devices); |
| return AVERROR_UNKNOWN; |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_filter_intel_media_vaapi_device(AVHWDeviceContext *hwdev, |
| cl_device_id device_id, |
| const char *device_name, |
| void *context) |
| { |
| const char *va_ext = "cl_intel_va_api_media_sharing"; |
| |
| if (opencl_check_device_extension(device_id, va_ext)) { |
| return 0; |
| } else { |
| av_log(hwdev, AV_LOG_DEBUG, "Device %s does not support the " |
| "%s extension.\n", device_name, va_ext); |
| return 1; |
| } |
| } |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| static int opencl_filter_dxva2_platform(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context) |
| { |
| const char *dx9_ext = "cl_khr_dx9_media_sharing"; |
| |
| if (opencl_check_platform_extension(platform_id, dx9_ext)) { |
| return 0; |
| } else { |
| av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
| "%s extension.\n", platform_name, dx9_ext); |
| return 1; |
| } |
| } |
| |
| static int opencl_enumerate_dxva2_devices(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| cl_uint *nb_devices, |
| cl_device_id **devices, |
| void *context) |
| { |
| IDirect3DDevice9 *device = context; |
| clGetDeviceIDsFromDX9MediaAdapterKHR_fn |
| clGetDeviceIDsFromDX9MediaAdapterKHR; |
| cl_dx9_media_adapter_type_khr media_adapter_type = CL_ADAPTER_D3D9EX_KHR; |
| cl_int cle; |
| |
| clGetDeviceIDsFromDX9MediaAdapterKHR = |
| clGetExtensionFunctionAddressForPlatform(platform_id, |
| "clGetDeviceIDsFromDX9MediaAdapterKHR"); |
| if (!clGetDeviceIDsFromDX9MediaAdapterKHR) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
| "clGetDeviceIDsFromDX9MediaAdapterKHR().\n"); |
| return AVERROR_UNKNOWN; |
| } |
| |
| cle = clGetDeviceIDsFromDX9MediaAdapterKHR( |
| platform_id, 1, &media_adapter_type, (void**)&device, |
| CL_PREFERRED_DEVICES_FOR_DX9_MEDIA_ADAPTER_KHR, |
| 0, NULL, nb_devices); |
| if (cle == CL_DEVICE_NOT_FOUND) { |
| av_log(hwdev, AV_LOG_DEBUG, "No DXVA2-supporting devices found " |
| "on platform \"%s\".\n", platform_name); |
| *nb_devices = 0; |
| return 0; |
| } else if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
| "on platform \"%s\": %d.\n", platform_name, cle); |
| return AVERROR_UNKNOWN; |
| } |
| |
| *devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
| if (!*devices) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetDeviceIDsFromDX9MediaAdapterKHR( |
| platform_id, 1, &media_adapter_type, (void**)&device, |
| CL_PREFERRED_DEVICES_FOR_DX9_MEDIA_ADAPTER_KHR, |
| *nb_devices, *devices, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get list of DXVA2-supporting " |
| "devices on platform \"%s\": %d.\n", platform_name, cle); |
| av_freep(devices); |
| return AVERROR_UNKNOWN; |
| } |
| |
| return 0; |
| } |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| static int opencl_filter_d3d11_platform(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context) |
| { |
| const char *d3d11_ext = "cl_khr_d3d11_sharing"; |
| |
| if (opencl_check_platform_extension(platform_id, d3d11_ext)) { |
| return 0; |
| } else { |
| av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
| "%s extension.\n", platform_name, d3d11_ext); |
| return 1; |
| } |
| } |
| |
| static int opencl_enumerate_d3d11_devices(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| cl_uint *nb_devices, |
| cl_device_id **devices, |
| void *context) |
| { |
| ID3D11Device *device = context; |
| clGetDeviceIDsFromD3D11KHR_fn clGetDeviceIDsFromD3D11KHR; |
| cl_int cle; |
| |
| clGetDeviceIDsFromD3D11KHR = |
| clGetExtensionFunctionAddressForPlatform(platform_id, |
| "clGetDeviceIDsFromD3D11KHR"); |
| if (!clGetDeviceIDsFromD3D11KHR) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get address of " |
| "clGetDeviceIDsFromD3D11KHR().\n"); |
| return AVERROR_UNKNOWN; |
| } |
| |
| cle = clGetDeviceIDsFromD3D11KHR(platform_id, |
| CL_D3D11_DEVICE_KHR, device, |
| CL_PREFERRED_DEVICES_FOR_D3D11_KHR, |
| 0, NULL, nb_devices); |
| if (cle == CL_DEVICE_NOT_FOUND) { |
| av_log(hwdev, AV_LOG_DEBUG, "No D3D11-supporting devices found " |
| "on platform \"%s\".\n", platform_name); |
| *nb_devices = 0; |
| return 0; |
| } else if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get number of devices " |
| "on platform \"%s\": %d.\n", platform_name, cle); |
| return AVERROR_UNKNOWN; |
| } |
| |
| *devices = av_malloc_array(*nb_devices, sizeof(**devices)); |
| if (!*devices) |
| return AVERROR(ENOMEM); |
| |
| cle = clGetDeviceIDsFromD3D11KHR(platform_id, |
| CL_D3D11_DEVICE_KHR, device, |
| CL_PREFERRED_DEVICES_FOR_D3D11_KHR, |
| *nb_devices, *devices, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to get list of D3D11-supporting " |
| "devices on platform \"%s\": %d.\n", platform_name, cle); |
| av_freep(devices); |
| return AVERROR_UNKNOWN; |
| } |
| |
| return 0; |
| } |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
| static int opencl_filter_gpu_device(AVHWDeviceContext *hwdev, |
| cl_device_id device_id, |
| const char *device_name, |
| void *context) |
| { |
| cl_device_type device_type; |
| cl_int cle; |
| |
| cle = clGetDeviceInfo(device_id, CL_DEVICE_TYPE, |
| sizeof(device_type), &device_type, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query device type " |
| "of device \"%s\".\n", device_name); |
| return AVERROR_UNKNOWN; |
| } |
| if (!(device_type & CL_DEVICE_TYPE_GPU)) { |
| av_log(hwdev, AV_LOG_DEBUG, "Device %s skipped (not GPU).\n", |
| device_name); |
| return 1; |
| } |
| |
| return 0; |
| } |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| static int opencl_filter_drm_arm_platform(AVHWDeviceContext *hwdev, |
| cl_platform_id platform_id, |
| const char *platform_name, |
| void *context) |
| { |
| const char *drm_arm_ext = "cl_arm_import_memory"; |
| |
| if (opencl_check_platform_extension(platform_id, drm_arm_ext)) { |
| return 0; |
| } else { |
| av_log(hwdev, AV_LOG_DEBUG, "Platform %s does not support the " |
| "%s extension.\n", platform_name, drm_arm_ext); |
| return 1; |
| } |
| } |
| |
| static int opencl_filter_drm_arm_device(AVHWDeviceContext *hwdev, |
| cl_device_id device_id, |
| const char *device_name, |
| void *context) |
| { |
| const char *drm_arm_ext = "cl_arm_import_memory"; |
| |
| if (opencl_check_device_extension(device_id, drm_arm_ext)) { |
| return 0; |
| } else { |
| av_log(hwdev, AV_LOG_DEBUG, "Device %s does not support the " |
| "%s extension.\n", device_name, drm_arm_ext); |
| return 1; |
| } |
| } |
| #endif |
| |
| static int opencl_device_derive(AVHWDeviceContext *hwdev, |
| AVHWDeviceContext *src_ctx, AVDictionary *opts, |
| int flags) |
| { |
| int err; |
| switch (src_ctx->type) { |
| |
| #if HAVE_OPENCL_DRM_BEIGNET |
| case AV_HWDEVICE_TYPE_DRM: |
| case AV_HWDEVICE_TYPE_VAAPI: |
| { |
| // Surface mapping works via DRM PRIME fds with no special |
| // initialisation required in advance. This just finds the |
| // Beignet ICD by name. |
| AVDictionary *selector_opts = NULL; |
| |
| err = av_dict_set(&selector_opts, "platform_vendor", "Intel", 0); |
| if (err >= 0) |
| err = av_dict_set(&selector_opts, "platform_version", "beignet", 0); |
| if (err >= 0) { |
| OpenCLDeviceSelector selector = { |
| .platform_index = -1, |
| .device_index = 0, |
| .context = selector_opts, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_platform, |
| .enumerate_devices = &opencl_enumerate_devices, |
| .filter_device = NULL, |
| }; |
| err = opencl_device_create_internal(hwdev, &selector, NULL); |
| } |
| av_dict_free(&selector_opts); |
| } |
| break; |
| #endif |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| // The generic code automatically attempts to derive from all |
| // ancestors of the given device, so we can ignore QSV devices here |
| // and just consider the inner VAAPI device it was derived from. |
| case AV_HWDEVICE_TYPE_VAAPI: |
| { |
| AVVAAPIDeviceContext *src_hwctx = src_ctx->hwctx; |
| cl_context_properties props[7] = { |
| CL_CONTEXT_PLATFORM, |
| 0, |
| CL_CONTEXT_VA_API_DISPLAY_INTEL, |
| (intptr_t)src_hwctx->display, |
| CL_CONTEXT_INTEROP_USER_SYNC, |
| CL_FALSE, |
| 0, |
| }; |
| OpenCLDeviceSelector selector = { |
| .platform_index = -1, |
| .device_index = -1, |
| .context = src_hwctx->display, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_intel_media_vaapi_platform, |
| .enumerate_devices = &opencl_enumerate_intel_media_vaapi_devices, |
| .filter_device = &opencl_filter_intel_media_vaapi_device, |
| }; |
| |
| err = opencl_device_create_internal(hwdev, &selector, props); |
| } |
| break; |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| case AV_HWDEVICE_TYPE_DXVA2: |
| { |
| AVDXVA2DeviceContext *src_hwctx = src_ctx->hwctx; |
| IDirect3DDevice9 *device; |
| HANDLE device_handle; |
| HRESULT hr; |
| |
| hr = IDirect3DDeviceManager9_OpenDeviceHandle(src_hwctx->devmgr, |
| &device_handle); |
| if (FAILED(hr)) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to open device handle " |
| "for Direct3D9 device: %lx.\n", (unsigned long)hr); |
| err = AVERROR_UNKNOWN; |
| break; |
| } |
| |
| hr = IDirect3DDeviceManager9_LockDevice(src_hwctx->devmgr, |
| device_handle, |
| &device, FALSE); |
| if (SUCCEEDED(hr)) { |
| cl_context_properties props[5] = { |
| CL_CONTEXT_PLATFORM, |
| 0, |
| CL_CONTEXT_ADAPTER_D3D9EX_KHR, |
| (intptr_t)device, |
| 0, |
| }; |
| OpenCLDeviceSelector selector = { |
| .platform_index = -1, |
| .device_index = -1, |
| .context = device, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_dxva2_platform, |
| .enumerate_devices = &opencl_enumerate_dxva2_devices, |
| .filter_device = &opencl_filter_gpu_device, |
| }; |
| |
| err = opencl_device_create_internal(hwdev, &selector, props); |
| |
| IDirect3DDeviceManager9_UnlockDevice(src_hwctx->devmgr, |
| device_handle, FALSE); |
| } else { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to lock device handle " |
| "for Direct3D9 device: %lx.\n", (unsigned long)hr); |
| err = AVERROR_UNKNOWN; |
| } |
| |
| IDirect3DDeviceManager9_CloseDeviceHandle(src_hwctx->devmgr, |
| device_handle); |
| } |
| break; |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| case AV_HWDEVICE_TYPE_D3D11VA: |
| { |
| AVD3D11VADeviceContext *src_hwctx = src_ctx->hwctx; |
| cl_context_properties props[5] = { |
| CL_CONTEXT_PLATFORM, |
| 0, |
| CL_CONTEXT_D3D11_DEVICE_KHR, |
| (intptr_t)src_hwctx->device, |
| 0, |
| }; |
| OpenCLDeviceSelector selector = { |
| .platform_index = -1, |
| .device_index = -1, |
| .context = src_hwctx->device, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_d3d11_platform, |
| .enumerate_devices = &opencl_enumerate_d3d11_devices, |
| .filter_device = &opencl_filter_gpu_device, |
| }; |
| |
| err = opencl_device_create_internal(hwdev, &selector, props); |
| } |
| break; |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| case AV_HWDEVICE_TYPE_DRM: |
| { |
| OpenCLDeviceSelector selector = { |
| .platform_index = -1, |
| .device_index = -1, |
| .context = NULL, |
| .enumerate_platforms = &opencl_enumerate_platforms, |
| .filter_platform = &opencl_filter_drm_arm_platform, |
| .enumerate_devices = &opencl_enumerate_devices, |
| .filter_device = &opencl_filter_drm_arm_device, |
| }; |
| |
| err = opencl_device_create_internal(hwdev, &selector, NULL); |
| } |
| break; |
| #endif |
| |
| default: |
| err = AVERROR(ENOSYS); |
| break; |
| } |
| |
| return err; |
| } |
| |
| static int opencl_get_plane_format(enum AVPixelFormat pixfmt, |
| int plane, int width, int height, |
| cl_image_format *image_format, |
| cl_image_desc *image_desc) |
| { |
| const AVPixFmtDescriptor *desc; |
| const AVComponentDescriptor *comp; |
| int channels = 0, order = 0, depth = 0, step = 0; |
| int wsub, hsub, alpha; |
| int c; |
| |
| if (plane >= AV_NUM_DATA_POINTERS) |
| return AVERROR(ENOENT); |
| |
| desc = av_pix_fmt_desc_get(pixfmt); |
| |
| // Only normal images are allowed. |
| if (desc->flags & (AV_PIX_FMT_FLAG_BITSTREAM | |
| AV_PIX_FMT_FLAG_HWACCEL | |
| AV_PIX_FMT_FLAG_PAL)) |
| return AVERROR(EINVAL); |
| |
| wsub = 1 << desc->log2_chroma_w; |
| hsub = 1 << desc->log2_chroma_h; |
| // Subsampled components must be exact. |
| if (width & wsub - 1 || height & hsub - 1) |
| return AVERROR(EINVAL); |
| |
| for (c = 0; c < desc->nb_components; c++) { |
| comp = &desc->comp[c]; |
| if (comp->plane != plane) |
| continue; |
| // The step size must be a power of two. |
| if (comp->step != 1 && comp->step != 2 && |
| comp->step != 4 && comp->step != 8) |
| return AVERROR(EINVAL); |
| // The bits in each component must be packed in the |
| // most-significant-bits of the relevant bytes. |
| if (comp->shift + comp->depth != 8 && |
| comp->shift + comp->depth != 16) |
| return AVERROR(EINVAL); |
| // The depth must not vary between components. |
| if (depth && comp->depth != depth) |
| return AVERROR(EINVAL); |
| // If a single data element crosses multiple bytes then |
| // it must match the native endianness. |
| if (comp->depth > 8 && |
| HAVE_BIGENDIAN == !(desc->flags & AV_PIX_FMT_FLAG_BE)) |
| return AVERROR(EINVAL); |
| // A single data element must not contain multiple samples |
| // from the same component. |
| if (step && comp->step != step) |
| return AVERROR(EINVAL); |
| |
| depth = comp->depth; |
| order = order * 10 + comp->offset / ((depth + 7) / 8) + 1; |
| step = comp->step; |
| alpha = (desc->flags & AV_PIX_FMT_FLAG_ALPHA && |
| c == desc->nb_components - 1); |
| ++channels; |
| } |
| if (channels == 0) |
| return AVERROR(ENOENT); |
| |
| memset(image_format, 0, sizeof(*image_format)); |
| memset(image_desc, 0, sizeof(*image_desc)); |
| image_desc->image_type = CL_MEM_OBJECT_IMAGE2D; |
| |
| if (plane == 0 || alpha) { |
| image_desc->image_width = width; |
| image_desc->image_height = height; |
| image_desc->image_row_pitch = step * width; |
| } else { |
| image_desc->image_width = width / wsub; |
| image_desc->image_height = height / hsub; |
| image_desc->image_row_pitch = step * width / wsub; |
| } |
| |
| if (depth <= 8) { |
| image_format->image_channel_data_type = CL_UNORM_INT8; |
| } else { |
| if (depth <= 16) |
| image_format->image_channel_data_type = CL_UNORM_INT16; |
| else |
| return AVERROR(EINVAL); |
| } |
| |
| #define CHANNEL_ORDER(order, type) \ |
| case order: image_format->image_channel_order = type; break; |
| switch (order) { |
| CHANNEL_ORDER(1, CL_R); |
| CHANNEL_ORDER(12, CL_RG); |
| CHANNEL_ORDER(1234, CL_RGBA); |
| CHANNEL_ORDER(2341, CL_ARGB); |
| CHANNEL_ORDER(3214, CL_BGRA); |
| #ifdef CL_ABGR |
| CHANNEL_ORDER(4321, CL_ABGR); |
| #endif |
| default: |
| return AVERROR(EINVAL); |
| } |
| #undef CHANNEL_ORDER |
| |
| return 0; |
| } |
| |
| static int opencl_frames_get_constraints(AVHWDeviceContext *hwdev, |
| const void *hwconfig, |
| AVHWFramesConstraints *constraints) |
| { |
| AVOpenCLDeviceContext *hwctx = hwdev->hwctx; |
| cl_uint nb_image_formats; |
| cl_image_format *image_formats = NULL; |
| cl_int cle; |
| enum AVPixelFormat pix_fmt; |
| int err, pix_fmts_found; |
| size_t max_width, max_height; |
| |
| cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_IMAGE2D_MAX_WIDTH, |
| sizeof(max_width), &max_width, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query maximum " |
| "supported image width: %d.\n", cle); |
| } else { |
| constraints->max_width = max_width; |
| } |
| cle = clGetDeviceInfo(hwctx->device_id, CL_DEVICE_IMAGE2D_MAX_HEIGHT, |
| sizeof(max_height), &max_height, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query maximum " |
| "supported image height: %d.\n", cle); |
| } else { |
| constraints->max_height = max_height; |
| } |
| av_log(hwdev, AV_LOG_DEBUG, "Maximum supported image size %dx%d.\n", |
| constraints->max_width, constraints->max_height); |
| |
| cle = clGetSupportedImageFormats(hwctx->context, |
| CL_MEM_READ_WRITE, |
| CL_MEM_OBJECT_IMAGE2D, |
| 0, NULL, &nb_image_formats); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query supported " |
| "image formats: %d.\n", cle); |
| err = AVERROR(ENOSYS); |
| goto fail; |
| } |
| if (nb_image_formats == 0) { |
| av_log(hwdev, AV_LOG_ERROR, "No image support in OpenCL " |
| "driver (zero supported image formats).\n"); |
| err = AVERROR(ENOSYS); |
| goto fail; |
| } |
| |
| image_formats = |
| av_malloc_array(nb_image_formats, sizeof(*image_formats)); |
| if (!image_formats) { |
| err = AVERROR(ENOMEM); |
| goto fail; |
| } |
| |
| cle = clGetSupportedImageFormats(hwctx->context, |
| CL_MEM_READ_WRITE, |
| CL_MEM_OBJECT_IMAGE2D, |
| nb_image_formats, |
| image_formats, NULL); |
| if (cle != CL_SUCCESS) { |
| av_log(hwdev, AV_LOG_ERROR, "Failed to query supported " |
| "image formats: %d.\n", cle); |
| err = AVERROR(ENOSYS); |
| goto fail; |
| } |
| |
| pix_fmts_found = 0; |
| for (pix_fmt = 0; pix_fmt < AV_PIX_FMT_NB; pix_fmt++) { |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| int plane, i; |
| |
| for (plane = 0;; plane++) { |
| err = opencl_get_plane_format(pix_fmt, plane, 0, 0, |
| &image_format, |
| &image_desc); |
| if (err < 0) |
| break; |
| |
| for (i = 0; i < nb_image_formats; i++) { |
| if (image_formats[i].image_channel_order == |
| image_format.image_channel_order && |
| image_formats[i].image_channel_data_type == |
| image_format.image_channel_data_type) |
| break; |
| } |
| if (i == nb_image_formats) { |
| err = AVERROR(EINVAL); |
| break; |
| } |
| } |
| if (err != AVERROR(ENOENT)) |
| continue; |
| |
| av_log(hwdev, AV_LOG_DEBUG, "Format %s supported.\n", |
| av_get_pix_fmt_name(pix_fmt)); |
| |
| err = av_reallocp_array(&constraints->valid_sw_formats, |
| pix_fmts_found + 2, |
| sizeof(*constraints->valid_sw_formats)); |
| if (err < 0) |
| goto fail; |
| constraints->valid_sw_formats[pix_fmts_found] = pix_fmt; |
| constraints->valid_sw_formats[pix_fmts_found + 1] = |
| AV_PIX_FMT_NONE; |
| ++pix_fmts_found; |
| } |
| |
| av_freep(&image_formats); |
| |
| constraints->valid_hw_formats = |
| av_malloc_array(2, sizeof(*constraints->valid_hw_formats)); |
| if (!constraints->valid_hw_formats) { |
| err = AVERROR(ENOMEM); |
| goto fail; |
| } |
| constraints->valid_hw_formats[0] = AV_PIX_FMT_OPENCL; |
| constraints->valid_hw_formats[1] = AV_PIX_FMT_NONE; |
| |
| return 0; |
| |
| fail: |
| av_freep(&image_formats); |
| return err; |
| } |
| |
| static void opencl_pool_free(void *opaque, uint8_t *data) |
| { |
| AVHWFramesContext *hwfc = opaque; |
| AVOpenCLFrameDescriptor *desc = (AVOpenCLFrameDescriptor*)data; |
| cl_int cle; |
| int p; |
| |
| for (p = 0; p < desc->nb_planes; p++) { |
| cle = clReleaseMemObject(desc->planes[p]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to release plane %d: " |
| "%d.\n", p, cle); |
| } |
| } |
| |
| av_free(desc); |
| } |
| |
| static AVBufferRef *opencl_pool_alloc(void *opaque, int size) |
| { |
| AVHWFramesContext *hwfc = opaque; |
| AVOpenCLDeviceContext *hwctx = hwfc->device_ctx->hwctx; |
| AVOpenCLFrameDescriptor *desc; |
| cl_int cle; |
| cl_mem image; |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| int err, p; |
| AVBufferRef *ref; |
| |
| desc = av_mallocz(sizeof(*desc)); |
| if (!desc) |
| return NULL; |
| |
| for (p = 0;; p++) { |
| err = opencl_get_plane_format(hwfc->sw_format, p, |
| hwfc->width, hwfc->height, |
| &image_format, &image_desc); |
| if (err == AVERROR(ENOENT)) |
| break; |
| if (err < 0) |
| goto fail; |
| |
| // For generic image objects, the pitch is determined by the |
| // implementation. |
| image_desc.image_row_pitch = 0; |
| |
| image = clCreateImage(hwctx->context, CL_MEM_READ_WRITE, |
| &image_format, &image_desc, NULL, &cle); |
| if (!image) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to create image for " |
| "plane %d: %d.\n", p, cle); |
| goto fail; |
| } |
| |
| desc->planes[p] = image; |
| } |
| |
| desc->nb_planes = p; |
| |
| ref = av_buffer_create((uint8_t*)desc, sizeof(*desc), |
| &opencl_pool_free, hwfc, 0); |
| if (!ref) |
| goto fail; |
| |
| return ref; |
| |
| fail: |
| for (p = 0; desc->planes[p]; p++) |
| clReleaseMemObject(desc->planes[p]); |
| av_free(desc); |
| return NULL; |
| } |
| |
| static int opencl_frames_init_command_queue(AVHWFramesContext *hwfc) |
| { |
| AVOpenCLFramesContext *hwctx = hwfc->hwctx; |
| OpenCLDeviceContext *devpriv = hwfc->device_ctx->internal->priv; |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| cl_int cle; |
| |
| priv->command_queue = hwctx->command_queue ? hwctx->command_queue |
| : devpriv->command_queue; |
| cle = clRetainCommandQueue(priv->command_queue); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to retain frame " |
| "command queue: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_frames_init(AVHWFramesContext *hwfc) |
| { |
| if (!hwfc->pool) { |
| hwfc->internal->pool_internal = |
| av_buffer_pool_init2(sizeof(cl_mem), hwfc, |
| &opencl_pool_alloc, NULL); |
| if (!hwfc->internal->pool_internal) |
| return AVERROR(ENOMEM); |
| } |
| |
| return opencl_frames_init_command_queue(hwfc); |
| } |
| |
| static void opencl_frames_uninit(AVHWFramesContext *hwfc) |
| { |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| cl_int cle; |
| |
| #if HAVE_OPENCL_DXVA2 || HAVE_OPENCL_D3D11 |
| int i, p; |
| for (i = 0; i < priv->nb_mapped_frames; i++) { |
| AVOpenCLFrameDescriptor *desc = &priv->mapped_frames[i]; |
| for (p = 0; p < desc->nb_planes; p++) { |
| cle = clReleaseMemObject(desc->planes[p]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to release mapped " |
| "frame object (frame %d plane %d): %d.\n", |
| i, p, cle); |
| } |
| } |
| } |
| av_freep(&priv->mapped_frames); |
| #endif |
| |
| if (priv->command_queue) { |
| cle = clReleaseCommandQueue(priv->command_queue); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to release frame " |
| "command queue: %d.\n", cle); |
| } |
| priv->command_queue = NULL; |
| } |
| } |
| |
| static int opencl_get_buffer(AVHWFramesContext *hwfc, AVFrame *frame) |
| { |
| AVOpenCLFrameDescriptor *desc; |
| int p; |
| |
| frame->buf[0] = av_buffer_pool_get(hwfc->pool); |
| if (!frame->buf[0]) |
| return AVERROR(ENOMEM); |
| |
| desc = (AVOpenCLFrameDescriptor*)frame->buf[0]->data; |
| |
| for (p = 0; p < desc->nb_planes; p++) |
| frame->data[p] = (uint8_t*)desc->planes[p]; |
| |
| frame->format = AV_PIX_FMT_OPENCL; |
| frame->width = hwfc->width; |
| frame->height = hwfc->height; |
| |
| return 0; |
| } |
| |
| static int opencl_transfer_get_formats(AVHWFramesContext *hwfc, |
| enum AVHWFrameTransferDirection dir, |
| enum AVPixelFormat **formats) |
| { |
| enum AVPixelFormat *fmts; |
| |
| fmts = av_malloc_array(2, sizeof(*fmts)); |
| if (!fmts) |
| return AVERROR(ENOMEM); |
| |
| fmts[0] = hwfc->sw_format; |
| fmts[1] = AV_PIX_FMT_NONE; |
| |
| *formats = fmts; |
| return 0; |
| } |
| |
| static int opencl_wait_events(AVHWFramesContext *hwfc, |
| cl_event *events, int nb_events) |
| { |
| cl_int cle; |
| int i; |
| |
| cle = clWaitForEvents(nb_events, events); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to wait for event " |
| "completion: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| |
| for (i = 0; i < nb_events; i++) { |
| cle = clReleaseEvent(events[i]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to release " |
| "event: %d.\n", cle); |
| } |
| } |
| |
| return 0; |
| } |
| |
| static int opencl_transfer_data_from(AVHWFramesContext *hwfc, |
| AVFrame *dst, const AVFrame *src) |
| { |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| cl_int cle; |
| size_t origin[3] = { 0, 0, 0 }; |
| size_t region[3]; |
| cl_event events[AV_NUM_DATA_POINTERS]; |
| int err, p; |
| |
| if (dst->format != hwfc->sw_format) |
| return AVERROR(EINVAL); |
| |
| for (p = 0;; p++) { |
| err = opencl_get_plane_format(hwfc->sw_format, p, |
| src->width, src->height, |
| &image_format, &image_desc); |
| if (err < 0) { |
| if (err == AVERROR(ENOENT)) |
| err = 0; |
| break; |
| } |
| |
| if (!dst->data[p]) { |
| av_log(hwfc, AV_LOG_ERROR, "Plane %d missing on " |
| "destination frame for transfer.\n", p); |
| err = AVERROR(EINVAL); |
| break; |
| } |
| |
| region[0] = image_desc.image_width; |
| region[1] = image_desc.image_height; |
| region[2] = 1; |
| |
| cle = clEnqueueReadImage(priv->command_queue, |
| (cl_mem)src->data[p], |
| CL_FALSE, origin, region, |
| dst->linesize[p], 0, |
| dst->data[p], |
| 0, NULL, &events[p]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to enqueue read of " |
| "OpenCL image plane %d: %d.\n", p, cle); |
| err = AVERROR(EIO); |
| break; |
| } |
| } |
| |
| opencl_wait_events(hwfc, events, p); |
| |
| return err; |
| } |
| |
| static int opencl_transfer_data_to(AVHWFramesContext *hwfc, |
| AVFrame *dst, const AVFrame *src) |
| { |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| cl_int cle; |
| size_t origin[3] = { 0, 0, 0 }; |
| size_t region[3]; |
| cl_event events[AV_NUM_DATA_POINTERS]; |
| int err, p; |
| |
| if (src->format != hwfc->sw_format) |
| return AVERROR(EINVAL); |
| |
| for (p = 0;; p++) { |
| err = opencl_get_plane_format(hwfc->sw_format, p, |
| src->width, src->height, |
| &image_format, &image_desc); |
| if (err < 0) { |
| if (err == AVERROR(ENOENT)) |
| err = 0; |
| break; |
| } |
| |
| if (!src->data[p]) { |
| av_log(hwfc, AV_LOG_ERROR, "Plane %d missing on " |
| "source frame for transfer.\n", p); |
| err = AVERROR(EINVAL); |
| break; |
| } |
| |
| region[0] = image_desc.image_width; |
| region[1] = image_desc.image_height; |
| region[2] = 1; |
| |
| cle = clEnqueueWriteImage(priv->command_queue, |
| (cl_mem)dst->data[p], |
| CL_FALSE, origin, region, |
| src->linesize[p], 0, |
| src->data[p], |
| 0, NULL, &events[p]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to enqueue write of " |
| "OpenCL image plane %d: %d.\n", p, cle); |
| err = AVERROR(EIO); |
| break; |
| } |
| } |
| |
| opencl_wait_events(hwfc, events, p); |
| |
| return err; |
| } |
| |
| typedef struct OpenCLMapping { |
| // The mapped addresses for each plane. |
| // The destination frame is not available when we unmap, so these |
| // need to be stored separately. |
| void *address[AV_NUM_DATA_POINTERS]; |
| } OpenCLMapping; |
| |
| static void opencl_unmap_frame(AVHWFramesContext *hwfc, |
| HWMapDescriptor *hwmap) |
| { |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| OpenCLMapping *map = hwmap->priv; |
| cl_event events[AV_NUM_DATA_POINTERS]; |
| int p, e; |
| cl_int cle; |
| |
| for (p = e = 0; p < FF_ARRAY_ELEMS(map->address); p++) { |
| if (!map->address[p]) |
| break; |
| |
| cle = clEnqueueUnmapMemObject(priv->command_queue, |
| (cl_mem)hwmap->source->data[p], |
| map->address[p], |
| 0, NULL, &events[e]); |
| if (cle != CL_SUCCESS) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to unmap OpenCL " |
| "image plane %d: %d.\n", p, cle); |
| } |
| ++e; |
| } |
| |
| opencl_wait_events(hwfc, events, e); |
| |
| av_free(map); |
| } |
| |
| static int opencl_map_frame(AVHWFramesContext *hwfc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| OpenCLFramesContext *priv = hwfc->internal->priv; |
| cl_map_flags map_flags; |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| cl_int cle; |
| OpenCLMapping *map; |
| size_t origin[3] = { 0, 0, 0 }; |
| size_t region[3]; |
| size_t row_pitch; |
| cl_event events[AV_NUM_DATA_POINTERS]; |
| int err, p; |
| |
| av_assert0(hwfc->sw_format == dst->format); |
| |
| if (flags & AV_HWFRAME_MAP_OVERWRITE && |
| !(flags & AV_HWFRAME_MAP_READ)) { |
| // This is mutually exclusive with the read/write flags, so |
| // there is no way to map with read here. |
| map_flags = CL_MAP_WRITE_INVALIDATE_REGION; |
| } else { |
| map_flags = 0; |
| if (flags & AV_HWFRAME_MAP_READ) |
| map_flags |= CL_MAP_READ; |
| if (flags & AV_HWFRAME_MAP_WRITE) |
| map_flags |= CL_MAP_WRITE; |
| } |
| |
| map = av_mallocz(sizeof(*map)); |
| if (!map) |
| return AVERROR(ENOMEM); |
| |
| for (p = 0;; p++) { |
| err = opencl_get_plane_format(hwfc->sw_format, p, |
| src->width, src->height, |
| &image_format, &image_desc); |
| if (err == AVERROR(ENOENT)) |
| break; |
| if (err < 0) |
| goto fail; |
| |
| region[0] = image_desc.image_width; |
| region[1] = image_desc.image_height; |
| region[2] = 1; |
| |
| map->address[p] = |
| clEnqueueMapImage(priv->command_queue, |
| (cl_mem)src->data[p], |
| CL_FALSE, map_flags, origin, region, |
| &row_pitch, NULL, 0, NULL, |
| &events[p], &cle); |
| if (!map->address[p]) { |
| av_log(hwfc, AV_LOG_ERROR, "Failed to map OpenCL " |
| "image plane %d: %d.\n", p, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| dst->data[p] = map->address[p]; |
| |
| av_log(hwfc, AV_LOG_DEBUG, "Map plane %d (%p -> %p).\n", |
| p, src->data[p], dst->data[p]); |
| } |
| |
| err = opencl_wait_events(hwfc, events, p); |
| if (err < 0) |
| goto fail; |
| |
| err = ff_hwframe_map_create(src->hw_frames_ctx, dst, src, |
| &opencl_unmap_frame, map); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| for (p = 0; p < AV_NUM_DATA_POINTERS; p++) { |
| if (!map->address[p]) |
| break; |
| clEnqueueUnmapMemObject(priv->command_queue, |
| (cl_mem)src->data[p], |
| map->address[p], |
| 0, NULL, &events[p]); |
| } |
| if (p > 0) |
| opencl_wait_events(hwfc, events, p); |
| av_freep(&map); |
| return err; |
| } |
| |
| #if HAVE_OPENCL_DRM_BEIGNET |
| |
| typedef struct DRMBeignetToOpenCLMapping { |
| AVFrame *drm_frame; |
| AVDRMFrameDescriptor *drm_desc; |
| |
| AVOpenCLFrameDescriptor frame; |
| } DRMBeignetToOpenCLMapping; |
| |
| static void opencl_unmap_from_drm_beignet(AVHWFramesContext *dst_fc, |
| HWMapDescriptor *hwmap) |
| { |
| DRMBeignetToOpenCLMapping *mapping = hwmap->priv; |
| cl_int cle; |
| int i; |
| |
| for (i = 0; i < mapping->frame.nb_planes; i++) { |
| cle = clReleaseMemObject(mapping->frame.planes[i]); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to release CL image " |
| "of plane %d of DRM frame: %d.\n", i, cle); |
| } |
| } |
| |
| av_free(mapping); |
| } |
| |
| static int opencl_map_from_drm_beignet(AVHWFramesContext *dst_fc, |
| AVFrame *dst, const AVFrame *src, |
| int flags) |
| { |
| AVOpenCLDeviceContext *hwctx = dst_fc->device_ctx->hwctx; |
| OpenCLDeviceContext *priv = dst_fc->device_ctx->internal->priv; |
| DRMBeignetToOpenCLMapping *mapping; |
| const AVDRMFrameDescriptor *desc; |
| cl_int cle; |
| int err, i, j, p; |
| |
| desc = (const AVDRMFrameDescriptor*)src->data[0]; |
| |
| mapping = av_mallocz(sizeof(*mapping)); |
| if (!mapping) |
| return AVERROR(ENOMEM); |
| |
| p = 0; |
| for (i = 0; i < desc->nb_layers; i++) { |
| const AVDRMLayerDescriptor *layer = &desc->layers[i]; |
| for (j = 0; j < layer->nb_planes; j++) { |
| const AVDRMPlaneDescriptor *plane = &layer->planes[j]; |
| const AVDRMObjectDescriptor *object = |
| &desc->objects[plane->object_index]; |
| |
| cl_import_image_info_intel image_info = { |
| .fd = object->fd, |
| .size = object->size, |
| .type = CL_MEM_OBJECT_IMAGE2D, |
| .offset = plane->offset, |
| .row_pitch = plane->pitch, |
| }; |
| cl_image_desc image_desc; |
| |
| err = opencl_get_plane_format(dst_fc->sw_format, p, |
| src->width, src->height, |
| &image_info.fmt, |
| &image_desc); |
| if (err < 0) { |
| av_log(dst_fc, AV_LOG_ERROR, "DRM frame layer %d " |
| "plane %d is not representable in OpenCL: %d.\n", |
| i, j, err); |
| goto fail; |
| } |
| image_info.width = image_desc.image_width; |
| image_info.height = image_desc.image_height; |
| |
| mapping->frame.planes[p] = |
| priv->clCreateImageFromFdINTEL(hwctx->context, |
| &image_info, &cle); |
| if (!mapping->frame.planes[p]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL image " |
| "from layer %d plane %d of DRM frame: %d.\n", |
| i, j, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| dst->data[p] = (uint8_t*)mapping->frame.planes[p]; |
| mapping->frame.nb_planes = ++p; |
| } |
| } |
| |
| err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
| &opencl_unmap_from_drm_beignet, |
| mapping); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| for (p = 0; p < mapping->frame.nb_planes; p++) { |
| if (mapping->frame.planes[p]) |
| clReleaseMemObject(mapping->frame.planes[p]); |
| } |
| av_free(mapping); |
| return err; |
| } |
| |
| #if HAVE_OPENCL_VAAPI_BEIGNET |
| |
| static int opencl_map_from_vaapi(AVHWFramesContext *dst_fc, |
| AVFrame *dst, const AVFrame *src, |
| int flags) |
| { |
| AVFrame *tmp; |
| int err; |
| |
| tmp = av_frame_alloc(); |
| if (!tmp) |
| return AVERROR(ENOMEM); |
| |
| tmp->format = AV_PIX_FMT_DRM_PRIME; |
| |
| err = av_hwframe_map(tmp, src, flags); |
| if (err < 0) |
| goto fail; |
| |
| err = opencl_map_from_drm_beignet(dst_fc, dst, tmp, flags); |
| if (err < 0) |
| goto fail; |
| |
| err = ff_hwframe_map_replace(dst, src); |
| |
| fail: |
| av_frame_free(&tmp); |
| return err; |
| } |
| |
| #endif /* HAVE_OPENCL_VAAPI_BEIGNET */ |
| #endif /* HAVE_OPENCL_DRM_BEIGNET */ |
| |
| static inline cl_mem_flags opencl_mem_flags_for_mapping(int map_flags) |
| { |
| if ((map_flags & AV_HWFRAME_MAP_READ) && |
| (map_flags & AV_HWFRAME_MAP_WRITE)) |
| return CL_MEM_READ_WRITE; |
| else if (map_flags & AV_HWFRAME_MAP_READ) |
| return CL_MEM_READ_ONLY; |
| else if (map_flags & AV_HWFRAME_MAP_WRITE) |
| return CL_MEM_WRITE_ONLY; |
| else |
| return 0; |
| } |
| |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| |
| static void opencl_unmap_from_qsv(AVHWFramesContext *dst_fc, |
| HWMapDescriptor *hwmap) |
| { |
| AVOpenCLFrameDescriptor *desc = hwmap->priv; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| cl_event event; |
| cl_int cle; |
| int p; |
| |
| av_log(dst_fc, AV_LOG_DEBUG, "Unmap QSV/VAAPI surface from OpenCL.\n"); |
| |
| cle = device_priv->clEnqueueReleaseVA_APIMediaSurfacesINTEL( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
| "handles: %d.\n", cle); |
| } |
| |
| opencl_wait_events(dst_fc, &event, 1); |
| |
| for (p = 0; p < desc->nb_planes; p++) { |
| cle = clReleaseMemObject(desc->planes[p]); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to release CL " |
| "image of plane %d of QSV/VAAPI surface: %d\n", |
| p, cle); |
| } |
| } |
| |
| av_free(desc); |
| } |
| |
| static int opencl_map_from_qsv(AVHWFramesContext *dst_fc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| AVHWFramesContext *src_fc = |
| (AVHWFramesContext*)src->hw_frames_ctx->data; |
| AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| AVOpenCLFrameDescriptor *desc; |
| VASurfaceID va_surface; |
| cl_mem_flags cl_flags; |
| cl_event event; |
| cl_int cle; |
| int err, p; |
| |
| #if CONFIG_LIBMFX |
| if (src->format == AV_PIX_FMT_QSV) { |
| mfxFrameSurface1 *mfx_surface = (mfxFrameSurface1*)src->data[3]; |
| va_surface = *(VASurfaceID*)mfx_surface->Data.MemId; |
| } else |
| #endif |
| if (src->format == AV_PIX_FMT_VAAPI) { |
| va_surface = (VASurfaceID)(uintptr_t)src->data[3]; |
| } else { |
| return AVERROR(ENOSYS); |
| } |
| |
| cl_flags = opencl_mem_flags_for_mapping(flags); |
| if (!cl_flags) |
| return AVERROR(EINVAL); |
| |
| av_log(src_fc, AV_LOG_DEBUG, "Map QSV/VAAPI surface %#x to " |
| "OpenCL.\n", va_surface); |
| |
| desc = av_mallocz(sizeof(*desc)); |
| if (!desc) |
| return AVERROR(ENOMEM); |
| |
| // The cl_intel_va_api_media_sharing extension only supports NV12 |
| // surfaces, so for now there are always exactly two planes. |
| desc->nb_planes = 2; |
| |
| for (p = 0; p < desc->nb_planes; p++) { |
| desc->planes[p] = |
| device_priv->clCreateFromVA_APIMediaSurfaceINTEL( |
| dst_dev->context, cl_flags, &va_surface, p, &cle); |
| if (!desc->planes[p]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
| "image from plane %d of QSV/VAAPI surface " |
| "%#x: %d.\n", p, va_surface, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| dst->data[p] = (uint8_t*)desc->planes[p]; |
| } |
| |
| cle = device_priv->clEnqueueAcquireVA_APIMediaSurfacesINTEL( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
| "handles: %d.\n", cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| err = opencl_wait_events(dst_fc, &event, 1); |
| if (err < 0) |
| goto fail; |
| |
| err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
| &opencl_unmap_from_qsv, desc); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| for (p = 0; p < desc->nb_planes; p++) |
| if (desc->planes[p]) |
| clReleaseMemObject(desc->planes[p]); |
| av_freep(&desc); |
| return err; |
| } |
| |
| #endif |
| |
| #if HAVE_OPENCL_DXVA2 |
| |
| static void opencl_unmap_from_dxva2(AVHWFramesContext *dst_fc, |
| HWMapDescriptor *hwmap) |
| { |
| AVOpenCLFrameDescriptor *desc = hwmap->priv; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->device_ctx->internal->priv; |
| cl_event event; |
| cl_int cle; |
| |
| av_log(dst_fc, AV_LOG_DEBUG, "Unmap DXVA2 surface from OpenCL.\n"); |
| |
| cle = device_priv->clEnqueueReleaseDX9MediaSurfacesKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
| "handle: %d.\n", cle); |
| return; |
| } |
| |
| opencl_wait_events(dst_fc, &event, 1); |
| } |
| |
| static int opencl_map_from_dxva2(AVHWFramesContext *dst_fc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| AVHWFramesContext *src_fc = |
| (AVHWFramesContext*)src->hw_frames_ctx->data; |
| AVDXVA2FramesContext *src_hwctx = src_fc->hwctx; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| AVOpenCLFrameDescriptor *desc; |
| cl_event event; |
| cl_int cle; |
| int err, i; |
| |
| av_log(dst_fc, AV_LOG_DEBUG, "Map DXVA2 surface %p to " |
| "OpenCL.\n", src->data[3]); |
| |
| for (i = 0; i < src_hwctx->nb_surfaces; i++) { |
| if (src_hwctx->surfaces[i] == (IDirect3DSurface9*)src->data[3]) |
| break; |
| } |
| if (i >= src_hwctx->nb_surfaces) { |
| av_log(dst_fc, AV_LOG_ERROR, "Trying to map from a surface which " |
| "is not in the mapped frames context.\n"); |
| return AVERROR(EINVAL); |
| } |
| |
| desc = &frames_priv->mapped_frames[i]; |
| |
| cle = device_priv->clEnqueueAcquireDX9MediaSurfacesKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
| "handle: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| |
| err = opencl_wait_events(dst_fc, &event, 1); |
| if (err < 0) |
| goto fail; |
| |
| for (i = 0; i < desc->nb_planes; i++) |
| dst->data[i] = (uint8_t*)desc->planes[i]; |
| |
| err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
| &opencl_unmap_from_dxva2, desc); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| cle = device_priv->clEnqueueReleaseDX9MediaSurfacesKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle == CL_SUCCESS) |
| opencl_wait_events(dst_fc, &event, 1); |
| return err; |
| } |
| |
| static int opencl_frames_derive_from_dxva2(AVHWFramesContext *dst_fc, |
| AVHWFramesContext *src_fc, int flags) |
| { |
| AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
| AVDXVA2FramesContext *src_hwctx = src_fc->hwctx; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| cl_mem_flags cl_flags; |
| cl_int cle; |
| int err, i, p, nb_planes; |
| |
| if (src_fc->sw_format != AV_PIX_FMT_NV12) { |
| av_log(dst_fc, AV_LOG_ERROR, "Only NV12 textures are supported " |
| "for DXVA2 to OpenCL mapping.\n"); |
| return AVERROR(EINVAL); |
| } |
| nb_planes = 2; |
| |
| if (src_fc->initial_pool_size == 0) { |
| av_log(dst_fc, AV_LOG_ERROR, "Only fixed-size pools are supported " |
| "for DXVA2 to OpenCL mapping.\n"); |
| return AVERROR(EINVAL); |
| } |
| |
| cl_flags = opencl_mem_flags_for_mapping(flags); |
| if (!cl_flags) |
| return AVERROR(EINVAL); |
| |
| frames_priv->nb_mapped_frames = src_hwctx->nb_surfaces; |
| |
| frames_priv->mapped_frames = |
| av_mallocz_array(frames_priv->nb_mapped_frames, |
| sizeof(*frames_priv->mapped_frames)); |
| if (!frames_priv->mapped_frames) |
| return AVERROR(ENOMEM); |
| |
| for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
| AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
| cl_dx9_surface_info_khr surface_info = { |
| .resource = src_hwctx->surfaces[i], |
| .shared_handle = NULL, |
| }; |
| desc->nb_planes = nb_planes; |
| for (p = 0; p < nb_planes; p++) { |
| desc->planes[p] = |
| device_priv->clCreateFromDX9MediaSurfaceKHR( |
| dst_dev->context, cl_flags, |
| device_priv->dx9_media_adapter_type, |
| &surface_info, p, &cle); |
| if (!desc->planes[p]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
| "image from plane %d of DXVA2 surface %d: %d.\n", |
| p, i, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| } |
| } |
| |
| return 0; |
| |
| fail: |
| for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
| AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
| for (p = 0; p < desc->nb_planes; p++) { |
| if (desc->planes[p]) |
| clReleaseMemObject(desc->planes[p]); |
| } |
| } |
| av_freep(&frames_priv->mapped_frames); |
| frames_priv->nb_mapped_frames = 0; |
| return err; |
| } |
| |
| #endif |
| |
| #if HAVE_OPENCL_D3D11 |
| |
| static void opencl_unmap_from_d3d11(AVHWFramesContext *dst_fc, |
| HWMapDescriptor *hwmap) |
| { |
| AVOpenCLFrameDescriptor *desc = hwmap->priv; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->device_ctx->internal->priv; |
| cl_event event; |
| cl_int cle; |
| |
| cle = device_priv->clEnqueueReleaseD3D11ObjectsKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to release surface " |
| "handle: %d.\n", cle); |
| } |
| |
| opencl_wait_events(dst_fc, &event, 1); |
| } |
| |
| static int opencl_map_from_d3d11(AVHWFramesContext *dst_fc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| AVOpenCLFrameDescriptor *desc; |
| cl_event event; |
| cl_int cle; |
| int err, index, i; |
| |
| index = (intptr_t)src->data[1]; |
| if (index >= frames_priv->nb_mapped_frames) { |
| av_log(dst_fc, AV_LOG_ERROR, "Texture array index out of range for " |
| "mapping: %d >= %d.\n", index, frames_priv->nb_mapped_frames); |
| return AVERROR(EINVAL); |
| } |
| |
| av_log(dst_fc, AV_LOG_DEBUG, "Map D3D11 texture %d to OpenCL.\n", |
| index); |
| |
| desc = &frames_priv->mapped_frames[index]; |
| |
| cle = device_priv->clEnqueueAcquireD3D11ObjectsKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle != CL_SUCCESS) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to acquire surface " |
| "handle: %d.\n", cle); |
| return AVERROR(EIO); |
| } |
| |
| err = opencl_wait_events(dst_fc, &event, 1); |
| if (err < 0) |
| goto fail; |
| |
| for (i = 0; i < desc->nb_planes; i++) |
| dst->data[i] = (uint8_t*)desc->planes[i]; |
| |
| err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
| &opencl_unmap_from_d3d11, desc); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| cle = device_priv->clEnqueueReleaseD3D11ObjectsKHR( |
| frames_priv->command_queue, desc->nb_planes, desc->planes, |
| 0, NULL, &event); |
| if (cle == CL_SUCCESS) |
| opencl_wait_events(dst_fc, &event, 1); |
| return err; |
| } |
| |
| static int opencl_frames_derive_from_d3d11(AVHWFramesContext *dst_fc, |
| AVHWFramesContext *src_fc, int flags) |
| { |
| AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
| AVD3D11VAFramesContext *src_hwctx = src_fc->hwctx; |
| OpenCLDeviceContext *device_priv = dst_fc->device_ctx->internal->priv; |
| OpenCLFramesContext *frames_priv = dst_fc->internal->priv; |
| cl_mem_flags cl_flags; |
| cl_int cle; |
| int err, i, p, nb_planes; |
| |
| if (src_fc->sw_format != AV_PIX_FMT_NV12) { |
| av_log(dst_fc, AV_LOG_ERROR, "Only NV12 textures are supported " |
| "for D3D11 to OpenCL mapping.\n"); |
| return AVERROR(EINVAL); |
| } |
| nb_planes = 2; |
| |
| if (src_fc->initial_pool_size == 0) { |
| av_log(dst_fc, AV_LOG_ERROR, "Only fixed-size pools are supported " |
| "for D3D11 to OpenCL mapping.\n"); |
| return AVERROR(EINVAL); |
| } |
| |
| cl_flags = opencl_mem_flags_for_mapping(flags); |
| if (!cl_flags) |
| return AVERROR(EINVAL); |
| |
| frames_priv->nb_mapped_frames = src_fc->initial_pool_size; |
| |
| frames_priv->mapped_frames = |
| av_mallocz_array(frames_priv->nb_mapped_frames, |
| sizeof(*frames_priv->mapped_frames)); |
| if (!frames_priv->mapped_frames) |
| return AVERROR(ENOMEM); |
| |
| for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
| AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
| desc->nb_planes = nb_planes; |
| for (p = 0; p < nb_planes; p++) { |
| UINT subresource = 2 * i + p; |
| |
| desc->planes[p] = |
| device_priv->clCreateFromD3D11Texture2DKHR( |
| dst_dev->context, cl_flags, src_hwctx->texture, |
| subresource, &cle); |
| if (!desc->planes[p]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL " |
| "image from plane %d of D3D texture " |
| "index %d (subresource %u): %d.\n", |
| p, i, (unsigned int)subresource, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| } |
| } |
| |
| return 0; |
| |
| fail: |
| for (i = 0; i < frames_priv->nb_mapped_frames; i++) { |
| AVOpenCLFrameDescriptor *desc = &frames_priv->mapped_frames[i]; |
| for (p = 0; p < desc->nb_planes; p++) { |
| if (desc->planes[p]) |
| clReleaseMemObject(desc->planes[p]); |
| } |
| } |
| av_freep(&frames_priv->mapped_frames); |
| frames_priv->nb_mapped_frames = 0; |
| return err; |
| } |
| |
| #endif |
| |
| #if HAVE_OPENCL_DRM_ARM |
| |
| typedef struct DRMARMtoOpenCLMapping { |
| int nb_objects; |
| cl_mem object_buffers[AV_DRM_MAX_PLANES]; |
| int nb_planes; |
| cl_mem plane_images[AV_DRM_MAX_PLANES]; |
| } DRMARMtoOpenCLMapping; |
| |
| static void opencl_unmap_from_drm_arm(AVHWFramesContext *dst_fc, |
| HWMapDescriptor *hwmap) |
| { |
| DRMARMtoOpenCLMapping *mapping = hwmap->priv; |
| int i; |
| |
| for (i = 0; i < mapping->nb_planes; i++) |
| clReleaseMemObject(mapping->plane_images[i]); |
| |
| for (i = 0; i < mapping->nb_objects; i++) |
| clReleaseMemObject(mapping->object_buffers[i]); |
| |
| av_free(mapping); |
| } |
| |
| static int opencl_map_from_drm_arm(AVHWFramesContext *dst_fc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| AVHWFramesContext *src_fc = |
| (AVHWFramesContext*)src->hw_frames_ctx->data; |
| AVOpenCLDeviceContext *dst_dev = dst_fc->device_ctx->hwctx; |
| const AVDRMFrameDescriptor *desc; |
| DRMARMtoOpenCLMapping *mapping = NULL; |
| cl_mem_flags cl_flags; |
| const cl_import_properties_arm props[3] = { |
| CL_IMPORT_TYPE_ARM, CL_IMPORT_TYPE_DMA_BUF_ARM, 0, |
| }; |
| cl_int cle; |
| int err, i, j; |
| |
| desc = (const AVDRMFrameDescriptor*)src->data[0]; |
| |
| cl_flags = opencl_mem_flags_for_mapping(flags); |
| if (!cl_flags) |
| return AVERROR(EINVAL); |
| |
| mapping = av_mallocz(sizeof(*mapping)); |
| if (!mapping) |
| return AVERROR(ENOMEM); |
| |
| mapping->nb_objects = desc->nb_objects; |
| for (i = 0; i < desc->nb_objects; i++) { |
| int fd = desc->objects[i].fd; |
| |
| av_log(dst_fc, AV_LOG_DEBUG, "Map DRM PRIME fd %d to OpenCL.\n", fd); |
| |
| if (desc->objects[i].format_modifier) { |
| av_log(dst_fc, AV_LOG_DEBUG, "Warning: object %d fd %d has " |
| "nonzero format modifier %"PRId64", result may not " |
| "be as expected.\n", i, fd, |
| desc->objects[i].format_modifier); |
| } |
| |
| mapping->object_buffers[i] = |
| clImportMemoryARM(dst_dev->context, cl_flags, props, |
| &fd, desc->objects[i].size, &cle); |
| if (!mapping->object_buffers[i]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create CL buffer " |
| "from object %d (fd %d, size %"SIZE_SPECIFIER") of DRM frame: %d.\n", |
| i, fd, desc->objects[i].size, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| } |
| |
| mapping->nb_planes = 0; |
| for (i = 0; i < desc->nb_layers; i++) { |
| const AVDRMLayerDescriptor *layer = &desc->layers[i]; |
| |
| for (j = 0; j < layer->nb_planes; j++) { |
| const AVDRMPlaneDescriptor *plane = &layer->planes[j]; |
| cl_mem plane_buffer; |
| cl_image_format image_format; |
| cl_image_desc image_desc; |
| cl_buffer_region region; |
| int p = mapping->nb_planes; |
| |
| err = opencl_get_plane_format(src_fc->sw_format, p, |
| src_fc->width, src_fc->height, |
| &image_format, &image_desc); |
| if (err < 0) { |
| av_log(dst_fc, AV_LOG_ERROR, "Invalid plane %d (DRM " |
| "layer %d plane %d): %d.\n", p, i, j, err); |
| goto fail; |
| } |
| |
| region.origin = plane->offset; |
| region.size = image_desc.image_row_pitch * |
| image_desc.image_height; |
| |
| plane_buffer = |
| clCreateSubBuffer(mapping->object_buffers[plane->object_index], |
| cl_flags, |
| CL_BUFFER_CREATE_TYPE_REGION, |
| ®ion, &cle); |
| if (!plane_buffer) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create sub-buffer " |
| "for plane %d: %d.\n", p, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| image_desc.buffer = plane_buffer; |
| |
| mapping->plane_images[p] = |
| clCreateImage(dst_dev->context, cl_flags, |
| &image_format, &image_desc, NULL, &cle); |
| |
| // Unreference the sub-buffer immediately - we don't need it |
| // directly and a reference is held by the image. |
| clReleaseMemObject(plane_buffer); |
| |
| if (!mapping->plane_images[p]) { |
| av_log(dst_fc, AV_LOG_ERROR, "Failed to create image " |
| "for plane %d: %d.\n", p, cle); |
| err = AVERROR(EIO); |
| goto fail; |
| } |
| |
| ++mapping->nb_planes; |
| } |
| } |
| |
| for (i = 0; i < mapping->nb_planes; i++) |
| dst->data[i] = (uint8_t*)mapping->plane_images[i]; |
| |
| err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src, |
| &opencl_unmap_from_drm_arm, mapping); |
| if (err < 0) |
| goto fail; |
| |
| dst->width = src->width; |
| dst->height = src->height; |
| |
| return 0; |
| |
| fail: |
| for (i = 0; i < mapping->nb_planes; i++) { |
| clReleaseMemObject(mapping->plane_images[i]); |
| } |
| for (i = 0; i < mapping->nb_objects; i++) { |
| if (mapping->object_buffers[i]) |
| clReleaseMemObject(mapping->object_buffers[i]); |
| } |
| av_free(mapping); |
| return err; |
| } |
| |
| #endif |
| |
| static int opencl_map_from(AVHWFramesContext *hwfc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| av_assert0(src->format == AV_PIX_FMT_OPENCL); |
| if (hwfc->sw_format != dst->format) |
| return AVERROR(ENOSYS); |
| return opencl_map_frame(hwfc, dst, src, flags); |
| } |
| |
| static int opencl_map_to(AVHWFramesContext *hwfc, AVFrame *dst, |
| const AVFrame *src, int flags) |
| { |
| av_unused OpenCLDeviceContext *priv = hwfc->device_ctx->internal->priv; |
| av_assert0(dst->format == AV_PIX_FMT_OPENCL); |
| switch (src->format) { |
| #if HAVE_OPENCL_DRM_BEIGNET |
| case AV_PIX_FMT_DRM_PRIME: |
| if (priv->beignet_drm_mapping_usable) |
| return opencl_map_from_drm_beignet(hwfc, dst, src, flags); |
| #endif |
| #if HAVE_OPENCL_VAAPI_BEIGNET |
| case AV_PIX_FMT_VAAPI: |
| if (priv->beignet_drm_mapping_usable) |
| return opencl_map_from_vaapi(hwfc, dst, src, flags); |
| #endif |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| case AV_PIX_FMT_QSV: |
| case AV_PIX_FMT_VAAPI: |
| if (priv->qsv_mapping_usable) |
| return opencl_map_from_qsv(hwfc, dst, src, flags); |
| #endif |
| #if HAVE_OPENCL_DXVA2 |
| case AV_PIX_FMT_DXVA2_VLD: |
| if (priv->dxva2_mapping_usable) |
| return opencl_map_from_dxva2(hwfc, dst, src, flags); |
| #endif |
| #if HAVE_OPENCL_D3D11 |
| case AV_PIX_FMT_D3D11: |
| if (priv->d3d11_mapping_usable) |
| return opencl_map_from_d3d11(hwfc, dst, src, flags); |
| #endif |
| #if HAVE_OPENCL_DRM_ARM |
| case AV_PIX_FMT_DRM_PRIME: |
| if (priv->drm_arm_mapping_usable) |
| return opencl_map_from_drm_arm(hwfc, dst, src, flags); |
| #endif |
| } |
| return AVERROR(ENOSYS); |
| } |
| |
| static int opencl_frames_derive_to(AVHWFramesContext *dst_fc, |
| AVHWFramesContext *src_fc, int flags) |
| { |
| av_unused OpenCLDeviceContext *priv = dst_fc->device_ctx->internal->priv; |
| switch (src_fc->device_ctx->type) { |
| #if HAVE_OPENCL_DRM_BEIGNET |
| case AV_HWDEVICE_TYPE_DRM: |
| if (!priv->beignet_drm_mapping_usable) |
| return AVERROR(ENOSYS); |
| break; |
| #endif |
| #if HAVE_OPENCL_VAAPI_BEIGNET |
| case AV_HWDEVICE_TYPE_VAAPI: |
| if (!priv->beignet_drm_mapping_usable) |
| return AVERROR(ENOSYS); |
| break; |
| #endif |
| #if HAVE_OPENCL_VAAPI_INTEL_MEDIA |
| case AV_HWDEVICE_TYPE_QSV: |
| case AV_HWDEVICE_TYPE_VAAPI: |
| if (!priv->qsv_mapping_usable) |
| return AVERROR(ENOSYS); |
| break; |
| #endif |
| #if HAVE_OPENCL_DXVA2 |
| case AV_HWDEVICE_TYPE_DXVA2: |
| if (!priv->dxva2_mapping_usable) |
| return AVERROR(ENOSYS); |
| { |
| int err; |
| err = opencl_frames_derive_from_dxva2(dst_fc, src_fc, flags); |
| if (err < 0) |
| return err; |
| } |
| break; |
| #endif |
| #if HAVE_OPENCL_D3D11 |
| case AV_HWDEVICE_TYPE_D3D11VA: |
| if (!priv->d3d11_mapping_usable) |
| return AVERROR(ENOSYS); |
| { |
| int err; |
| err = opencl_frames_derive_from_d3d11(dst_fc, src_fc, flags); |
| if (err < 0) |
| return err; |
| } |
| break; |
| #endif |
| #if HAVE_OPENCL_DRM_ARM |
| case AV_HWDEVICE_TYPE_DRM: |
| if (!priv->drm_arm_mapping_usable) |
| return AVERROR(ENOSYS); |
| break; |
| #endif |
| default: |
| return AVERROR(ENOSYS); |
| } |
| return opencl_frames_init_command_queue(dst_fc); |
| } |
| |
| const HWContextType ff_hwcontext_type_opencl = { |
| .type = AV_HWDEVICE_TYPE_OPENCL, |
| .name = "OpenCL", |
| |
| .device_hwctx_size = sizeof(AVOpenCLDeviceContext), |
| .device_priv_size = sizeof(OpenCLDeviceContext), |
| .frames_hwctx_size = sizeof(AVOpenCLFramesContext), |
| .frames_priv_size = sizeof(OpenCLFramesContext), |
| |
| .device_create = &opencl_device_create, |
| .device_derive = &opencl_device_derive, |
| .device_init = &opencl_device_init, |
| .device_uninit = &opencl_device_uninit, |
| |
| .frames_get_constraints = &opencl_frames_get_constraints, |
| .frames_init = &opencl_frames_init, |
| .frames_uninit = &opencl_frames_uninit, |
| .frames_get_buffer = &opencl_get_buffer, |
| |
| .transfer_get_formats = &opencl_transfer_get_formats, |
| .transfer_data_to = &opencl_transfer_data_to, |
| .transfer_data_from = &opencl_transfer_data_from, |
| |
| .map_from = &opencl_map_from, |
| .map_to = &opencl_map_to, |
| |