/*
 * Copyright (C) 2007 Intel Corporation
 * Copyright (C) 2016 Florent Revest
 * Copyright (C) 2018 Paul Kocialkowski
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

#include "picture.h"
#include "buffer.h"
#include "config.h"
#include "context.h"
#include "request.h"
#include "surface.h"

#include "h264.h"
#include "h265.h"
#include "mpeg2.h"

/*
 * NOTE(review): the names of the system headers below were missing from
 * the reviewed copy of this file (seven bare #include directives). They
 * have been reconstructed; confirm against the repository before merging.
 * <stdio.h> and <sys/time.h> are listed because this file calls snprintf()
 * and gettimeofday().
 */
#include <assert.h>
#include <stdio.h>
#include <string.h>

#include <errno.h>
#include <fcntl.h>
#include <sys/ioctl.h>
#include <sys/mman.h>
#include <sys/time.h>

#include <linux/videodev2.h>

#include "media.h"
#include "utils.h"
#include "v4l2.h"

#include "autoconfig.h"

/*
 * Copy a fixed-size parameter structure out of a VA buffer.
 *
 * The buffer is considered to hold size * count bytes (the same length the
 * slice-data path uses). Buffers shorter than the destination are rejected
 * instead of being read past their end.
 *
 * Returns VA_STATUS_SUCCESS, or VA_STATUS_ERROR_INVALID_BUFFER when the
 * buffer is too short.
 */
static VAStatus codec_copy_params(void *destination, size_t destination_size,
				  const struct object_buffer *buffer_object)
{
	size_t available = (size_t)buffer_object->size * buffer_object->count;

	if (available < destination_size)
		return VA_STATUS_ERROR_INVALID_BUFFER;

	memcpy(destination, buffer_object->data, destination_size);

	return VA_STATUS_SUCCESS;
}

/*
 * Store the contents of one VA buffer on the surface being rendered.
 *
 * - Slice data is appended to the surface's source buffer (optionally
 *   preceded by a 3-byte start code when context->h264_start_code is set)
 *   and slices_size / slices_count are advanced.
 * - Picture, slice and IQ-matrix parameter buffers are copied into the
 *   per-codec member of surface_object->params selected by profile.
 * - Buffer types and profiles that are not handled are ignored.
 *
 * Returns VA_STATUS_SUCCESS on success (including ignored buffers),
 * VA_STATUS_ERROR_OPERATION_FAILED when the slice data does not fit in the
 * source buffer, and VA_STATUS_ERROR_INVALID_BUFFER when a parameter buffer
 * is shorter than the structure it should contain.
 */
static VAStatus codec_store_buffer(struct request_data *driver_data,
				   struct object_context *context,
				   VAProfile profile,
				   struct object_surface *surface_object,
				   struct object_buffer *buffer_object)
{
	static const char start_code[3] = { 0x00, 0x00, 0x01 };
	VAStatus status = VA_STATUS_SUCCESS;

	switch (buffer_object->type) {
	case VASliceDataBufferType: {
		/*
		 * Since there is no guarantee that the allocation
		 * order is the same as the submission order (via
		 * RenderPicture), we can't use a V4L2 buffer directly
		 * and have to copy from a regular buffer.
		 */
		size_t payload_size =
			(size_t)buffer_object->size * buffer_object->count;
		size_t prefix_size =
			context->h264_start_code ? sizeof(start_code) : 0;
		size_t used = surface_object->slices_size;
		size_t capacity = surface_object->source_size;
		unsigned char *cursor;

		if (surface_object->source_data == NULL || used > capacity)
			return VA_STATUS_ERROR_OPERATION_FAILED;

		/*
		 * Refuse to write past the end of the source buffer. The
		 * checks are ordered so that no subtraction can wrap.
		 */
		if (prefix_size > capacity - used ||
		    payload_size > capacity - used - prefix_size)
			return VA_STATUS_ERROR_OPERATION_FAILED;

		cursor = (unsigned char *)surface_object->source_data + used;

		if (prefix_size > 0) {
			memcpy(cursor, start_code, prefix_size);
			cursor += prefix_size;
		}

		if (payload_size > 0)
			memcpy(cursor, buffer_object->data, payload_size);

		surface_object->slices_size += prefix_size + payload_size;
		surface_object->slices_count++;
		break;
	}

	case VAPictureParameterBufferType:
		switch (profile) {
		case VAProfileMPEG2Simple:
		case VAProfileMPEG2Main:
			status = codec_copy_params(
				&surface_object->params.mpeg2.picture,
				sizeof(surface_object->params.mpeg2.picture),
				buffer_object);
			break;

		case VAProfileH264Main:
		case VAProfileH264High:
		case VAProfileH264ConstrainedBaseline:
		case VAProfileH264MultiviewHigh:
		case VAProfileH264StereoHigh:
			status = codec_copy_params(
				&surface_object->params.h264.picture,
				sizeof(surface_object->params.h264.picture),
				buffer_object);
			break;

		case VAProfileHEVCMain:
			status = codec_copy_params(
				&surface_object->params.h265.picture,
				sizeof(surface_object->params.h265.picture),
				buffer_object);
			break;

		default:
			break;
		}
		break;

	case VASliceParameterBufferType:
		switch (profile) {
		case VAProfileH264Main:
		case VAProfileH264High:
		case VAProfileH264ConstrainedBaseline:
		case VAProfileH264MultiviewHigh:
		case VAProfileH264StereoHigh:
			status = codec_copy_params(
				&surface_object->params.h264.slice,
				sizeof(surface_object->params.h264.slice),
				buffer_object);
			break;

		case VAProfileHEVCMain:
			status = codec_copy_params(
				&surface_object->params.h265.slice,
				sizeof(surface_object->params.h265.slice),
				buffer_object);
			break;

		default:
			break;
		}
		break;

	case VAIQMatrixBufferType:
		/* The *_set flags are only raised once the copy succeeded. */
		switch (profile) {
		case VAProfileMPEG2Simple:
		case VAProfileMPEG2Main:
			status = codec_copy_params(
				&surface_object->params.mpeg2.iqmatrix,
				sizeof(surface_object->params.mpeg2.iqmatrix),
				buffer_object);
			if (status == VA_STATUS_SUCCESS)
				surface_object->params.mpeg2.iqmatrix_set = true;
			break;

		case VAProfileH264Main:
		case VAProfileH264High:
		case VAProfileH264ConstrainedBaseline:
		case VAProfileH264MultiviewHigh:
		case VAProfileH264StereoHigh:
			status = codec_copy_params(
				&surface_object->params.h264.matrix,
				sizeof(surface_object->params.h264.matrix),
				buffer_object);
			if (status == VA_STATUS_SUCCESS)
				surface_object->params.h264.matrix_set = true;
			break;

		case VAProfileHEVCMain:
			status = codec_copy_params(
				&surface_object->params.h265.iqmatrix,
				sizeof(surface_object->params.h265.iqmatrix),
				buffer_object);
			if (status == VA_STATUS_SUCCESS)
				surface_object->params.h265.iqmatrix_set = true;
			break;

		default:
			break;
		}
		break;

	default:
		break;
	}

	return status;
}

/*
 * Hand the parameters stored on the surface to the codec-specific
 * *_set_controls() helper selected by profile.
 *
 * Returns VA_STATUS_SUCCESS when the helper returns a non-negative value,
 * VA_STATUS_ERROR_OPERATION_FAILED when it returns a negative value, and
 * VA_STATUS_ERROR_UNSUPPORTED_PROFILE for HEVC and any other profile.
 */
static VAStatus codec_set_controls(struct request_data *driver_data,
				   struct object_context *context,
				   VAProfile profile,
				   struct object_surface *surface_object)
{
	int rc;

	switch (profile) {
	case VAProfileMPEG2Simple:
	case VAProfileMPEG2Main:
		rc = mpeg2_set_controls(driver_data, context, surface_object);
		break;

	case VAProfileH264Main:
	case VAProfileH264High:
	case VAProfileH264ConstrainedBaseline:
	case VAProfileH264MultiviewHigh:
	case VAProfileH264StereoHigh:
		rc = h264_set_controls(driver_data, context, profile,
				       surface_object);
		break;

	case VAProfileHEVCMain:
		/* Fourier-local: HEVC stripped, no HW support on RK3566. */
		return VA_STATUS_ERROR_UNSUPPORTED_PROFILE;

	default:
		return VA_STATUS_ERROR_UNSUPPORTED_PROFILE;
	}

	return rc < 0 ? VA_STATUS_ERROR_OPERATION_FAILED : VA_STATUS_SUCCESS;
}

/*
 * Start rendering a picture into surface_id on behalf of context_id.
 *
 * Acquires a slot from driver_data->output_pool, points the surface's
 * source_* fields at it, resets the slice accounting and records the
 * surface as the context's current render target.
 *
 * Returns VA_STATUS_ERROR_INVALID_CONTEXT / VA_STATUS_ERROR_INVALID_SURFACE
 * when the IDs do not resolve, VA_STATUS_ERROR_ALLOCATION_FAILED when no
 * slot could be obtained, and VA_STATUS_SUCCESS otherwise.
 */
VAStatus RequestBeginPicture(VADriverContextP context, VAContextID context_id,
			     VASurfaceID surface_id)
{
	struct request_data *driver_data = context->pDriverData;
	struct object_context *context_object;
	struct object_surface *surface_object;
	struct request_pool_slot *slot;
	int slot_index;

	context_object = CONTEXT(driver_data, context_id);
	if (context_object == NULL)
		return VA_STATUS_ERROR_INVALID_CONTEXT;

	surface_object = SURFACE(driver_data, surface_id);
	if (surface_object == NULL)
		return VA_STATUS_ERROR_INVALID_SURFACE;

	/*
	 * NOTE(review): the result of this sync is ignored; if it can fail
	 * without releasing the previous slot, the assignments below would
	 * overwrite the only record of that slot. Confirm.
	 */
	if (surface_object->status == VASurfaceRendering)
		RequestSyncSurface(context, surface_id);

	/*
	 * Borrow an OUTPUT (bitstream-input) slot from the driver-wide
	 * pool for the duration of this Begin/Render/End cycle. The
	 * surface's source_* fields hold the borrow's mmap pointer/size/
	 * V4L2 buffer index until RequestSyncSurface releases it after
	 * VIDIOC_DQBUF.
	 */
	slot_index = request_pool_acquire(&driver_data->output_pool);
	if (slot_index < 0)
		return VA_STATUS_ERROR_ALLOCATION_FAILED;

	slot = request_pool_slot(&driver_data->output_pool,
				 (unsigned int)slot_index);
	if (slot == NULL) {
		/* Give the slot back rather than leaking it. */
		request_pool_release(&driver_data->output_pool,
				     (unsigned int)slot_index);
		return VA_STATUS_ERROR_ALLOCATION_FAILED;
	}

	surface_object->source_index = slot->index;
	surface_object->source_data = slot->data;
	surface_object->source_size = slot->size;

	surface_object->slices_size = 0;
	surface_object->slices_count = 0;
	surface_object->params.h264.matrix_set = false;

	surface_object->status = VASurfaceRendering;
	context_object->render_surface_id = surface_id;

	return VA_STATUS_SUCCESS;
}

/*
 * Store every buffer in buffers_ids on the context's current render
 * surface, in order, stopping at the first failure.
 *
 * Returns VA_STATUS_ERROR_INVALID_CONTEXT / _CONFIG / _SURFACE when the
 * corresponding object cannot be resolved, VA_STATUS_ERROR_INVALID_BUFFER
 * when buffers_ids is NULL (with a positive count) or an ID does not
 * resolve, the status of codec_store_buffer() when it fails, and
 * VA_STATUS_SUCCESS otherwise.
 */
VAStatus RequestRenderPicture(VADriverContextP context, VAContextID context_id,
			      VABufferID *buffers_ids, int buffers_count)
{
	struct request_data *driver_data = context->pDriverData;
	struct object_context *context_object;
	struct object_config *config_object;
	struct object_surface *surface_object;
	struct object_buffer *buffer_object;
	VAStatus status;
	int i;

	context_object = CONTEXT(driver_data, context_id);
	if (context_object == NULL)
		return VA_STATUS_ERROR_INVALID_CONTEXT;

	config_object = CONFIG(driver_data, context_object->config_id);
	if (config_object == NULL)
		return VA_STATUS_ERROR_INVALID_CONFIG;

	surface_object =
		SURFACE(driver_data, context_object->render_surface_id);
	if (surface_object == NULL)
		return VA_STATUS_ERROR_INVALID_SURFACE;

	/* Do not dereference a missing ID array. */
	if (buffers_count > 0 && buffers_ids == NULL)
		return VA_STATUS_ERROR_INVALID_BUFFER;

	for (i = 0; i < buffers_count; i++) {
		buffer_object = BUFFER(driver_data, buffers_ids[i]);
		if (buffer_object == NULL)
			return VA_STATUS_ERROR_INVALID_BUFFER;

		status = codec_store_buffer(driver_data, context_object,
					    config_object->profile,
					    surface_object, buffer_object);
		if (status != VA_STATUS_SUCCESS)
			return status;
	}

	return VA_STATUS_SUCCESS;
}

/*
 * Submit the picture accumulated on the context's render surface.
 *
 * Steps, in order: timestamp the surface, make sure it has a request fd
 * (allocating one from the media device when request_fd is negative), set
 * the codec controls, queue the CAPTURE buffer, queue the OUTPUT buffer
 * (passing the request fd and the timestamp), then call
 * RequestSyncSurface() and clear the context's render surface.
 *
 * Returns VA_STATUS_ERROR_OPERATION_FAILED when the video format is not
 * set, the request cannot be allocated or a buffer cannot be queued;
 * VA_STATUS_ERROR_INVALID_CONTEXT / _CONFIG / _SURFACE when an object does
 * not resolve; the status of codec_set_controls() or RequestSyncSurface()
 * when they fail; VA_STATUS_SUCCESS otherwise.
 *
 * NOTE(review): the early-return error paths below do not release the
 * OUTPUT pool slot taken in RequestBeginPicture, and a CAPTURE buffer that
 * was already queued stays queued if the OUTPUT queue fails. The pool slot
 * index is not stored on the surface, so this cannot be undone from here;
 * confirm how those paths are meant to be cleaned up.
 */
VAStatus RequestEndPicture(VADriverContextP context, VAContextID context_id)
{
	struct request_data *driver_data = context->pDriverData;
	struct object_context *context_object;
	struct object_config *config_object;
	struct object_surface *surface_object;
	struct video_format *video_format;
	unsigned int output_type, capture_type;
	int request_fd;
	VAStatus status;
	int rc;

	video_format = driver_data->video_format;
	if (video_format == NULL)
		return VA_STATUS_ERROR_OPERATION_FAILED;

	output_type = v4l2_type_video_output(video_format->v4l2_mplane);
	capture_type = v4l2_type_video_capture(video_format->v4l2_mplane);

	context_object = CONTEXT(driver_data, context_id);
	if (context_object == NULL)
		return VA_STATUS_ERROR_INVALID_CONTEXT;

	config_object = CONFIG(driver_data, context_object->config_id);
	if (config_object == NULL)
		return VA_STATUS_ERROR_INVALID_CONFIG;

	surface_object =
		SURFACE(driver_data, context_object->render_surface_id);
	if (surface_object == NULL)
		return VA_STATUS_ERROR_INVALID_SURFACE;

	gettimeofday(&surface_object->timestamp, NULL);

	/* Reuse the surface's request fd when it already has one. */
	request_fd = surface_object->request_fd;
	if (request_fd < 0) {
		request_fd = media_request_alloc(driver_data->media_fd);
		if (request_fd < 0)
			return VA_STATUS_ERROR_OPERATION_FAILED;

		surface_object->request_fd = request_fd;
	}

	status = codec_set_controls(driver_data, context_object,
				    config_object->profile, surface_object);
	if (status != VA_STATUS_SUCCESS)
		return status;

	/*
	 * DEBUG INSTRUMENTATION (0011): write a sentinel pattern into
	 * the CAPTURE buffer's first 32 bytes BEFORE QBUF. If after
	 * DQBUF the sentinel survives (per surface.c hex dump), the
	 * kernel never wrote to this buffer. If the sentinel is gone
	 * (replaced by zeros), the kernel did write but our CPU read
	 * sees stale-cached data — cache-coherency issue.
	 */
	{
		unsigned char *p =
			(unsigned char *)surface_object->destination_map[0];

		if (p != NULL) {
			unsigned int i;

			for (i = 0; i < 32; i++)
				p[i] = 0xab;
		}
	}

	rc = v4l2_queue_buffer(driver_data->video_fd, -1, capture_type, NULL,
			       surface_object->destination_index, 0,
			       surface_object->destination_buffers_count);
	if (rc < 0)
		return VA_STATUS_ERROR_OPERATION_FAILED;

	/*
	 * DEBUG INSTRUMENTATION (0010): hex-dump first 32 bytes of the
	 * OUTPUT buffer at the moment we hand it to the kernel. Helps
	 * pin down whether our bitstream prepend logic is correct.
	 * For a valid ANNEX_B IDR slice the dump should start
	 * 00 00 01 65 ... (00 00 01 = start code; 0x65 = nal_ref_idc=3,
	 * nal_unit_type=5 = IDR slice). Removed once Step 1 decode is
	 * verified working.
	 */
	{
		const unsigned char *p = surface_object->source_data;
		/* 3 characters (" xx") per byte, plus the terminator. */
		char hex[32 * 3 + 1] = { 0 };
		unsigned int i, n = surface_object->slices_size < 32 ?
					    surface_object->slices_size :
					    32;

		for (i = 0; i < n; i++)
			snprintf(hex + i * 3, 4, " %02x", p[i]);

		request_log("OUTPUT[idx=%u, len=%u]:%s\n",
			    surface_object->source_index,
			    surface_object->slices_size, hex);
	}

	rc = v4l2_queue_buffer(driver_data->video_fd, request_fd, output_type,
			       &surface_object->timestamp,
			       surface_object->source_index,
			       surface_object->slices_size, 1);
	if (rc < 0)
		return VA_STATUS_ERROR_OPERATION_FAILED;

	surface_object->slices_size = 0;

	status = RequestSyncSurface(context,
				    context_object->render_surface_id);
	if (status != VA_STATUS_SUCCESS)
		return status;

	context_object->render_surface_id = VA_INVALID_ID;

	return VA_STATUS_SUCCESS;
}