• R/O
  • HTTP
  • SSH
  • HTTPS

Commit

Tags
No Tags

Frequently used words (click to add to your profile)

javac++androidlinuxc#windowsobjective-ccocoa誰得qtpythonphprubygameguibathyscaphec計画中(planning stage)翻訳omegatframeworktwitterdomtestvb.netdirectxゲームエンジンbtronarduinopreviewer

hardware/intel/intel-driver


Commit MetaInfo

Revision185375bded4094ee534179b819ac4495c6ab37d2 (tree)
Time2015-03-24 13:06:02
AuthorGwenole Beauchesne <gb.devel@gmai...>
CommiterXiang, Haihao

Log Message

vpp: add support for "low-power" mode.

Add support for "low-power" mode expressed with VA_PROC_PIPELINE_FAST
flag set to VAProcPipelineParameterBuffer.pipeline_flags. The purpose
is to discard any complex operation that would consume too many HW
resources.

While doing so, also try to optimize for cases where we only want to
perform format conversion, scaling and basic bob-deinterlacing.

Signed-off-by: Gwenole Beauchesne <gwenole.beauchesne@intel.com>

Change Summary

Incremental Difference

--- a/src/i965_post_processing.c
+++ b/src/i965_post_processing.c
@@ -5445,6 +5445,241 @@ static const int proc_frame_to_pp_frame[3] = {
54455445 I965_SURFACE_FLAG_BOTTOME_FIELD_FIRST
54465446 };
54475447
5448+enum {
5449+ PP_OP_CHANGE_FORMAT = 1 << 0,
5450+ PP_OP_CHANGE_SIZE = 1 << 1,
5451+ PP_OP_DEINTERLACE = 1 << 2,
5452+ PP_OP_COMPLEX = 1 << 3,
5453+};
5454+
5455+static int
5456+pp_get_kernel_index(uint32_t src_fourcc, uint32_t dst_fourcc, uint32_t pp_ops,
5457+ uint32_t filter_flags)
5458+{
5459+ int pp_index = -1;
5460+
5461+ if (!dst_fourcc)
5462+ dst_fourcc = src_fourcc;
5463+
5464+ switch (src_fourcc) {
5465+ case VA_FOURCC_RGBX:
5466+ case VA_FOURCC_RGBA:
5467+ case VA_FOURCC_BGRX:
5468+ case VA_FOURCC_BGRA:
5469+ switch (dst_fourcc) {
5470+ case VA_FOURCC_NV12:
5471+ pp_index = PP_RGBX_LOAD_SAVE_NV12;
5472+ break;
5473+ }
5474+ break;
5475+ case VA_FOURCC_YUY2:
5476+ case VA_FOURCC_UYVY:
5477+ switch (dst_fourcc) {
5478+ case VA_FOURCC_NV12:
5479+ pp_index = PP_PA_LOAD_SAVE_NV12;
5480+ break;
5481+ case VA_FOURCC_I420:
5482+ case VA_FOURCC_YV12:
5483+ pp_index = PP_PA_LOAD_SAVE_PL3;
5484+ break;
5485+ case VA_FOURCC_YUY2:
5486+ case VA_FOURCC_UYVY:
5487+ pp_index = PP_PA_LOAD_SAVE_PA;
5488+ break;
5489+ }
5490+ break;
5491+ case VA_FOURCC_NV12:
5492+ switch (dst_fourcc) {
5493+ case VA_FOURCC_NV12:
5494+ if (pp_ops & PP_OP_CHANGE_SIZE)
5495+ pp_index = avs_is_needed(filter_flags) ?
5496+ PP_NV12_AVS : PP_NV12_SCALING;
5497+ else
5498+ pp_index = PP_NV12_LOAD_SAVE_N12;
5499+ break;
5500+ case VA_FOURCC_I420:
5501+ case VA_FOURCC_YV12:
5502+ case VA_FOURCC_IMC1:
5503+ case VA_FOURCC_IMC3:
5504+ pp_index = PP_NV12_LOAD_SAVE_PL3;
5505+ break;
5506+ case VA_FOURCC_YUY2:
5507+ case VA_FOURCC_UYVY:
5508+ pp_index = PP_NV12_LOAD_SAVE_PA;
5509+ break;
5510+ case VA_FOURCC_RGBX:
5511+ case VA_FOURCC_RGBA:
5512+ case VA_FOURCC_BGRX:
5513+ case VA_FOURCC_BGRA:
5514+ pp_index = PP_NV12_LOAD_SAVE_RGBX;
5515+ break;
5516+ }
5517+ break;
5518+ case VA_FOURCC_I420:
5519+ case VA_FOURCC_YV12:
5520+ case VA_FOURCC_IMC1:
5521+ case VA_FOURCC_IMC3:
5522+ case VA_FOURCC_YV16:
5523+ case VA_FOURCC_411P:
5524+ case VA_FOURCC_422H:
5525+ case VA_FOURCC_422V:
5526+ case VA_FOURCC_444P:
5527+ switch (dst_fourcc) {
5528+ case VA_FOURCC_NV12:
5529+ pp_index = PP_PL3_LOAD_SAVE_N12;
5530+ break;
5531+ case VA_FOURCC_I420:
5532+ case VA_FOURCC_YV12:
5533+ case VA_FOURCC_IMC1:
5534+ case VA_FOURCC_IMC3:
5535+ pp_index = PP_PL3_LOAD_SAVE_PL3;
5536+ break;
5537+ case VA_FOURCC_YUY2:
5538+ case VA_FOURCC_UYVY:
5539+ pp_index = PP_PL3_LOAD_SAVE_PA;
5540+ break;
5541+ }
5542+ break;
5543+ }
5544+ return pp_index;
5545+}
5546+
5547+static VAStatus
5548+i965_proc_picture_fast(VADriverContextP ctx,
5549+ struct i965_proc_context *proc_context, struct proc_state *proc_state)
5550+{
5551+ struct i965_driver_data * const i965 = i965_driver_data(ctx);
5552+ const VAProcPipelineParameterBuffer * const pipeline_param =
5553+ (VAProcPipelineParameterBuffer *)proc_state->pipeline_param->buffer;
5554+ struct object_surface *src_obj_surface, *dst_obj_surface;
5555+ struct i965_surface src_surface, dst_surface;
5556+ const VAProcFilterParameterBufferDeinterlacing *deint_params = NULL;
5557+ VARectangle src_rect, dst_rect;
5558+ VAStatus status;
5559+ uint32_t i, filter_flags = 0, pp_ops = 0;
5560+ int pp_index;
5561+
5562+ /* Validate pipeline parameters */
5563+ if (pipeline_param->num_filters > 0 && !pipeline_param->filters)
5564+ return VA_STATUS_ERROR_INVALID_PARAMETER;
5565+
5566+ for (i = 0; i < pipeline_param->num_filters; i++) {
5567+ const VAProcFilterParameterBuffer *filter;
5568+ struct object_buffer * const obj_buffer =
5569+ BUFFER(pipeline_param->filters[i]);
5570+
5571+ assert(obj_buffer && obj_buffer->buffer_store);
5572+ if (!obj_buffer || !obj_buffer->buffer_store)
5573+ return VA_STATUS_ERROR_INVALID_PARAMETER;
5574+
5575+ filter = (VAProcFilterParameterBuffer *)
5576+ obj_buffer->buffer_store->buffer;
5577+ switch (filter->type) {
5578+ case VAProcFilterDeinterlacing:
5579+ pp_ops |= PP_OP_DEINTERLACE;
5580+ deint_params = (VAProcFilterParameterBufferDeinterlacing *)filter;
5581+ break;
5582+ default:
5583+ pp_ops |= PP_OP_COMPLEX;
5584+ break;
5585+ }
5586+ }
5587+ filter_flags |= pipeline_param->filter_flags & VA_FILTER_SCALING_MASK;
5588+
5589+ /* Validate source surface */
5590+ src_obj_surface = SURFACE(pipeline_param->surface);
5591+ if (!src_obj_surface)
5592+ return VA_STATUS_ERROR_INVALID_SURFACE;
5593+
5594+ if (!src_obj_surface->fourcc)
5595+ return VA_STATUS_ERROR_INVALID_IMAGE_FORMAT;
5596+
5597+ if (pipeline_param->surface_region) {
5598+ src_rect.x = pipeline_param->surface_region->x;
5599+ src_rect.y = pipeline_param->surface_region->y;
5600+ src_rect.width = pipeline_param->surface_region->width;
5601+ src_rect.height = pipeline_param->surface_region->height;
5602+ } else {
5603+ src_rect.x = 0;
5604+ src_rect.y = 0;
5605+ src_rect.width = src_obj_surface->orig_width;
5606+ src_rect.height = src_obj_surface->orig_height;
5607+ }
5608+
5609+ src_surface.base = &src_obj_surface->base;
5610+ src_surface.type = I965_SURFACE_TYPE_SURFACE;
5611+ src_surface.flags = I965_SURFACE_FLAG_FRAME;
5612+
5613+ if (pp_ops & PP_OP_DEINTERLACE) {
5614+ filter_flags |= !(deint_params->flags & VA_DEINTERLACING_BOTTOM_FIELD) ?
5615+ VA_TOP_FIELD : VA_BOTTOM_FIELD;
5616+ if (deint_params->algorithm != VAProcDeinterlacingBob)
5617+ pp_ops |= PP_OP_COMPLEX;
5618+ }
5619+ else if (pipeline_param->filter_flags & (VA_TOP_FIELD | VA_BOTTOM_FIELD)) {
5620+ filter_flags |= (pipeline_param->filter_flags & VA_TOP_FIELD) ?
5621+ VA_TOP_FIELD : VA_BOTTOM_FIELD;
5622+ pp_ops |= PP_OP_DEINTERLACE;
5623+ }
5624+ if (pp_ops & PP_OP_DEINTERLACE) // XXX: no bob-deinterlacing optimization yet
5625+ pp_ops |= PP_OP_COMPLEX;
5626+
5627+ /* Validate target surface */
5628+ dst_obj_surface = SURFACE(proc_state->current_render_target);
5629+ if (!dst_obj_surface)
5630+ return VA_STATUS_ERROR_INVALID_SURFACE;
5631+
5632+ if (dst_obj_surface->fourcc &&
5633+ dst_obj_surface->fourcc != src_obj_surface->fourcc)
5634+ pp_ops |= PP_OP_CHANGE_FORMAT;
5635+
5636+ if (pipeline_param->output_region) {
5637+ dst_rect.x = pipeline_param->output_region->x;
5638+ dst_rect.y = pipeline_param->output_region->y;
5639+ dst_rect.width = pipeline_param->output_region->width;
5640+ dst_rect.height = pipeline_param->output_region->height;
5641+ } else {
5642+ dst_rect.x = 0;
5643+ dst_rect.y = 0;
5644+ dst_rect.width = dst_obj_surface->orig_width;
5645+ dst_rect.height = dst_obj_surface->orig_height;
5646+ }
5647+
5648+ if (dst_rect.width != src_rect.width || dst_rect.height != src_rect.height)
5649+ pp_ops |= PP_OP_CHANGE_SIZE;
5650+
5651+ dst_surface.base = &dst_obj_surface->base;
5652+ dst_surface.type = I965_SURFACE_TYPE_SURFACE;
5653+ dst_surface.flags = I965_SURFACE_FLAG_FRAME;
5654+
5655+ /* Validate "fast-path" processing capabilities */
5656+ if (!IS_GEN7(i965->intel.device_info)) {
5657+ if ((pp_ops & PP_OP_CHANGE_FORMAT) && (pp_ops & PP_OP_CHANGE_SIZE))
5658+ return VA_STATUS_ERROR_UNIMPLEMENTED; // temporary surface is needed
5659+ }
5660+ if (pipeline_param->pipeline_flags & VA_PROC_PIPELINE_FAST) {
5661+ filter_flags &= ~VA_FILTER_SCALING_MASK;
5662+ filter_flags |= VA_FILTER_SCALING_FAST;
5663+ }
5664+ else {
5665+ if (pp_ops & PP_OP_COMPLEX)
5666+ return VA_STATUS_ERROR_UNIMPLEMENTED; // full pipeline is needed
5667+ if ((filter_flags & VA_FILTER_SCALING_MASK) > VA_FILTER_SCALING_HQ)
5668+ return VA_STATUS_ERROR_UNIMPLEMENTED;
5669+ }
5670+
5671+ pp_index = pp_get_kernel_index(src_obj_surface->fourcc,
5672+ dst_obj_surface->fourcc, pp_ops, filter_flags);
5673+ if (pp_index < 0)
5674+ return VA_STATUS_ERROR_UNIMPLEMENTED;
5675+
5676+ proc_context->pp_context.filter_flags = filter_flags;
5677+ status = i965_post_processing_internal(ctx, &proc_context->pp_context,
5678+ &src_surface, &src_rect, &dst_surface, &dst_rect, pp_index, NULL);
5679+ intel_batchbuffer_flush(proc_context->pp_context.batch);
5680+ return status;
5681+}
5682+
54485683 VAStatus
54495684 i965_proc_picture(VADriverContextP ctx,
54505685 VAProfile profile,
@@ -5465,6 +5700,10 @@ i965_proc_picture(VADriverContextP ctx,
54655700 unsigned int tiling = 0, swizzle = 0;
54665701 int in_width, in_height;
54675702
5703+ status = i965_proc_picture_fast(ctx, proc_context, proc_state);
5704+ if (status != VA_STATUS_ERROR_UNIMPLEMENTED)
5705+ return status;
5706+
54685707 if (pipeline_param->surface == VA_INVALID_ID ||
54695708 proc_state->current_render_target == VA_INVALID_ID) {
54705709 status = VA_STATUS_ERROR_INVALID_SURFACE;