#ifndef __I965_POST_PROCESSING_H__
#define __I965_POST_PROCESSING_H__
-#define MAX_PP_SURFACES 32
+#include "i965_vpp_avs.h"
+#include <drm.h>
+#include <i915_drm.h>
+#include <intel_bufmgr.h>
+#include "i965_gpe_utils.h"
-#define I965_PP_FLAG_TOP_FIELD 0x00000001
-#define I965_PP_FLAG_BOTTOM_FIELD 0x00000002
+#define MAX_PP_SURFACES 48
-#define I965_PP_FLAG_SCALING 0x00000010
-#define I965_PP_FLAG_AVS 0x00000020
-#define I965_PP_FLAG_DEINTERLACING 0x00000100 /* XXX: don't support MCDI yet */
-#define I965_PP_FLAG_DENOISE 0x00000200
+struct i965_gpe_context;
-enum
-{
+enum {
PP_NULL = 0,
- PP_NV12_LOAD_SAVE,
+ PP_NV12_LOAD_SAVE_N12,
+ PP_NV12_LOAD_SAVE_PL3,
+ PP_PL3_LOAD_SAVE_N12,
+ PP_PL3_LOAD_SAVE_PL3,
PP_NV12_SCALING,
PP_NV12_AVS,
PP_NV12_DNDI,
+ PP_NV12_DN,
+ PP_NV12_LOAD_SAVE_PA,
+ PP_PL3_LOAD_SAVE_PA,
+ PP_PA_LOAD_SAVE_NV12,
+ PP_PA_LOAD_SAVE_PL3,
+ PP_PA_LOAD_SAVE_PA,
+ PP_RGBX_LOAD_SAVE_NV12,
+ PP_NV12_LOAD_SAVE_RGBX,
+ NUM_PP_MODULES,
};
-#define NUM_PP_MODULES 5
+struct i965_post_processing_context;
-struct pp_load_save_context
-{
+struct pp_load_save_context {
+ int dest_x;
+ int dest_y;
int dest_w;
int dest_h;
};
-struct pp_scaling_context
-{
+struct pp_scaling_context {
int dest_x; /* in pixel */
int dest_y; /* in pixel */
int dest_w;
int dest_h;
- int src_normalized_x;
- int src_normalized_y;
+ float src_normalized_x;
+ float src_normalized_y;
};
-struct pp_avs_context
-{
+struct pp_avs_context {
+ AVSState state;
int dest_x; /* in pixel */
int dest_y; /* in pixel */
int dest_w;
int dest_h;
- int src_normalized_x;
- int src_normalized_y;
+ float src_normalized_x;
+ float src_normalized_y;
int src_w;
int src_h;
+ float horiz_range;
};
-struct pp_dndi_context
-{
+enum {
+ DNDI_FRAME_IN_CURRENT = 0,
+ DNDI_FRAME_IN_PREVIOUS,
+ DNDI_FRAME_IN_STMM,
+ DNDI_FRAME_OUT_STMM,
+ DNDI_FRAME_OUT_CURRENT,
+ DNDI_FRAME_OUT_PREVIOUS,
+ DNDI_FRAME_STORE_COUNT
+};
+
+typedef struct dndi_frame_store {
+ struct object_surface *obj_surface;
+ VASurfaceID surface_id; /* always relative to the input surface */
+ unsigned int is_scratch_surface : 1;
+} DNDIFrameStore;
+
+struct pp_dndi_context {
+ int dest_w;
+ int dest_h;
+ DNDIFrameStore frame_store[DNDI_FRAME_STORE_COUNT];
+
+ /* Temporary flags live until the current picture is processed */
+ unsigned int is_di_enabled : 1;
+ unsigned int is_di_adv_enabled : 1;
+ unsigned int is_first_frame : 1;
+ unsigned int is_second_field : 1;
+};
+
+struct pp_dn_context {
int dest_w;
int dest_h;
+ dri_bo *stmm_bo;
};
-struct pp_module
-{
+struct i965_post_processing_context;
+
+struct pp_module {
struct i965_kernel kernel;
-
+
/* others */
- void (*initialize)(VADriverContextP ctx,
- VASurfaceID in_surface_id, VASurfaceID out_surface_id,
- const VARectangle *src_rect, const VARectangle *dst_rect);
+ VAStatus(*initialize)(VADriverContextP ctx, struct i965_post_processing_context *pp_context,
+ const struct i965_surface *src_surface,
+ const VARectangle *src_rect,
+ struct i965_surface *dst_surface,
+ const VARectangle *dst_rect,
+ void *filter_param);
};
-struct pp_static_parameter
-{
+struct pp_static_parameter {
struct {
/* Procamp r1.0 */
float procamp_constant_c0;
-
+
/* Load and Same r1.1 */
- unsigned int source_packed_y_offset:8;
- unsigned int source_packed_u_offset:8;
- unsigned int source_packed_v_offset:8;
- unsigned int pad0:8;
+ unsigned int source_packed_y_offset: 8;
+ unsigned int source_packed_u_offset: 8;
+ unsigned int source_packed_v_offset: 8;
+ unsigned int source_rgb_layout: 8; // 1 for |R|G|B|X| layout, 0 for |B|G|R|X| layout
union {
/* Load and Save r1.2 */
struct {
- unsigned int destination_packed_y_offset:8;
- unsigned int destination_packed_u_offset:8;
- unsigned int destination_packed_v_offset:8;
- unsigned int pad0:8;
+ unsigned int destination_packed_y_offset: 8;
+ unsigned int destination_packed_u_offset: 8;
+ unsigned int destination_packed_v_offset: 8;
+ unsigned int pad0: 8;
} load_and_save;
/* CSC r1.2 */
struct {
- unsigned int destination_rgb_format:8;
- unsigned int pad0:24;
+ unsigned int pad0: 24;
+ unsigned int destination_rgb_layout: 8; // 1 for |R|G|B|X| layout, 0 for |B|G|R|X| layout
} csc;
} r1_2;
-
+
/* Procamp r1.3 */
float procamp_constant_c1;
float procamp_constant_c2;
/* DI r1.5 */
- unsigned int statistics_surface_picth:16; /* Devided by 2 */
- unsigned int pad1:16;
+ unsigned int statistics_surface_picth: 16; /* Devided by 2 */
+ unsigned int pad1: 16;
union {
/* DI r1.6 */
struct {
- unsigned int pad0:24;
- unsigned int top_field_first:8;
+ unsigned int pad0: 24;
+ unsigned int top_field_first: 8;
} di;
/* AVS/Scaling r1.6 */
/* Procamp r1.7 */
float procamp_constant_c5;
} grf1;
-
+
struct {
/* Procamp r2.0 */
float procamp_constant_c3;
/* Blending r3.2 */
float normalized_alpha_y_scaling;
-
+
/* WG+CSC r3.3 */
float wg_csc_constant_c4;
float wg_csc_constant_c1;
/* ALL r3.5 */
- int horizontal_origin_offset:16;
- int vertical_origin_offset:16;
+ int horizontal_origin_offset: 16;
+ int vertical_origin_offset: 16;
/* Shared r3.6*/
union {
union {
/* AVS */
struct {
- unsigned int pad1:15;
- unsigned int nlas:1;
- unsigned int pad2:16;
+ unsigned int pad1: 15;
+ unsigned int nlas: 1;
+ unsigned int pad2: 16;
} avs;
/* DI */
struct {
- unsigned int motion_history_coefficient_m2:8;
- unsigned int motion_history_coefficient_m1:8;
- unsigned int pad0:16;
+ unsigned int motion_history_coefficient_m2: 8;
+ unsigned int motion_history_coefficient_m1: 8;
+ unsigned int pad0: 16;
} di;
} r4_2;
} grf4;
};
-struct pp_inline_parameter
-{
+struct pp_inline_parameter {
struct {
/* ALL r5.0 */
- int destination_block_horizontal_origin:16;
- int destination_block_vertical_origin:16;
+ int destination_block_horizontal_origin: 16;
+ int destination_block_vertical_origin: 16;
/* Shared r5.1 */
union {
/* FMD */
struct {
- unsigned int variance_surface_vertical_origin:16;
- unsigned int pad0:16;
+ unsigned int variance_surface_vertical_origin: 16;
+ unsigned int pad0: 16;
} fmd;
- } r5_1;
+ } r5_1;
/* AVS/Scaling r5.2 */
float source_surface_block_normalized_vertical_origin;
float alpha_surface_block_normalized_vertical_origin;
/* Alpha r5.5 */
- unsigned int alpha_mask_x:16;
- unsigned int alpha_mask_y:8;
- unsigned int block_count_x:8;
+ unsigned int alpha_mask_x: 16;
+ unsigned int alpha_mask_y: 8;
+ unsigned int block_count_x: 8;
/* r5.6 */
- unsigned int block_horizontal_mask:16;
- unsigned int block_vertical_mask:8;
- unsigned int number_blocks:8;
+ /* we only support M*1 or 1*N block partitation now.
+ * -- it means asm code only need update this mask from grf6 for the last block
+ */
+ unsigned int block_horizontal_mask: 16;
+ unsigned int block_vertical_mask: 8;
+ unsigned int number_blocks: 8;
/* AVS/Scaling r5.7 */
float normalized_video_x_scaling_step;
/* AVS r6.0 */
float video_step_delta;
- /* r6.1-r6.7 */
+ /* r6.1 */ // sizeof(int) == 4?
+ unsigned int block_horizontal_mask_right: 16;
+ unsigned int block_vertical_mask_bottom: 8;
+ unsigned int pad1: 8;
+
+ /* r6.2 */
+ unsigned int block_horizontal_mask_middle: 16;
+ unsigned int pad2: 16;
+
+ /* r6.3-r6.7 */
+ unsigned int padx[5];
+ } grf6;
+};
+
+struct gen7_pp_static_parameter {
+ struct {
+ /* r1.0-r1.5 */
+ unsigned int padx[6];
+ /* r1.6 */
+ unsigned int di_statistics_surface_pitch_div2: 16;
+ unsigned int di_statistics_surface_height_div4: 16;
+ /* r1.7 */
+ unsigned int di_top_field_first: 8;
+ unsigned int pad0: 16;
+ unsigned int pointer_to_inline_parameter: 8; /* value: 7 */
+ } grf1;
+
+ struct {
+ /* r2.0 */
+ /* Indicates whether the rgb is swapped for the src surface
+ * 0: RGBX(MSB. X-B-G-R). 1: BGRX(MSB: X-R-G-B)
+ */
+ unsigned int src_avs_rgb_swap: 1;
+ unsigned int pad3: 31;
+
+ /* r2.1 */
+ unsigned int pad2: 16;
+ unsigned int save_avs_rgb_swap: 1; /* 0: RGB, 1: BGR */
+ unsigned int avs_wa_enable: 1; /* must enabled for GEN7 */
+ unsigned int ief_enable: 1;
+ unsigned int avs_wa_width: 13;
+
+ /* 2.2 */
+ float avs_wa_one_div_256_width;
+
+ /* 2.3 */
+ float avs_wa_five_div_256_width;
+
+ /* 2.4 - 2.6 */
+ unsigned int padx[3];
+
+ /* r2.7 */
+ unsigned int di_destination_packed_y_component_offset: 8;
+ unsigned int di_destination_packed_u_component_offset: 8;
+ unsigned int di_destination_packed_v_component_offset: 8;
+ unsigned int alpha: 8;
+ } grf2;
+
+ struct {
+ float sampler_load_horizontal_scaling_step_ratio;
+ unsigned int padx[7];
+ } grf3;
+
+ struct {
+ float sampler_load_vertical_scaling_step;
+ unsigned int pad0;
+ unsigned int di_hoffset_svf_from_dvf: 16;
+ unsigned int di_voffset_svf_from_dvf: 16;
+ unsigned int padx[5];
+ } grf4;
+
+ struct {
+ float sampler_load_vertical_frame_origin;
+ unsigned int padx[7];
+ } grf5;
+
+ struct {
+ float sampler_load_horizontal_frame_origin;
unsigned int padx[7];
} grf6;
+
+ struct {
+ /* r7.0 -> r7.3 */
+ float coef_ry;
+ float coef_ru;
+ float coef_rv;
+ float coef_yd;
+
+ /* r7.4 -> r7.7 */
+ float coef_gy;
+ float coef_gu;
+ float coef_gv;
+ float coef_ud;
+ } grf7;
+
+ struct {
+ /* r8.0 -> r8.3 */
+ float coef_by;
+ float coef_bu;
+ float coef_bv;
+ float coef_vd;
+
+ /* r8.4 -> r8.7 */
+ unsigned int padx[4];
+ } grf8;
+};
+
+struct gen7_pp_inline_parameter {
+ struct {
+ /* r9.0 */
+ unsigned int destination_block_horizontal_origin: 16;
+ unsigned int destination_block_vertical_origin: 16;
+ /* r9.1: 0xffffffff */
+ unsigned int constant_0;
+ /* r9.2 */
+ unsigned int pad0;
+ /* r9.3 */
+ unsigned int pad1;
+ /* r9.4 */
+ float sampler_load_main_video_x_scaling_step;
+ /* r9.5 */
+ unsigned int pad2;
+ /* r9.6: must be zero */
+ unsigned int avs_vertical_block_number;
+ /* r9.7: 0 */
+ unsigned int group_id_number;
+ } grf9;
+
+ struct {
+ unsigned int padx[8];
+ } grf10;
};
-struct i965_post_processing_context
-{
+struct i965_post_processing_context {
int current_pp;
struct pp_module pp_modules[NUM_PP_MODULES];
- struct pp_static_parameter pp_static_parameter;
- struct pp_inline_parameter pp_inline_parameter;
+ void *pp_static_parameter;
+ void *pp_inline_parameter;
struct {
dri_bo *bo;
- } curbe;
-
- struct {
- dri_bo *ss_bo;
- dri_bo *s_bo;
- } surfaces[MAX_PP_SURFACES];
+ } surface_state_binding_table;
struct {
dri_bo *bo;
- } binding_table;
+ } curbe;
struct {
dri_bo *bo;
} urb;
struct {
- dri_bo *bo;
- } stmm;
-
- union {
- struct pp_load_save_context pp_load_save_context;
- struct pp_scaling_context pp_scaling_context;
- struct pp_avs_context pp_avs_context;
- struct pp_dndi_context pp_dndi_context;
- } private_context;
+ unsigned int gpgpu_mode : 1;
+ unsigned int pad0 : 7;
+ unsigned int max_num_threads : 16;
+ unsigned int num_urb_entries : 8;
+ unsigned int urb_entry_size : 16;
+ unsigned int curbe_allocation_size : 16;
+ } vfe_gpu_state;
+
+ struct intel_vebox_context *vebox_proc_ctx;
+
+ struct pp_load_save_context pp_load_save_context;
+ struct pp_scaling_context pp_scaling_context;
+ struct pp_avs_context pp_avs_context;
+ struct pp_dndi_context pp_dndi_context;
+ struct pp_dn_context pp_dn_context;
+ void *private_context; /* pointer to the current private context */
+ void *pipeline_param; /* pointer to the pipeline parameter */
+ /**
+ * \ref Extra filter flags used as a fast path.
+ *
+ * This corresponds to vaPutSurface() flags, for direct rendering,
+ * or to VAProcPipelineParameterBuffer.filter_flags when the VPP
+ * interfaces are used. In the latter case, this is just a copy of
+ * that field.
+ */
+ unsigned int filter_flags;
int (*pp_x_steps)(void *private_context);
int (*pp_y_steps)(void *private_context);
int (*pp_set_block_parameter)(struct i965_post_processing_context *pp_context, int x, int y);
-
- /* video process based on hsw vebox */
- struct intel_vebox_context *pp_vebox_context;
+
+ struct intel_batchbuffer *batch;
+
+ unsigned int block_horizontal_mask_left: 16;
+ unsigned int block_horizontal_mask_right: 16;
+ unsigned int block_vertical_mask_bottom: 8;
+
+ struct {
+ dri_bo *bo;
+ int bo_size;
+ unsigned int end_offset;
+ } instruction_state;
+
+ struct {
+ dri_bo *bo;
+ } indirect_state;
+
+ struct {
+ dri_bo *bo;
+ int bo_size;
+ unsigned int end_offset;
+ } dynamic_state;
+
+ unsigned int sampler_offset;
+ int sampler_size;
+ unsigned int idrt_offset;
+ int idrt_size;
+ unsigned int curbe_offset;
+ int curbe_size;
+
+ VAStatus(*intel_post_processing)(VADriverContextP ctx,
+ struct i965_post_processing_context *pp_context,
+ const struct i965_surface *src_surface,
+ const VARectangle *src_rect,
+ struct i965_surface *dst_surface,
+ const VARectangle *dst_rect,
+ int pp_index,
+ void * filter_param);
+ void (*finalize)(VADriverContextP ctx,
+ struct i965_post_processing_context *pp_context);
+
+
+ struct i965_gpe_context scaling_gpe_context;
+
+#define VPPGPE_8BIT_8BIT (1 << 0)
+#define VPPGPE_8BIT_10BIT (1 << 1)
+#define VPPGPE_10BIT_10BIT (1 << 2)
+#define VPPGPE_10BIT_8BIT (1 << 3)
+#define VPPGPE_8BIT_420_RGB32 (1 << 4)
+
+ unsigned int scaling_gpe_context_initialized;
+};
+
+struct i965_proc_context {
+ struct hw_context base;
+ void *driver_context;
+ struct i965_post_processing_context pp_context;
};
VASurfaceID
i965_post_processing(
VADriverContextP ctx,
- VASurfaceID surface,
+ struct object_surface *obj_surface,
const VARectangle *src_rect,
const VARectangle *dst_rect,
- unsigned int flags,
- int *has_done_scaling
+ unsigned int va_flags,
+ int *has_done_scaling,
+ VARectangle *calibrated_rect
);
-Bool
+VAStatus
+i965_scaling_processing(
+ VADriverContextP ctx,
+ struct object_surface *src_surface_obj,
+ const VARectangle *src_rect,
+ struct object_surface *dst_surface_obj,
+ const VARectangle *dst_rect,
+ unsigned int va_flags
+);
+
+VAStatus
+i965_image_processing(VADriverContextP ctx,
+ const struct i965_surface *src_surface,
+ const VARectangle *src_rect,
+ struct i965_surface *dst_surface,
+ const VARectangle *dst_rect);
+
+void
i965_post_processing_terminate(VADriverContextP ctx);
-Bool
+bool
i965_post_processing_init(VADriverContextP ctx);
+
+extern VAStatus
+i965_proc_picture(VADriverContextP ctx,
+ VAProfile profile,
+ union codec_state *codec_state,
+ struct hw_context *hw_context);
+
+int
+pp_get_surface_fourcc(VADriverContextP ctx, const struct i965_surface *surface);
+
#endif /* __I965_POST_PROCESSING_H__ */