kolibrios-fun/drivers/video/i965/gen75_vpp_vebox.c
Sergey Semyonov (Serge) 84ab2d2d6b intel: update 2D driver & VA driver
git-svn-id: svn://kolibrios.org@3769 a494cfbc-eb01-0410-851d-a64ba20cac60
2013-07-06 06:25:41 +00:00

862 lines
34 KiB
C

/*
* Copyright © 2011 Intel Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sub license, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice (including the
* next paragraph) shall be included in all copies or substantial portions
* of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
* IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*
* Authors:
* Li Xiaowei <xiaowei.a.li@intel.com>
*/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <assert.h>
#include <math.h>
#include "intel_batchbuffer.h"
#include "intel_driver.h"
#include "i965_defines.h"
#include "i965_structs.h"
#include "gen75_vpp_vebox.h"
#define PI 3.1415926
extern VAStatus
i965_CreateSurfaces(VADriverContextP ctx,
int width,
int height,
int format,
int num_surfaces,
VASurfaceID *surfaces);
int format_convert(float src, int out_int_bits, int out_frac_bits,int out_sign_flag)
{
unsigned char negative_flag = (src < 0.0) ? 1 : 0;
float src_1 = (!negative_flag)? src: -src ;
unsigned int factor = 1 << out_frac_bits;
int output_value = 0;
unsigned int integer_part = 0;//floor(src_1);
unsigned int fraction_part = ((int)((src_1 - integer_part) * factor)) & (factor - 1) ;
output_value = (integer_part << out_frac_bits) | fraction_part;
if(negative_flag)
output_value = (~output_value + 1) & ((1 <<(out_int_bits + out_frac_bits)) -1);
if(out_sign_flag == 1 && negative_flag)
{
output_value |= negative_flag <<(out_int_bits + out_frac_bits);
}
return output_value;
}
void hsw_veb_dndi_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int* p_table ;
/*
VAProcFilterParameterBufferDeinterlacing *di_param =
(VAProcFilterParameterBufferDeinterlacing *) proc_ctx->filter_di;
VAProcFilterParameterBuffer * dn_param =
(VAProcFilterParameterBuffer *) proc_ctx->filter_dn;
*/
p_table = (unsigned int *)proc_ctx->dndi_state_table.ptr;
*p_table ++ = 0; // reserved . w0
*p_table ++ = ( 0 << 24 | // denoise STAD threshold . w1
128 << 16 | // dnmh_history_max
0 << 12 | // reserved
8 << 8 | // dnmh_delta[3:0]
0 ); // denoise ASD threshold
*p_table ++ = ( 0 << 30 | // reserved . w2
16 << 24 | // temporal diff th
0 << 22 | // reserved.
8 << 16 | // low temporal diff th
0 << 13 | // STMM C2
0 << 8 | // denoise moving pixel th
64 ); // denoise th for sum of complexity measure
*p_table ++ = ( 0 << 30 | // reserved . w3
4 << 24 | // good neighbor th[5:0]
9 << 20 | // CAT slope minus 1
5 << 16 | // SAD Tight in
0 << 14 | // smooth mv th
0 << 12 | // reserved
1 << 8 | // bne_edge_th[3:0]
15 ); // block noise estimate noise th
*p_table ++ = ( 0 << 31 | // STMM blending constant select. w4
64 << 24 | // STMM trc1
0 << 16 | // STMM trc2
0 << 14 | // reserved
2 << 8 | // VECM_mul
128 ); // maximum STMM
*p_table ++ = ( 0 << 24 | // minumum STMM . W5
0 << 22 | // STMM shift down
0 << 20 | // STMM shift up
7 << 16 | // STMM output shift
128 << 8 | // SDI threshold
8 ); // SDI delta
*p_table ++ = ( 0 << 24 | // SDI fallback mode 1 T1 constant . W6
0 << 16 | // SDI fallback mode 1 T2 constant
0 << 8 | // SDI fallback mode 2 constant(angle2x1)
0 ); // FMD temporal difference threshold
*p_table ++ = ( 32 << 24 | // FMD #1 vertical difference th . w7
32 << 16 | // FMD #2 vertical difference th
1 << 14 | // CAT th1
32 << 8 | // FMD tear threshold
0 << 7 | // MCDI Enable, use motion compensated deinterlace algorithm
0 << 6 | // progressive DN
0 << 4 | // reserved
0 << 3 | // DN/DI Top First
0 ); // reserved
*p_table ++ = ( 0 << 29 | // reserved . W8
0 << 23 | // dnmh_history_init[5:0]
10 << 19 | // neighborPixel th
0 << 18 | // reserved
0 << 16 | // FMD for 2nd field of previous frame
25 << 10 | // MC pixel consistency th
0 << 8 | // FMD for 1st field for current frame
10 << 4 | // SAD THB
5 ); // SAD THA
*p_table ++ = ( 0 << 24 | // reserved
0 << 16 | // chr_dnmh_stad_th
0 << 13 | // reserved
0 << 12 | // chrome denoise enable
0 << 6 | // chr temp diff th
0 ); // chr temp diff low
}
void hsw_veb_iecp_std_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int *p_table = proc_ctx->iecp_state_table.ptr + 0 ;
/*
VAProcFilterParameterBuffer * std_param =
(VAProcFilterParameterBuffer *) proc_ctx->filter_std;
*/
if(!(proc_ctx->filters_mask & VPP_IECP_STD_STE)){
memset(p_table, 0, 29 * 4);
}else{
*p_table ++ = 0x9a6e39f0;
*p_table ++ = 0x400c0000;
*p_table ++ = 0x00001180;
*p_table ++ = 0xfe2f2e00;
*p_table ++ = 0x000000ff;
*p_table ++ = 0x00140000;
*p_table ++ = 0xd82e0000;
*p_table ++ = 0x8285ecec;
*p_table ++ = 0x00008282;
*p_table ++ = 0x00000000;
*p_table ++ = 0x02117000;
*p_table ++ = 0xa38fec96;
*p_table ++ = 0x0000c8c8;
*p_table ++ = 0x00000000;
*p_table ++ = 0x01478000;
*p_table ++ = 0x0007c306;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x1c1bd000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x0007cf80;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x1c080000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
}
}
void hsw_veb_iecp_ace_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int *p_table = (unsigned int*)(proc_ctx->iecp_state_table.ptr + 116);
if(!(proc_ctx->filters_mask & VPP_IECP_ACE)){
memset(p_table, 0, 13 * 4);
}else{
*p_table ++ = 0x00000068;
*p_table ++ = 0x4c382410;
*p_table ++ = 0x9c887460;
*p_table ++ = 0xebd8c4b0;
*p_table ++ = 0x604c3824;
*p_table ++ = 0xb09c8874;
*p_table ++ = 0x0000d8c4;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
}
}
void hsw_veb_iecp_tcc_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int *p_table = (unsigned int*)(proc_ctx->iecp_state_table.ptr + 168);
/*
VAProcFilterParameterBuffer * tcc_param =
(VAProcFilterParameterBuffer *) proc_ctx->filter_iecp_tcc;
*/
if(!(proc_ctx->filters_mask & VPP_IECP_TCC)){
memset(p_table, 0, 11 * 4);
}else{
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x1e34cc91;
*p_table ++ = 0x3e3cce91;
*p_table ++ = 0x02e80195;
*p_table ++ = 0x0197046b;
*p_table ++ = 0x01790174;
*p_table ++ = 0x00000000;
*p_table ++ = 0x00000000;
*p_table ++ = 0x03030000;
*p_table ++ = 0x009201c0;
}
}
void hsw_veb_iecp_pro_amp_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int contrast = 0x80; //default
int brightness = 0x00; //default
int cos_c_s = 256 ; //default
int sin_c_s = 0; //default
unsigned int *p_table = (unsigned int*)(proc_ctx->iecp_state_table.ptr + 212);
if(!(proc_ctx->filters_mask & VPP_IECP_PRO_AMP)){
memset(p_table, 0, 2 * 4);
}else {
float tmp_value = 0.0;
float src_saturation = 1.0;
float src_hue = 0.0;
float src_contrast = 1.0;
/*
float src_brightness = 0.0;
VAProcFilterParameterBufferColorBalance * amp_param =
(VAProcFilterParameterBufferColorBalance *) proc_ctx->filter_iecp_amp;
VAProcColorBalanceType attrib = amp_param->attrib;
if(attrib == VAProcColorBalanceHue) {
src_hue = amp_param->value; //(-180.0, 180.0)
}else if(attrib == VAProcColorBalanceSaturation) {
src_saturation = amp_param->value; //(0.0, 10.0)
}else if(attrib == VAProcColorBalanceBrightness) {
src_brightness = amp_param->value; // (-100.0, 100.0)
brightness = format_convert(src_brightness, 7, 4, 1);
}else if(attrib == VAProcColorBalanceContrast) {
src_contrast = amp_param->value; // (0.0, 10.0)
contrast = format_convert(src_contrast, 4, 7, 0);
}
*/
tmp_value = cos(src_hue/180*PI) * src_contrast * src_saturation;
cos_c_s = format_convert(tmp_value, 7, 8, 1);
tmp_value = sin(src_hue/180*PI) * src_contrast * src_saturation;
sin_c_s = format_convert(tmp_value, 7, 8, 1);
*p_table ++ = ( 0 << 28 | //reserved
contrast << 17 | //contrast value (U4.7 format)
0 << 13 | //reserved
brightness << 1| // S7.4 format
1);
*p_table ++ = ( cos_c_s << 16 | // cos(h) * contrast * saturation
sin_c_s); // sin(h) * contrast * saturation
}
}
void hsw_veb_iecp_csc_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int *p_table = (unsigned int*)(proc_ctx->iecp_state_table.ptr + 220);
float tran_coef[9] = {1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0};
float v_coef[3] = {0.0, 0.0, 0.0};
float u_coef[3] = {0.0, 0.0, 0.0};
int is_transform_enabled = 0;
if(!(proc_ctx->filters_mask & VPP_IECP_CSC)){
memset(p_table, 0, 8 * 4);
return;
}
/*
VAProcColorStandardType in_color_std = proc_ctx->pipeline_param->surface_color_standard;
VAProcColorStandardType out_color_std = proc_ctx->pipeline_param->output_color_standard;
assert(in_color_std == out_color_std);
*/
if(proc_ctx->fourcc_input == VA_FOURCC('R','G','B','A') &&
(proc_ctx->fourcc_output == VA_FOURCC('N','V','1','2') ||
proc_ctx->fourcc_output == VA_FOURCC('Y','V','1','2') ||
proc_ctx->fourcc_output == VA_FOURCC('Y','V','Y','2') ||
proc_ctx->fourcc_output == VA_FOURCC('A','Y','U','V'))) {
tran_coef[0] = 0.257;
tran_coef[1] = 0.504;
tran_coef[2] = 0.098;
tran_coef[3] = -0.148;
tran_coef[4] = -0.291;
tran_coef[5] = 0.439;
tran_coef[6] = 0.439;
tran_coef[7] = -0.368;
tran_coef[8] = -0.071;
u_coef[0] = 16 * 4;
u_coef[1] = 128 * 4;
u_coef[2] = 128 * 4;
is_transform_enabled = 1;
}else if((proc_ctx->fourcc_input == VA_FOURCC('N','V','1','2') ||
proc_ctx->fourcc_input == VA_FOURCC('Y','V','1','2') ||
proc_ctx->fourcc_input == VA_FOURCC('Y','U','Y','2') ||
proc_ctx->fourcc_input == VA_FOURCC('A','Y','U','V'))&&
proc_ctx->fourcc_output == VA_FOURCC('R','G','B','A')) {
tran_coef[0] = 1.164;
tran_coef[1] = 0.000;
tran_coef[2] = 1.569;
tran_coef[3] = 1.164;
tran_coef[4] = -0.813;
tran_coef[5] = -0.392;
tran_coef[6] = 1.164;
tran_coef[7] = 2.017;
tran_coef[8] = 0.000;
v_coef[0] = -16 * 4;
v_coef[1] = -128 * 4;
v_coef[2] = -128 * 4;
is_transform_enabled = 1;
}else if(proc_ctx->fourcc_input != proc_ctx->fourcc_output){
//enable when input and output format are different.
is_transform_enabled = 1;
}
if(is_transform_enabled == 0){
memset(p_table, 0, 8 * 4);
}else{
*p_table ++ = ( 0 << 29 | //reserved
format_convert(tran_coef[1], 2, 10, 1) << 16 | //c1, s2.10 format
format_convert(tran_coef[0], 2, 10, 1) << 3 | //c0, s2.10 format
0 << 2 | //reserved
0 << 1 | // yuv_channel swap
is_transform_enabled);
*p_table ++ = ( 0 << 26 | //reserved
format_convert(tran_coef[3], 2, 10, 1) << 13 |
format_convert(tran_coef[2], 2, 10, 1));
*p_table ++ = ( 0 << 26 | //reserved
format_convert(tran_coef[5], 2, 10, 1) << 13 |
format_convert(tran_coef[4], 2, 10, 1));
*p_table ++ = ( 0 << 26 | //reserved
format_convert(tran_coef[7], 2, 10, 1) << 13 |
format_convert(tran_coef[6], 2, 10, 1));
*p_table ++ = ( 0 << 13 | //reserved
format_convert(tran_coef[8], 2, 10, 1));
*p_table ++ = ( 0 << 22 | //reserved
format_convert(u_coef[0], 10, 0, 1) << 11 |
format_convert(v_coef[0], 10, 0, 1));
*p_table ++ = ( 0 << 22 | //reserved
format_convert(u_coef[1], 10, 0, 1) << 11 |
format_convert(v_coef[1], 10, 0, 1));
*p_table ++ = ( 0 << 22 | //reserved
format_convert(u_coef[2], 10, 0, 1) << 11 |
format_convert(v_coef[2], 10, 0, 1));
}
}
void hsw_veb_iecp_aoi_table(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
unsigned int *p_table = (unsigned int*)(proc_ctx->iecp_state_table.ptr + 252);
/*
VAProcFilterParameterBuffer * tcc_param =
(VAProcFilterParameterBuffer *) proc_ctx->filter_iecp_tcc;
*/
if(!(proc_ctx->filters_mask & VPP_IECP_AOI)){
memset(p_table, 0, 3 * 4);
}else{
*p_table ++ = 0x00000000;
*p_table ++ = 0x00030000;
*p_table ++ = 0x00030000;
}
}
void hsw_veb_state_table_setup(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
if(proc_ctx->filters_mask & 0x000000ff) {
dri_bo *dndi_bo = proc_ctx->dndi_state_table.bo;
dri_bo_map(dndi_bo, 1);
proc_ctx->dndi_state_table.ptr = dndi_bo->virtual;
hsw_veb_dndi_table(ctx, proc_ctx);
dri_bo_unmap(dndi_bo);
}
if(proc_ctx->filters_mask & 0x0000ff00 ||
proc_ctx->fourcc_input != proc_ctx->fourcc_output) {
dri_bo *iecp_bo = proc_ctx->iecp_state_table.bo;
dri_bo_map(iecp_bo, 1);
proc_ctx->iecp_state_table.ptr = iecp_bo->virtual;
hsw_veb_iecp_std_table(ctx, proc_ctx);
hsw_veb_iecp_ace_table(ctx, proc_ctx);
hsw_veb_iecp_tcc_table(ctx, proc_ctx);
hsw_veb_iecp_pro_amp_table(ctx, proc_ctx);
hsw_veb_iecp_csc_table(ctx, proc_ctx);
hsw_veb_iecp_aoi_table(ctx, proc_ctx);
dri_bo_unmap(iecp_bo);
}
}
void hsw_veb_state_command(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
struct intel_batchbuffer *batch = proc_ctx->batch;
unsigned int is_dn_enabled = (proc_ctx->filters_mask & 0x01)? 1: 0;
unsigned int is_di_enabled = (proc_ctx->filters_mask & 0x02)? 1: 0;
unsigned int is_iecp_enabled = (proc_ctx->filters_mask & 0xff00)?1:0;
BEGIN_VEB_BATCH(batch, 6);
OUT_VEB_BATCH(batch, VEB_STATE | (6 - 2));
OUT_VEB_BATCH(batch,
0 << 26 | // state surface control bits
0 << 11 | // reserved.
0 << 10 | // pipe sync disable
2 << 8 | // DI output frame
0 << 7 | // 444->422 downsample method
0 << 6 | // 422->420 downsample method
!!(proc_ctx->is_first_frame && (is_di_enabled || is_dn_enabled)) << 5 | // DN/DI first frame
is_di_enabled << 4 | // DI enable
is_dn_enabled << 3 | // DN enable
is_iecp_enabled << 2 | // global IECP enabled
0 << 1 | // ColorGamutCompressionEnable
0 ) ; // ColorGamutExpansionEnable.
OUT_RELOC(batch,
proc_ctx->dndi_state_table.bo,
I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
OUT_RELOC(batch,
proc_ctx->iecp_state_table.bo,
I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
OUT_RELOC(batch,
proc_ctx->gamut_state_table.bo,
I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
OUT_RELOC(batch,
proc_ctx->vertex_state_table.bo,
I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
ADVANCE_VEB_BATCH(batch);
}
void hsw_veb_surface_state(VADriverContextP ctx, struct intel_vebox_context *proc_ctx, unsigned int is_output)
{
struct i965_driver_data *i965 = i965_driver_data(ctx);
struct intel_batchbuffer *batch = proc_ctx->batch;
unsigned int u_offset_y = 0, v_offset_y = 0;
unsigned int is_uv_interleaved = 0, tiling = 0, swizzle = 0;
unsigned int surface_format = PLANAR_420_8;
struct object_surface* obj_surf = NULL;
unsigned int surface_pitch = 0;
unsigned int half_pitch_chroma = 0;
if(is_output){
obj_surf = SURFACE(proc_ctx->frame_store[FRAME_OUT_CURRENT].surface_id);
}else {
obj_surf = SURFACE(proc_ctx->frame_store[FRAME_IN_CURRENT].surface_id);
}
if (obj_surf->fourcc == VA_FOURCC_NV12) {
surface_format = PLANAR_420_8;
surface_pitch = obj_surf->width;
printf("NV12, is_output=%d, width = %d, pitch is = %d\n",is_output, obj_surf->orig_width, obj_surf->width);
is_uv_interleaved = 1;
half_pitch_chroma = 0;
} else if (obj_surf->fourcc == VA_FOURCC_YUY2) {
surface_format = YCRCB_NORMAL;
surface_pitch = obj_surf->width * 2;
is_uv_interleaved = 0;
half_pitch_chroma = 0;
} else if (obj_surf->fourcc == VA_FOURCC_AYUV) {
surface_format = PACKED_444A_8;
surface_pitch = obj_surf->width * 4;
is_uv_interleaved = 0;
half_pitch_chroma = 0;
} else if (obj_surf->fourcc == VA_FOURCC_RGBA) {
surface_format = R8G8B8A8_UNORM_SRGB;
surface_pitch = obj_surf->width * 4;
is_uv_interleaved = 0;
half_pitch_chroma = 0;
}
u_offset_y = obj_surf->y_cb_offset;
v_offset_y = obj_surf->y_cr_offset;
dri_bo_get_tiling(obj_surf->bo, &tiling, &swizzle);
BEGIN_VEB_BATCH(batch, 6);
OUT_VEB_BATCH(batch, VEB_SURFACE_STATE | (6 - 2));
OUT_VEB_BATCH(batch,
0 << 1 | // reserved
is_output); // surface indentification.
OUT_VEB_BATCH(batch,
(proc_ctx->pic_height - 1) << 18 | // height . w3
(proc_ctx->pic_width ) << 4 | // width
0); // reserve
OUT_VEB_BATCH(batch,
surface_format << 28 | // surface format, YCbCr420. w4
is_uv_interleaved << 27 | // interleave chrome , two seperate palar
0 << 20 | // reserved
(surface_pitch - 1) << 3 | // surface pitch, 64 align
half_pitch_chroma << 2 | // half pitch for chrome
!!tiling << 1 | // tiled surface, linear surface used
(tiling == I915_TILING_Y)); // tiled walk, ignored when liner surface
OUT_VEB_BATCH(batch,
0 << 29 | // reserved . w5
0 << 16 | // X offset for V(Cb)
0 << 15 | // reserved
u_offset_y); // Y offset for V(Cb)
OUT_VEB_BATCH(batch,
0 << 29 | // reserved . w6
0 << 16 | // X offset for V(Cr)
0 << 15 | // reserved
v_offset_y ); // Y offset for V(Cr)
ADVANCE_VEB_BATCH(batch);
}
void hsw_veb_dndi_iecp_command(VADriverContextP ctx, struct intel_vebox_context *proc_ctx)
{
struct intel_batchbuffer *batch = proc_ctx->batch;
unsigned char frame_ctrl_bits = 0;
unsigned int startingX = 0;
unsigned int endingX = proc_ctx->pic_width;
BEGIN_VEB_BATCH(batch, 10);
OUT_VEB_BATCH(batch, VEB_DNDI_IECP_STATE | (10 - 2));
OUT_VEB_BATCH(batch,
startingX << 16 |
endingX);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_IN_CURRENT].bo,
I915_GEM_DOMAIN_RENDER, 0, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_IN_PREVIOUS].bo,
I915_GEM_DOMAIN_RENDER, 0, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_IN_STMM].bo,
I915_GEM_DOMAIN_RENDER, 0, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_OUT_STMM].bo,
I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].bo,
I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_OUT_CURRENT].bo,
I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_OUT_PREVIOUS].bo,
I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, frame_ctrl_bits);
OUT_RELOC(batch,
proc_ctx->frame_store[FRAME_OUT_STATISTIC].bo,
I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, frame_ctrl_bits);
ADVANCE_VEB_BATCH(batch);
}
void hsw_veb_surface_reference(VADriverContextP ctx,
struct intel_vebox_context *proc_ctx)
{
struct object_surface * obj_surf;
struct i965_driver_data *i965 = i965_driver_data(ctx);
/* update the input surface */
obj_surf = SURFACE(proc_ctx->surface_input);
proc_ctx->frame_store[FRAME_IN_CURRENT].surface_id = proc_ctx->surface_input;
proc_ctx->frame_store[FRAME_IN_CURRENT].bo = obj_surf->bo;
proc_ctx->frame_store[FRAME_IN_CURRENT].is_internal_surface = 0;
dri_bo_reference(proc_ctx->frame_store[FRAME_IN_CURRENT].bo);
/* update the output surface */
if(proc_ctx->filters_mask == VPP_DNDI_DN){
obj_surf = SURFACE(proc_ctx->surface_output);
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].surface_id = proc_ctx->surface_output;
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].bo = obj_surf->bo;
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].is_internal_surface = 0;
dri_bo_reference(proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].bo);
}else {
obj_surf = SURFACE(proc_ctx->surface_output);
proc_ctx->frame_store[FRAME_OUT_CURRENT].surface_id = proc_ctx->surface_output;
proc_ctx->frame_store[FRAME_OUT_CURRENT].bo = obj_surf->bo;
proc_ctx->frame_store[FRAME_OUT_CURRENT].is_internal_surface = 0;
dri_bo_reference(proc_ctx->frame_store[FRAME_OUT_CURRENT].bo);
}
}
void hsw_veb_surface_unreference(VADriverContextP ctx,
struct intel_vebox_context *proc_ctx)
{
/* unreference the input surface */
dri_bo_unreference(proc_ctx->frame_store[FRAME_IN_CURRENT].bo);
proc_ctx->frame_store[FRAME_IN_CURRENT].surface_id = -1;
proc_ctx->frame_store[FRAME_IN_CURRENT].bo = NULL;
proc_ctx->frame_store[FRAME_IN_CURRENT].is_internal_surface = 0;
dri_bo_unreference(proc_ctx->frame_store[FRAME_IN_CURRENT].bo);
/* unreference the shared output surface */
if(proc_ctx->filters_mask == VPP_DNDI_DN){
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].surface_id = -1;
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].bo = NULL;
proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].is_internal_surface = 0;
dri_bo_unreference(proc_ctx->frame_store[FRAME_OUT_CURRENT_DN].bo);
}else{
proc_ctx->frame_store[FRAME_OUT_CURRENT].surface_id = -1;
proc_ctx->frame_store[FRAME_OUT_CURRENT].bo = NULL;
proc_ctx->frame_store[FRAME_OUT_CURRENT].is_internal_surface = 0;
dri_bo_unreference(proc_ctx->frame_store[FRAME_OUT_CURRENT].bo);
}
}
void hsw_veb_resource_prepare(VADriverContextP ctx,
struct intel_vebox_context *proc_ctx)
{
VAStatus va_status;
dri_bo *bo;
struct i965_driver_data *i965 = i965_driver_data(ctx);
unsigned int input_fourcc, output_fourcc;
unsigned int input_sampling, output_sampling;
unsigned int input_tiling, output_tiling;
unsigned int i, swizzle;
struct object_surface* obj_surf_in = SURFACE(proc_ctx->surface_input);
struct object_surface* obj_surf_out = SURFACE(proc_ctx->surface_output);
assert(obj_surf_in->orig_width == obj_surf_out->orig_width &&
obj_surf_in->orig_height == obj_surf_out->orig_height);
proc_ctx->pic_width = obj_surf_in->orig_width;
proc_ctx->pic_height = obj_surf_in->orig_height;
/* record vebox pipeline input surface format information*/
if(obj_surf_in->bo == NULL){
input_fourcc = VA_FOURCC('N','V','1','2');
input_sampling = SUBSAMPLE_YUV420;
input_tiling = 1;
i965_check_alloc_surface_bo(ctx, obj_surf_in, input_tiling, input_fourcc, input_sampling);
} else {
input_fourcc = obj_surf_in->fourcc;
input_sampling = obj_surf_in->subsampling;
dri_bo_get_tiling(obj_surf_in->bo, &input_tiling, &swizzle);
input_tiling = !!input_tiling;
}
/* record vebox pipeline output surface format information */
if(obj_surf_out->bo == NULL){
output_fourcc = VA_FOURCC('N','V','1','2');
output_sampling = SUBSAMPLE_YUV420;
output_tiling = 1;
i965_check_alloc_surface_bo(ctx, obj_surf_out, output_tiling, output_fourcc, output_sampling);
}else {
output_fourcc = obj_surf_out->fourcc;
output_sampling = obj_surf_out->subsampling;
dri_bo_get_tiling(obj_surf_out->bo, &output_tiling, &swizzle);
output_tiling = !!output_tiling;
}
assert(input_fourcc == VA_FOURCC_NV12 ||
input_fourcc == VA_FOURCC_YUY2 ||
input_fourcc == VA_FOURCC_AYUV ||
input_fourcc == VA_FOURCC_RGBA);
assert(output_fourcc == VA_FOURCC_NV12 ||
output_fourcc == VA_FOURCC_YUY2 ||
output_fourcc == VA_FOURCC_AYUV ||
output_fourcc == VA_FOURCC_RGBA);
proc_ctx->fourcc_input = input_fourcc;
proc_ctx->fourcc_output = output_fourcc;
/* allocate vebox pipeline surfaces */
VASurfaceID surfaces[FRAME_STORE_SUM];
va_status = i965_CreateSurfaces(ctx,
proc_ctx ->pic_width,
proc_ctx ->pic_height,
VA_RT_FORMAT_YUV420,
FRAME_STORE_SUM,
surfaces);
assert(va_status == VA_STATUS_SUCCESS);
for(i = FRAME_IN_CURRENT; i < FRAME_STORE_SUM; i ++) {
proc_ctx->frame_store[i].surface_id = surfaces[i];
struct object_surface* obj_surf = SURFACE(surfaces[i]);
if( i == FRAME_IN_CURRENT) {
proc_ctx->frame_store[i].surface_id = proc_ctx->surface_input;
proc_ctx->frame_store[i].bo = (SURFACE(proc_ctx->surface_input))->bo;
proc_ctx->frame_store[i].is_internal_surface = 0;
continue;
}else if( i == FRAME_IN_PREVIOUS || i == FRAME_OUT_CURRENT_DN) {
i965_check_alloc_surface_bo(ctx, obj_surf, input_tiling, input_fourcc, input_sampling);
} else if( i == FRAME_IN_STMM || i == FRAME_OUT_STMM){
i965_check_alloc_surface_bo(ctx, obj_surf, 1, input_fourcc, input_sampling);
} else if( i >= FRAME_OUT_CURRENT){
i965_check_alloc_surface_bo(ctx, obj_surf, output_tiling, output_fourcc, output_sampling);
}
proc_ctx->frame_store[i].bo = obj_surf->bo;
dri_bo_reference(proc_ctx->frame_store[i].bo);
proc_ctx->frame_store[i].is_internal_surface = 1;
}
/* alloc dndi state table */
dri_bo_unreference(proc_ctx->dndi_state_table.bo);
bo = dri_bo_alloc(i965->intel.bufmgr,
"vebox: dndi state Buffer",
0x1000, 0x1000);
proc_ctx->dndi_state_table.bo = bo;
dri_bo_reference(proc_ctx->dndi_state_table.bo);
/* alloc iecp state table */
dri_bo_unreference(proc_ctx->iecp_state_table.bo);
bo = dri_bo_alloc(i965->intel.bufmgr,
"vebox: iecp state Buffer",
0x1000, 0x1000);
proc_ctx->iecp_state_table.bo = bo;
dri_bo_reference(proc_ctx->iecp_state_table.bo);
/* alloc gamut state table */
dri_bo_unreference(proc_ctx->gamut_state_table.bo);
bo = dri_bo_alloc(i965->intel.bufmgr,
"vebox: gamut state Buffer",
0x1000, 0x1000);
proc_ctx->gamut_state_table.bo = bo;
dri_bo_reference(proc_ctx->gamut_state_table.bo);
/* alloc vertex state table */
dri_bo_unreference(proc_ctx->vertex_state_table.bo);
bo = dri_bo_alloc(i965->intel.bufmgr,
"vertex: iecp state Buffer",
0x1000, 0x1000);
proc_ctx->vertex_state_table.bo = bo;
dri_bo_reference(proc_ctx->vertex_state_table.bo);
}
VAStatus gen75_vebox_process_picture(VADriverContextP ctx,
struct intel_vebox_context *proc_ctx)
{
VAStatus va_status = VA_STATUS_SUCCESS;
if(proc_ctx->is_first_frame)
hsw_veb_resource_prepare(ctx, proc_ctx);
hsw_veb_surface_reference(ctx, proc_ctx);
intel_batchbuffer_start_atomic_veb(proc_ctx->batch, 0x1000);
intel_batchbuffer_emit_mi_flush(proc_ctx->batch);
hsw_veb_surface_state(ctx, proc_ctx, INPUT_SURFACE);
hsw_veb_surface_state(ctx, proc_ctx, OUTPUT_SURFACE);
hsw_veb_state_table_setup(ctx, proc_ctx);
hsw_veb_state_command(ctx, proc_ctx);
hsw_veb_dndi_iecp_command(ctx, proc_ctx);
intel_batchbuffer_end_atomic(proc_ctx->batch);
intel_batchbuffer_flush(proc_ctx->batch);
hsw_veb_surface_unreference(ctx, proc_ctx);
if(proc_ctx->is_first_frame)
proc_ctx->is_first_frame = 0;
return va_status;
}
void gen75_vebox_context_destroy(VADriverContextP ctx,
struct intel_vebox_context *proc_ctx)
{
int i;
/* release vebox pipeline surface */
for(i = 0; i < FRAME_STORE_SUM; i ++) {
if(proc_ctx->frame_store[i].is_internal_surface){
dri_bo_unreference(proc_ctx->frame_store[i].bo);
}
proc_ctx->frame_store[i].surface_id = -1;
proc_ctx->frame_store[i].bo = NULL;
}
/* release dndi state table */
dri_bo_unreference(proc_ctx->dndi_state_table.bo);
proc_ctx->dndi_state_table.bo = NULL;
/* release iecp state table */
dri_bo_unreference(proc_ctx->iecp_state_table.bo);
proc_ctx->dndi_state_table.bo = NULL;
intel_batchbuffer_free(proc_ctx->batch);
free(proc_ctx);
}
struct intel_vebox_context * gen75_vebox_context_init(VADriverContextP ctx)
{
struct intel_driver_data *intel = intel_driver_data(ctx);
struct intel_vebox_context *proc_context = calloc(1, sizeof(struct intel_vebox_context));
proc_context->batch = intel_batchbuffer_new(intel, I915_EXEC_VEBOX, 0);
memset(proc_context->frame_store, 0, sizeof(VEBFrameStore)*FRAME_STORE_SUM);
proc_context->filters_mask = 0;
proc_context->is_first_frame = 1;
proc_context->filters_mask = 0;
return proc_context;
}