mirror of
https://github.com/tiagovignatti/intel-gpu-tools.git
synced 2025-06-08 16:36:14 +00:00
For posterity, I've squashed these commits against Damien's request. rendercopy/gen8: Fix the include guards rendercopy/gen8: Update the 3DSTATE_MULTISAMPLE opcode The opcode has changed in BDW. rendercopy/gen8: Add the VF_TOPOLOGY state The primitive type has moved out of the 3DPRIMITIVE to its own state, VF_TOPOLOGY. rendercopy/gen8: Fixup 3STATE_PS Update the state to the latest BSpec, in particular the thread count was using a wrong shift and we were missing kernel2 offset. rendercopy/gen8: Update 3DSTATE_BASE_ADDRESS This state has seen its fields moved around a bit, follow the BSpec. rendercopy/gen8: Allocate 64 VUEs The simulator screams at us if we try to allocate less than that. rendercopy/gen8: Surface states have to be 64 bytes a aligned rendercopy/gen8: Vertical/horizontal align 2 does not exist any more So set them to 4. This should not matter with rendercopy (which is not using compressed textures), but it makes the simulator moan. rendercopy/gen8: Make sure the vertex buffer is 8 bytes aligned rendercopy/gen8: Adjust 3DSTATE_VERTEX_BUFFERS for gen8 The address of the buffer is now on 48 bits. Also the size was computed as offset + size where the field is really the size of the buffer itself, not the end address. rendercopy/gen8: Update the SF/SBE states for gen8 gen8 has a few changes around those states and a new ones RASTER and SBE_SWIZ. rendercopy/gen8: Add the PS_EXTRA and PS_BLEND states rendercopy/gen8: Fix building with DEBUG_RENDERCOPY defined The forward declaration was missing the final ';'. Let's move the whole function at the top instead. rendercopy/gen8: Update the PS and CONSTANT_PS states rendercopy/gen8: Fix the red channel selection Make it output red. rendercopy/gen8: Update the write -1 shader With the latest assembler changes from Haihao. rendercopy/gen8: Remove blit.g8a There is no diff between this file and blig.g7a. Remove it. rendercopy/gen8: Fix the surface relocation offset The surface base address is now at dwords 8/9 so the relocation has to mirror the change. rendercopy/gen8: Add the VF_INSTANCING state Should work without, but doesn't hurt to add it. rendercopy/gen8: Set the Attribule enable field in PS_EXTRA When the SF is set up to output some attributes, the pixel shader also have to be told there's attributes to care about. rendercopy/gen8: Set the force bits to read URB offset/length If we want to override the URB offset/length in the SBE state itself, we need to set the force bits on (new in gen8) Signed-off-by: Damien Lespiau <damien.lespiau@intel.com> Acked-by: Kenneth Graunke <kenneth@whitecape.org> Signed-off-by: Ben Widawsky <ben@bwidawsk.net>
327 lines
8.4 KiB
C
327 lines
8.4 KiB
C
#ifndef GEN8_RENDER_H
|
|
#define GEN8_RENDER_H
|
|
|
|
#include "gen6_render.h"
|
|
|
|
#define GEN7_3DSTATE_URB_VS (0x7830 << 16)
|
|
#define GEN7_3DSTATE_URB_HS (0x7831 << 16)
|
|
#define GEN7_3DSTATE_URB_DS (0x7832 << 16)
|
|
#define GEN7_3DSTATE_URB_GS (0x7833 << 16)
|
|
|
|
#define GEN6_3DSTATE_SCISSOR_STATE_POINTERS GEN6_3D(3, 0, 0xf)
|
|
#define GEN7_3DSTATE_CLEAR_PARAMS GEN6_3D(3, 0, 0x04)
|
|
#define GEN7_3DSTATE_DEPTH_BUFFER GEN6_3D(3, 0, 0x05)
|
|
#define GEN7_3DSTATE_STENCIL_BUFFER GEN6_3D(3, 0, 0x06)
|
|
#define GEN7_3DSTATE_HIER_DEPTH_BUFFER GEN6_3D(3, 0, 0x07)
|
|
#define GEN8_3DSTATE_MULTISAMPLE GEN6_3D(3, 0, 0x0d)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER (0 << 4)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_UPPER_LEFT (1 << 4)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_NUMSAMPLES_1 (0 << 1)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_NUMSAMPLES_2 (1 << 1)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_NUMSAMPLES_4 (2 << 1)
|
|
# define GEN8_3DSTATE_MULTISAMPLE_NUMSAMPLES_8 (3 << 1)
|
|
# define GEN9_3DSTATE_MULTISAMPLE_NUMSAMPLES_16 (4 << 1)
|
|
|
|
#define GEN8_3DSTATE_VF_INSTANCING GEN6_3D(3, 0, 0x49)
|
|
#define GEN7_3DSTATE_GS GEN6_3D(3, 0, 0x11)
|
|
#define GEN7_3DSTATE_CONSTANT_GS GEN6_3D(3, 0, 0x16)
|
|
#define GEN7_3DSTATE_CONSTANT_HS GEN6_3D(3, 0, 0x19)
|
|
#define GEN7_3DSTATE_CONSTANT_DS GEN6_3D(3, 0, 0x1a)
|
|
#define GEN7_3DSTATE_HS GEN6_3D(3, 0, 0x1b)
|
|
#define GEN7_3DSTATE_TE GEN6_3D(3, 0, 0x1c)
|
|
#define GEN7_3DSTATE_DS GEN6_3D(3, 0, 0x1d)
|
|
#define GEN7_3DSTATE_STREAMOUT GEN6_3D(3, 0, 0x1e)
|
|
#define GEN7_3DSTATE_SBE GEN6_3D(3, 0, 0x1f)
|
|
# define GEN8_SBE_FORCE_URB_ENTRY_READ_LENGTH (1 << 29)
|
|
# define GEN8_SBE_FORCE_URB_ENTRY_READ_OFFSET (1 << 28)
|
|
# define GEN7_SBE_NUM_OUTPUTS_SHIFT 22
|
|
# define GEN7_SBE_URB_ENTRY_READ_LENGTH_SHIFT 11
|
|
# define GEN8_SBE_URB_ENTRY_READ_OFFSET_SHIFT 5
|
|
#define GEN8_3DSTATE_SBE_SWIZ GEN6_3D(3, 0, 0x51)
|
|
#define GEN8_3DSTATE_RASTER GEN6_3D(3, 0, 0x50)
|
|
# define GEN8_RASTER_FRONT_WINDING_CCW (1 << 21)
|
|
# define GEN8_RASTER_CULL_NONE (1 << 16)
|
|
#define GEN7_3DSTATE_PS GEN6_3D(3, 0, 0x20)
|
|
#define GEN7_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP \
|
|
GEN6_3D(3, 0, 0x21)
|
|
#define GEN8_3DSTATE_PS_BLEND GEN6_3D(3, 0, 0x4d)
|
|
# define GEN8_PS_BLEND_HAS_WRITEABLE_RT (1 << 30)
|
|
#define GEN8_3DSTATE_PS_EXTRA GEN6_3D(3,0, 0x4f)
|
|
# define GEN8_PSX_PIXEL_SHADER_VALID (1 << 31)
|
|
# define GEN8_PSX_ATTRIBUTE_ENABLE (1 << 8)
|
|
|
|
#define GEN7_3DSTATE_VIEWPORT_STATE_POINTERS_CC GEN6_3D(3, 0, 0x23)
|
|
#define GEN7_3DSTATE_BLEND_STATE_POINTERS GEN6_3D(3, 0, 0x24)
|
|
#define GEN7_3DSTATE_DS_STATE_POINTERS GEN6_3D(3, 0, 0x25)
|
|
#define GEN7_3DSTATE_BINDING_TABLE_POINTERS_VS GEN6_3D(3, 0, 0x26)
|
|
#define GEN7_3DSTATE_BINDING_TABLE_POINTERS_HS GEN6_3D(3, 0, 0x27)
|
|
#define GEN7_3DSTATE_BINDING_TABLE_POINTERS_DS GEN6_3D(3, 0, 0x28)
|
|
#define GEN7_3DSTATE_BINDING_TABLE_POINTERS_GS GEN6_3D(3, 0, 0x29)
|
|
#define GEN7_3DSTATE_BINDING_TABLE_POINTERS_PS GEN6_3D(3, 0, 0x2a)
|
|
|
|
#define GEN7_3DSTATE_SAMPLER_STATE_POINTERS_VS GEN6_3D(3, 0, 0x2b)
|
|
#define GEN7_3DSTATE_SAMPLER_STATE_POINTERS_HS GEN6_3D(3, 0, 0x2c)
|
|
#define GEN7_3DSTATE_SAMPLER_STATE_POINTERS_DS GEN6_3D(3, 0, 0x2d)
|
|
#define GEN7_3DSTATE_SAMPLER_STATE_POINTERS_GS GEN6_3D(3, 0, 0x2e)
|
|
#define GEN7_3DSTATE_SAMPLER_STATE_POINTERS_PS GEN6_3D(3, 0, 0x2f)
|
|
|
|
#define GEN8_3DSTATE_VF_TOPOLOGY GEN6_3D(3, 0, 0x4b)
|
|
|
|
#define GEN7_3DSTATE_PUSH_CONSTANT_ALLOC_VS GEN6_3D(3, 1, 0x12)
|
|
#define GEN7_3DSTATE_PUSH_CONSTANT_ALLOC_HS GEN6_3D(3, 1, 0x13)
|
|
#define GEN7_3DSTATE_PUSH_CONSTANT_ALLOC_DS GEN6_3D(3, 1, 0x14)
|
|
#define GEN7_3DSTATE_PUSH_CONSTANT_ALLOC_GS GEN6_3D(3, 1, 0x15)
|
|
#define GEN7_3DSTATE_PUSH_CONSTANT_ALLOC_PS GEN6_3D(3, 1, 0x16)
|
|
|
|
/* Some random bits that we care about */
|
|
#define GEN7_VB0_BUFFER_ADDR_MOD_EN (1 << 14)
|
|
#define GEN7_3DSTATE_PS_PERSPECTIVE_PIXEL_BARYCENTRIC (1 << 11)
|
|
#define GEN7_3DSTATE_PS_ATTRIBUTE_ENABLED (1 << 10)
|
|
|
|
/* Random shifts */
|
|
#define GEN8_3DSTATE_PS_MAX_THREADS_SHIFT 23
|
|
|
|
/* Shamelessly ripped from mesa */
|
|
struct gen8_surface_state
|
|
{
|
|
struct {
|
|
uint32_t cube_pos_z:1;
|
|
uint32_t cube_neg_z:1;
|
|
uint32_t cube_pos_y:1;
|
|
uint32_t cube_neg_y:1;
|
|
uint32_t cube_pos_x:1;
|
|
uint32_t cube_neg_x:1;
|
|
uint32_t media_boundary_pixel_mode:2;
|
|
uint32_t render_cache_read_write:1;
|
|
uint32_t smapler_l2_bypass:1;
|
|
uint32_t vert_line_stride_ofs:1;
|
|
uint32_t vert_line_stride:1;
|
|
uint32_t tiled_mode:2;
|
|
uint32_t horizontal_alignment:2;
|
|
uint32_t vertical_alignment:2;
|
|
uint32_t surface_format:9; /**< BRW_SURFACEFORMAT_x */
|
|
uint32_t pad0:1;
|
|
uint32_t is_array:1;
|
|
uint32_t surface_type:3; /**< BRW_SURFACE_1D/2D/3D/CUBE */
|
|
} ss0;
|
|
|
|
struct {
|
|
uint32_t qpitch:15;
|
|
uint32_t pad1:4;
|
|
uint32_t base_mip_level:5;
|
|
uint32_t memory_object_control:7;
|
|
uint32_t pad0:1;
|
|
} ss1;
|
|
|
|
struct {
|
|
uint32_t width:14;
|
|
uint32_t pad1:2;
|
|
uint32_t height:14;
|
|
uint32_t pad0:2;
|
|
} ss2;
|
|
|
|
struct {
|
|
uint32_t pitch:18;
|
|
uint32_t pad:3;
|
|
uint32_t depth:11;
|
|
} ss3;
|
|
|
|
struct {
|
|
uint32_t minimum_array_element:27;
|
|
uint32_t pad0:5;
|
|
} ss4;
|
|
|
|
struct {
|
|
uint32_t mip_count:4;
|
|
uint32_t min_lod:4;
|
|
uint32_t pad3:6;
|
|
uint32_t coherency_type:1;
|
|
uint32_t pad2:5;
|
|
uint32_t ewa_disable_for_cube:1;
|
|
uint32_t y_offset:3;
|
|
uint32_t pad0:1;
|
|
uint32_t x_offset:7;
|
|
} ss5;
|
|
|
|
struct {
|
|
uint32_t pad; /* Multisample Control Surface stuff */
|
|
} ss6;
|
|
|
|
struct {
|
|
uint32_t resource_min_lod:12;
|
|
|
|
/* Only on Haswell */
|
|
uint32_t pad0:4;
|
|
uint32_t shader_chanel_select_a:3;
|
|
uint32_t shader_chanel_select_b:3;
|
|
uint32_t shader_chanel_select_g:3;
|
|
uint32_t shader_chanel_select_r:3;
|
|
|
|
uint32_t alpha_clear_color:1;
|
|
uint32_t blue_clear_color:1;
|
|
uint32_t green_clear_color:1;
|
|
uint32_t red_clear_color:1;
|
|
} ss7;
|
|
|
|
struct {
|
|
uint32_t base_addr;
|
|
} ss8;
|
|
|
|
struct {
|
|
uint32_t base_addr_hi:16;
|
|
uint32_t pad0:16;
|
|
} ss9;
|
|
|
|
struct {
|
|
uint32_t pad0:12;
|
|
uint32_t aux_base_addr:20;
|
|
} ss10;
|
|
|
|
struct {
|
|
uint32_t aux_base_addr_hi:16;
|
|
uint32_t pad:16;
|
|
} ss11;
|
|
|
|
struct {
|
|
uint32_t hiz_depth_clear_value;
|
|
} ss12;
|
|
|
|
struct {
|
|
uint32_t reserved;
|
|
} ss13;
|
|
|
|
struct {
|
|
uint32_t reserved;
|
|
} ss14;
|
|
|
|
struct {
|
|
uint32_t reserved;
|
|
} ss15;
|
|
};
|
|
|
|
struct gen8_sampler_state
|
|
{
|
|
struct
|
|
{
|
|
uint32_t aniso_algorithm:1;
|
|
uint32_t lod_bias:13;
|
|
uint32_t min_filter:3;
|
|
uint32_t mag_filter:3;
|
|
uint32_t mip_filter:2;
|
|
uint32_t base_level:5;
|
|
uint32_t lod_preclamp:2;
|
|
uint32_t default_color_mode:1;
|
|
uint32_t pad0:1;
|
|
uint32_t disable:1;
|
|
} ss0;
|
|
|
|
struct
|
|
{
|
|
uint32_t cube_control_mode:1;
|
|
uint32_t shadow_function:3;
|
|
uint32_t chromakey_mode:1;
|
|
uint32_t chromakey_index:2;
|
|
uint32_t chromakey_enable:1;
|
|
uint32_t max_lod:12;
|
|
uint32_t min_lod:12;
|
|
} ss1;
|
|
|
|
struct
|
|
{
|
|
uint32_t lod_clamp_mag_mode:1;
|
|
uint32_t flexible_filter_valign:1;
|
|
uint32_t flexible_filter_halign:1;
|
|
uint32_t flexible_filter_coeff_size:1;
|
|
uint32_t flexible_filter_mode:1;
|
|
uint32_t pad1:1;
|
|
uint32_t indirect_state_ptr:18;
|
|
uint32_t pad0:2;
|
|
uint32_t sep_filter_height:2;
|
|
uint32_t sep_filter_width:2;
|
|
uint32_t sep_filter_coeff_table_size:2;
|
|
} ss2;
|
|
|
|
struct
|
|
{
|
|
uint32_t r_wrap_mode:3;
|
|
uint32_t t_wrap_mode:3;
|
|
uint32_t s_wrap_mode:3;
|
|
uint32_t pad:1;
|
|
uint32_t non_normalized_coord:1;
|
|
uint32_t trilinear_quality:2;
|
|
uint32_t address_round:6;
|
|
uint32_t max_aniso:3;
|
|
uint32_t pad0:2;
|
|
uint32_t non_sep_filter_footprint_mask:8;
|
|
} ss3;
|
|
};
|
|
|
|
struct gen8_blend_state {
|
|
struct {
|
|
uint32_t pad0:19;
|
|
uint32_t y_dither_offset:2;
|
|
uint32_t x_dither_offset:2;
|
|
uint32_t dither_enable:1;
|
|
uint32_t alpha_test_func:3;
|
|
uint32_t alpha_test:1;
|
|
uint32_t alpha_to_coverage_dither:1;
|
|
uint32_t alpha_to_one:1;
|
|
uint32_t ia_blend:1;
|
|
uint32_t alpha_to_coverage:1;
|
|
} bs0;
|
|
|
|
struct {
|
|
uint64_t write_disable_blue:1;
|
|
uint64_t write_disable_green:1;
|
|
uint64_t write_disable_red:1;
|
|
uint64_t write_disable_alpha:1;
|
|
uint64_t pad1:1;
|
|
uint64_t alpha_blend_func:3;
|
|
uint64_t dest_alpha_blend_factor:5;
|
|
uint64_t source_alpha_blend_factor:5;
|
|
uint64_t color_blend_func:3;
|
|
uint64_t dest_blend_factor:5;
|
|
uint64_t source_blend_factor:5;
|
|
uint64_t color_buffer_blend:1;
|
|
uint64_t post_blend_color_clamp:1;
|
|
uint64_t pre_blend_color_clamp:1;
|
|
uint64_t color_clamp_range:2;
|
|
uint64_t pre_blend_source_only_clamp:1;
|
|
uint64_t pad0:22;
|
|
uint64_t logic_op_func:4;
|
|
uint64_t logic_op_enable:1;
|
|
} bs[16];
|
|
};
|
|
|
|
struct gen7_sf_clip_viewport {
|
|
struct {
|
|
float m00;
|
|
float m11;
|
|
float m22;
|
|
float m30;
|
|
float m31;
|
|
float m32;
|
|
} viewport;
|
|
|
|
uint32_t pad0[2];
|
|
|
|
struct {
|
|
float xmin;
|
|
float xmax;
|
|
float ymin;
|
|
float ymax;
|
|
} guardband;
|
|
|
|
float pad1[4];
|
|
};
|
|
|
|
struct gen6_scissor_rect
|
|
{
|
|
uint32_t xmin:16;
|
|
uint32_t ymin:16;
|
|
uint32_t xmax:16;
|
|
uint32_t ymax:16;
|
|
};
|
|
|
|
#endif
|