@@ -776,6 +776,7 @@ enum opcode { | |||
SHADER_OPCODE_SHADER_TIME_ADD, | |||
SHADER_OPCODE_UNTYPED_ATOMIC, | |||
SHADER_OPCODE_UNTYPED_SURFACE_READ, | |||
FS_OPCODE_DDX, | |||
FS_OPCODE_DDY, |
@@ -433,6 +433,14 @@ brw_untyped_atomic(struct brw_compile *p, | |||
GLuint msg_length, | |||
GLuint response_length); | |||
void | |||
brw_untyped_surface_read(struct brw_compile *p, | |||
struct brw_reg dest, | |||
struct brw_reg mrf, | |||
GLuint bind_table_index, | |||
GLuint msg_length, | |||
GLuint response_length); | |||
/*********************************************************************** | |||
* brw_eu_util.c: | |||
*/ |
@@ -2547,6 +2547,62 @@ brw_untyped_atomic(struct brw_compile *p, | |||
insn->header.access_mode == BRW_ALIGN_1); | |||
} | |||
static void | |||
brw_set_dp_untyped_surface_read_message(struct brw_compile *p, | |||
struct brw_instruction *insn, | |||
GLuint bind_table_index, | |||
GLuint msg_length, | |||
GLuint response_length, | |||
bool header_present) | |||
{ | |||
const unsigned dispatch_width = | |||
(insn->header.execution_size == BRW_EXECUTE_16 ? 16 : 8); | |||
const unsigned num_channels = response_length / (dispatch_width / 8); | |||
if (p->brw->is_haswell) { | |||
brw_set_message_descriptor(p, insn, HSW_SFID_DATAPORT_DATA_CACHE_1, | |||
msg_length, response_length, | |||
header_present, false); | |||
insn->bits3.gen7_dp.msg_type = HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_READ; | |||
} else { | |||
brw_set_message_descriptor(p, insn, GEN7_SFID_DATAPORT_DATA_CACHE, | |||
msg_length, response_length, | |||
header_present, false); | |||
insn->bits3.gen7_dp.msg_type = GEN7_DATAPORT_DC_UNTYPED_SURFACE_READ; | |||
} | |||
if (insn->header.access_mode == BRW_ALIGN_1) { | |||
if (dispatch_width == 16) | |||
insn->bits3.ud |= 1 << 12; /* SIMD16 mode */ | |||
else | |||
insn->bits3.ud |= 2 << 12; /* SIMD8 mode */ | |||
} | |||
insn->bits3.gen7_dp.binding_table_index = bind_table_index; | |||
/* Set mask of 32-bit channels to drop. */ | |||
insn->bits3.ud |= (0xf & (0xf << num_channels)) << 8; | |||
} | |||
void | |||
brw_untyped_surface_read(struct brw_compile *p, | |||
struct brw_reg dest, | |||
struct brw_reg mrf, | |||
GLuint bind_table_index, | |||
GLuint msg_length, | |||
GLuint response_length) | |||
{ | |||
struct brw_instruction *insn = next_insn(p, BRW_OPCODE_SEND); | |||
brw_set_dest(p, insn, retype(dest, BRW_REGISTER_TYPE_UD)); | |||
brw_set_src0(p, insn, retype(mrf, BRW_REGISTER_TYPE_UD)); | |||
brw_set_dp_untyped_surface_read_message( | |||
p, insn, bind_table_index, msg_length, response_length, | |||
insn->header.access_mode == BRW_ALIGN_1); | |||
} | |||
/** | |||
* This instruction is generated as a single-channel align1 instruction by | |||
* both the VS and FS stages when using INTEL_DEBUG=shader_time. |
@@ -773,6 +773,7 @@ fs_visitor::implied_mrf_writes(fs_inst *inst) | |||
case FS_OPCODE_SPILL: | |||
return 2; | |||
case SHADER_OPCODE_UNTYPED_ATOMIC: | |||
case SHADER_OPCODE_UNTYPED_SURFACE_READ: | |||
return 0; | |||
default: | |||
assert(!"not reached"); |
@@ -559,6 +559,10 @@ private: | |||
struct brw_reg atomic_op, | |||
struct brw_reg surf_index); | |||
void generate_untyped_surface_read(fs_inst *inst, | |||
struct brw_reg dst, | |||
struct brw_reg surf_index); | |||
void mark_surface_used(unsigned surf_index); | |||
void patch_discard_jumps_to_fb_writes(); |
@@ -1206,6 +1206,20 @@ fs_generator::generate_untyped_atomic(fs_inst *inst, struct brw_reg dst, | |||
mark_surface_used(surf_index.dw1.ud); | |||
} | |||
void | |||
fs_generator::generate_untyped_surface_read(fs_inst *inst, struct brw_reg dst, | |||
struct brw_reg surf_index) | |||
{ | |||
assert(surf_index.file == BRW_IMMEDIATE_VALUE && | |||
surf_index.type == BRW_REGISTER_TYPE_UD); | |||
brw_untyped_surface_read(p, dst, brw_message_reg(inst->base_mrf), | |||
surf_index.dw1.ud, | |||
inst->mlen, dispatch_width / 8); | |||
mark_surface_used(surf_index.dw1.ud); | |||
} | |||
void | |||
fs_generator::generate_code(exec_list *instructions) | |||
{ | |||
@@ -1609,6 +1623,10 @@ fs_generator::generate_code(exec_list *instructions) | |||
generate_untyped_atomic(inst, dst, src[0], src[1]); | |||
break; | |||
case SHADER_OPCODE_UNTYPED_SURFACE_READ: | |||
generate_untyped_surface_read(inst, dst, src[0]); | |||
break; | |||
case FS_OPCODE_SET_SIMD4X2_OFFSET: | |||
generate_set_simd4x2_offset(inst, dst, src[0]); | |||
break; |
@@ -277,6 +277,7 @@ vec4_visitor::implied_mrf_writes(vec4_instruction *inst) | |||
case SHADER_OPCODE_TG4_OFFSET: | |||
return inst->header_present ? 1 : 0; | |||
case SHADER_OPCODE_UNTYPED_ATOMIC: | |||
case SHADER_OPCODE_UNTYPED_SURFACE_READ: | |||
return 0; | |||
default: | |||
assert(!"not reached"); |
@@ -622,6 +622,10 @@ private: | |||
struct brw_reg atomic_op, | |||
struct brw_reg surf_index); | |||
void generate_untyped_surface_read(vec4_instruction *inst, | |||
struct brw_reg dst, | |||
struct brw_reg surf_index); | |||
void mark_surface_used(unsigned surf_index); | |||
struct brw_context *brw; |
@@ -872,6 +872,21 @@ vec4_generator::generate_untyped_atomic(vec4_instruction *inst, | |||
mark_surface_used(surf_index.dw1.ud); | |||
} | |||
void | |||
vec4_generator::generate_untyped_surface_read(vec4_instruction *inst, | |||
struct brw_reg dst, | |||
struct brw_reg surf_index) | |||
{ | |||
assert(surf_index.file == BRW_IMMEDIATE_VALUE && | |||
surf_index.type == BRW_REGISTER_TYPE_UD); | |||
brw_untyped_surface_read(p, dst, brw_message_reg(inst->base_mrf), | |||
surf_index.dw1.ud, | |||
inst->mlen, 1); | |||
mark_surface_used(surf_index.dw1.ud); | |||
} | |||
/** | |||
* Generate assembly for a Vec4 IR instruction. | |||
* | |||
@@ -1188,6 +1203,10 @@ vec4_generator::generate_vec4_instruction(vec4_instruction *instruction, | |||
generate_untyped_atomic(inst, dst, src[0], src[1]); | |||
break; | |||
case SHADER_OPCODE_UNTYPED_SURFACE_READ: | |||
generate_untyped_surface_read(inst, dst, src[0]); | |||
break; | |||
case VS_OPCODE_UNPACK_FLAGS_SIMD4X2: | |||
generate_unpack_flags(inst, dst); | |||
break; |