|
|
|
@@ -216,18 +216,18 @@ static void transform_CEIL(struct radeon_compiler* c, |
|
|
|
rc_remove_instruction(inst); |
|
|
|
} |
|
|
|
|
|
|
|
static void transform_DP3(struct radeon_compiler* c, |
|
|
|
static void transform_DP2(struct radeon_compiler* c, |
|
|
|
struct rc_instruction* inst) |
|
|
|
{ |
|
|
|
struct rc_src_register src0 = inst->U.I.SrcReg[0]; |
|
|
|
struct rc_src_register src1 = inst->U.I.SrcReg[1]; |
|
|
|
src0.Negate &= ~RC_MASK_W; |
|
|
|
src0.Swizzle &= ~(7 << (3 * 3)); |
|
|
|
src0.Swizzle |= RC_SWIZZLE_ZERO << (3 * 3); |
|
|
|
src1.Negate &= ~RC_MASK_W; |
|
|
|
src1.Swizzle &= ~(7 << (3 * 3)); |
|
|
|
src1.Swizzle |= RC_SWIZZLE_ZERO << (3 * 3); |
|
|
|
emit2(c, inst->Prev, RC_OPCODE_DP4, inst->U.I.SaturateMode, inst->U.I.DstReg, src0, src1); |
|
|
|
src0.Negate &= ~(RC_MASK_Z | RC_MASK_W); |
|
|
|
src0.Swizzle &= ~(63 << (3 * 2)); |
|
|
|
src0.Swizzle |= (RC_SWIZZLE_ZERO << (3 * 2)) | (RC_SWIZZLE_ZERO << (3 * 3)); |
|
|
|
src1.Negate &= ~(RC_MASK_Z | RC_MASK_W); |
|
|
|
src1.Swizzle &= ~(63 << (3 * 2)); |
|
|
|
src1.Swizzle |= (RC_SWIZZLE_ZERO << (3 * 2)) | (RC_SWIZZLE_ZERO << (3 * 3)); |
|
|
|
emit2(c, inst->Prev, RC_OPCODE_DP3, inst->U.I.SaturateMode, inst->U.I.DstReg, src0, src1); |
|
|
|
rc_remove_instruction(inst); |
|
|
|
} |
|
|
|
|
|
|
|
@@ -553,6 +553,7 @@ int radeonTransformALU( |
|
|
|
switch(inst->U.I.Opcode) { |
|
|
|
case RC_OPCODE_ABS: transform_ABS(c, inst); return 1; |
|
|
|
case RC_OPCODE_CEIL: transform_CEIL(c, inst); return 1; |
|
|
|
case RC_OPCODE_DP2: transform_DP2(c, inst); return 1; |
|
|
|
case RC_OPCODE_DPH: transform_DPH(c, inst); return 1; |
|
|
|
case RC_OPCODE_DST: transform_DST(c, inst); return 1; |
|
|
|
case RC_OPCODE_FLR: transform_FLR(c, inst); return 1; |
|
|
|
@@ -615,6 +616,29 @@ static void transform_r300_vertex_CMP(struct radeon_compiler* c, |
|
|
|
rc_remove_instruction(inst); |
|
|
|
} |
|
|
|
|
|
|
|
static void transform_r300_vertex_DP2(struct radeon_compiler* c, |
|
|
|
struct rc_instruction* inst) |
|
|
|
{ |
|
|
|
struct rc_instruction *next_inst = inst->Next; |
|
|
|
transform_DP2(c, inst); |
|
|
|
next_inst->Prev->U.I.Opcode = RC_OPCODE_DP4; |
|
|
|
} |
|
|
|
|
|
|
|
static void transform_r300_vertex_DP3(struct radeon_compiler* c, |
|
|
|
struct rc_instruction* inst) |
|
|
|
{ |
|
|
|
struct rc_src_register src0 = inst->U.I.SrcReg[0]; |
|
|
|
struct rc_src_register src1 = inst->U.I.SrcReg[1]; |
|
|
|
src0.Negate &= ~RC_MASK_W; |
|
|
|
src0.Swizzle &= ~(7 << (3 * 3)); |
|
|
|
src0.Swizzle |= RC_SWIZZLE_ZERO << (3 * 3); |
|
|
|
src1.Negate &= ~RC_MASK_W; |
|
|
|
src1.Swizzle &= ~(7 << (3 * 3)); |
|
|
|
src1.Swizzle |= RC_SWIZZLE_ZERO << (3 * 3); |
|
|
|
emit2(c, inst->Prev, RC_OPCODE_DP4, inst->U.I.SaturateMode, inst->U.I.DstReg, src0, src1); |
|
|
|
rc_remove_instruction(inst); |
|
|
|
} |
|
|
|
|
|
|
|
static void transform_r300_vertex_fix_LIT(struct radeon_compiler* c, |
|
|
|
struct rc_instruction* inst) |
|
|
|
{ |
|
|
|
@@ -758,7 +782,8 @@ int r300_transform_vertex_alu( |
|
|
|
case RC_OPCODE_ABS: transform_r300_vertex_ABS(c, inst); return 1; |
|
|
|
case RC_OPCODE_CEIL: transform_CEIL(c, inst); return 1; |
|
|
|
case RC_OPCODE_CMP: transform_r300_vertex_CMP(c, inst); return 1; |
|
|
|
case RC_OPCODE_DP3: transform_DP3(c, inst); return 1; |
|
|
|
case RC_OPCODE_DP2: transform_r300_vertex_DP2(c, inst); return 1; |
|
|
|
case RC_OPCODE_DP3: transform_r300_vertex_DP3(c, inst); return 1; |
|
|
|
case RC_OPCODE_DPH: transform_DPH(c, inst); return 1; |
|
|
|
case RC_OPCODE_FLR: transform_FLR(c, inst); return 1; |
|
|
|
case RC_OPCODE_LIT: transform_r300_vertex_fix_LIT(c, inst); return 1; |