mirror of
				https://git.suyu.dev/suyu/suyu.git
				synced 2025-10-25 03:46:43 +08:00 
			
		
		
		
	shader_ir/warp: Implement FSWZADD
This commit is contained in:
		
							parent
							
								
									08b2b1080a
								
							
						
					
					
						commit
						56e237d1f9
					
				| @ -615,6 +615,14 @@ union Instruction { | |||||||
|         BitField<34, 13, u64> mask_imm; |         BitField<34, 13, u64> mask_imm; | ||||||
|     } shfl; |     } shfl; | ||||||
| 
 | 
 | ||||||
|  |     union { | ||||||
|  |         BitField<44, 1, u64> ftz; | ||||||
|  |         BitField<39, 2, u64> tab5cb8_2; | ||||||
|  |         BitField<38, 1, u64> ndv; | ||||||
|  |         BitField<47, 1, u64> cc; | ||||||
|  |         BitField<28, 8, u64> swizzle; | ||||||
|  |     } fswzadd; | ||||||
|  | 
 | ||||||
|     union { |     union { | ||||||
|         BitField<8, 8, Register> gpr; |         BitField<8, 8, Register> gpr; | ||||||
|         BitField<20, 24, s64> offset; |         BitField<20, 24, s64> offset; | ||||||
| @ -1590,6 +1598,7 @@ public: | |||||||
|         DEPBAR, |         DEPBAR, | ||||||
|         VOTE, |         VOTE, | ||||||
|         SHFL, |         SHFL, | ||||||
|  |         FSWZADD, | ||||||
|         BFE_C, |         BFE_C, | ||||||
|         BFE_R, |         BFE_R, | ||||||
|         BFE_IMM, |         BFE_IMM, | ||||||
| @ -1888,6 +1897,7 @@ private: | |||||||
|             INST("1111000011110---", Id::DEPBAR, Type::Synch, "DEPBAR"), |             INST("1111000011110---", Id::DEPBAR, Type::Synch, "DEPBAR"), | ||||||
|             INST("0101000011011---", Id::VOTE, Type::Warp, "VOTE"), |             INST("0101000011011---", Id::VOTE, Type::Warp, "VOTE"), | ||||||
|             INST("1110111100010---", Id::SHFL, Type::Warp, "SHFL"), |             INST("1110111100010---", Id::SHFL, Type::Warp, "SHFL"), | ||||||
|  |             INST("0101000011111---", Id::FSWZADD, Type::Warp, "FSWZADD"), | ||||||
|             INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"), |             INST("1110111111011---", Id::LD_A, Type::Memory, "LD_A"), | ||||||
|             INST("1110111101001---", Id::LD_S, Type::Memory, "LD_S"), |             INST("1110111101001---", Id::LD_S, Type::Memory, "LD_S"), | ||||||
|             INST("1110111101000---", Id::LD_L, Type::Memory, "LD_L"), |             INST("1110111101000---", Id::LD_L, Type::Memory, "LD_L"), | ||||||
|  | |||||||
| @ -1379,6 +1379,20 @@ private: | |||||||
|         return GenerateUnary(operation, "float", Type::Float, type); |         return GenerateUnary(operation, "float", Type::Float, type); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     Expression FSwizzleAdd(Operation operation) { | ||||||
|  |         const std::string op_a = VisitOperand(operation, 0).AsFloat(); | ||||||
|  |         const std::string op_b = VisitOperand(operation, 1).AsFloat(); | ||||||
|  |         const std::string instr_mask = VisitOperand(operation, 2).AsUint(); | ||||||
|  | 
 | ||||||
|  |         const std::string mask = code.GenerateTemporary(); | ||||||
|  |         code.AddLine("uint {} = {} >> ((gl_SubGroupInvocationARB & 3) << 1);", mask, instr_mask); | ||||||
|  | 
 | ||||||
|  |         const std::string modifier_a = fmt::format("fswzadd_modifiers_a[{} & 3]", mask); | ||||||
|  |         const std::string modifier_b = fmt::format("fswzadd_modifiers_b[{} & 3]", mask); | ||||||
|  |         return {fmt::format("(({} * {}) + ({} * {}))", op_a, modifier_a, op_b, modifier_b), | ||||||
|  |                 Type::Float}; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|     Expression ICastFloat(Operation operation) { |     Expression ICastFloat(Operation operation) { | ||||||
|         return GenerateUnary(operation, "int", Type::Int, Type::Float); |         return GenerateUnary(operation, "int", Type::Int, Type::Float); | ||||||
|     } |     } | ||||||
| @ -1991,6 +2005,7 @@ private: | |||||||
|         &GLSLDecompiler::FTrunc, |         &GLSLDecompiler::FTrunc, | ||||||
|         &GLSLDecompiler::FCastInteger<Type::Int>, |         &GLSLDecompiler::FCastInteger<Type::Int>, | ||||||
|         &GLSLDecompiler::FCastInteger<Type::Uint>, |         &GLSLDecompiler::FCastInteger<Type::Uint>, | ||||||
|  |         &GLSLDecompiler::FSwizzleAdd, | ||||||
| 
 | 
 | ||||||
|         &GLSLDecompiler::Add<Type::Int>, |         &GLSLDecompiler::Add<Type::Int>, | ||||||
|         &GLSLDecompiler::Mul<Type::Int>, |         &GLSLDecompiler::Mul<Type::Int>, | ||||||
| @ -2460,6 +2475,9 @@ bvec2 HalfFloatNanComparison(bvec2 comparison, vec2 pair1, vec2 pair2) { | |||||||
|     bvec2 is_nan2 = isnan(pair2); |     bvec2 is_nan2 = isnan(pair2); | ||||||
|     return bvec2(comparison.x || is_nan1.x || is_nan2.x, comparison.y || is_nan1.y || is_nan2.y); |     return bvec2(comparison.x || is_nan1.x || is_nan2.x, comparison.y || is_nan1.y || is_nan2.y); | ||||||
| } | } | ||||||
|  | 
 | ||||||
|  | const float fswzadd_modifiers_a[] = float[4](-1.0f,  1.0f, -1.0f,  0.0f ); | ||||||
|  | const float fswzadd_modifiers_b[] = float[4](-1.0f, -1.0f,  1.0f, -1.0f ); | ||||||
| )"; | )"; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | |||||||
| @ -783,6 +783,11 @@ private: | |||||||
|         return {}; |         return {}; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     Id FSwizzleAdd(Operation operation) { | ||||||
|  |         UNIMPLEMENTED(); | ||||||
|  |         return {}; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|     Id HNegate(Operation operation) { |     Id HNegate(Operation operation) { | ||||||
|         UNIMPLEMENTED(); |         UNIMPLEMENTED(); | ||||||
|         return {}; |         return {}; | ||||||
| @ -1363,6 +1368,7 @@ private: | |||||||
|         &SPIRVDecompiler::Unary<&Module::OpTrunc, Type::Float>, |         &SPIRVDecompiler::Unary<&Module::OpTrunc, Type::Float>, | ||||||
|         &SPIRVDecompiler::Unary<&Module::OpConvertSToF, Type::Float, Type::Int>, |         &SPIRVDecompiler::Unary<&Module::OpConvertSToF, Type::Float, Type::Int>, | ||||||
|         &SPIRVDecompiler::Unary<&Module::OpConvertUToF, Type::Float, Type::Uint>, |         &SPIRVDecompiler::Unary<&Module::OpConvertUToF, Type::Float, Type::Uint>, | ||||||
|  |         &SPIRVDecompiler::FSwizzleAdd, | ||||||
| 
 | 
 | ||||||
|         &SPIRVDecompiler::Binary<&Module::OpIAdd, Type::Int>, |         &SPIRVDecompiler::Binary<&Module::OpIAdd, Type::Int>, | ||||||
|         &SPIRVDecompiler::Binary<&Module::OpIMul, Type::Int>, |         &SPIRVDecompiler::Binary<&Module::OpIMul, Type::Int>, | ||||||
|  | |||||||
| @ -94,6 +94,15 @@ u32 ShaderIR::DecodeWarp(NodeBlock& bb, u32 pc) { | |||||||
|             Operation(OperationCode::ShuffleIndexed, GetRegister(instr.gpr8), src_thread_id)); |             Operation(OperationCode::ShuffleIndexed, GetRegister(instr.gpr8), src_thread_id)); | ||||||
|         break; |         break; | ||||||
|     } |     } | ||||||
|  |     case OpCode::Id::FSWZADD: { | ||||||
|  |         UNIMPLEMENTED_IF(instr.fswzadd.ndv); | ||||||
|  | 
 | ||||||
|  |         Node op_a = GetRegister(instr.gpr8); | ||||||
|  |         Node op_b = GetRegister(instr.gpr20); | ||||||
|  |         Node mask = Immediate(static_cast<u32>(instr.fswzadd.swizzle)); | ||||||
|  |         SetRegister(bb, instr.gpr0, Operation(OperationCode::FSwizzleAdd, op_a, op_b, mask)); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|     default: |     default: | ||||||
|         UNIMPLEMENTED_MSG("Unhandled warp instruction: {}", opcode->get().GetName()); |         UNIMPLEMENTED_MSG("Unhandled warp instruction: {}", opcode->get().GetName()); | ||||||
|         break; |         break; | ||||||
|  | |||||||
| @ -47,6 +47,7 @@ enum class OperationCode { | |||||||
|     FTrunc,        /// (MetaArithmetic, float a) -> float
 |     FTrunc,        /// (MetaArithmetic, float a) -> float
 | ||||||
|     FCastInteger,  /// (MetaArithmetic, int a) -> float
 |     FCastInteger,  /// (MetaArithmetic, int a) -> float
 | ||||||
|     FCastUInteger, /// (MetaArithmetic, uint a) -> float
 |     FCastUInteger, /// (MetaArithmetic, uint a) -> float
 | ||||||
|  |     FSwizzleAdd,   /// (float a, float b, uint mask) -> float
 | ||||||
| 
 | 
 | ||||||
|     IAdd,                  /// (MetaArithmetic, int a, int b) -> int
 |     IAdd,                  /// (MetaArithmetic, int a, int b) -> int
 | ||||||
|     IMul,                  /// (MetaArithmetic, int a, int b) -> int
 |     IMul,                  /// (MetaArithmetic, int a, int b) -> int
 | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user