mirror of
https://github.com/starr-dusT/yuzu-mainline
synced 2024-03-05 21:12:25 -08:00
f43995ec53
Operations done before the main half float operation (like HAdd) were managing a packed value instead of the unpacked one. Adding an unpacked operation allows us to drop the per-operand MetaHalfArithmetic entry, simplifying the code overall.
73 lines
2.9 KiB
C++
73 lines
2.9 KiB
C++
// Copyright 2018 yuzu Emulator Project
|
|
// Licensed under GPLv2 or any later version
|
|
// Refer to the license.txt file included.
|
|
|
|
#include <tuple>
|
|
|
|
#include "common/assert.h"
|
|
#include "common/common_types.h"
|
|
#include "video_core/engines/shader_bytecode.h"
|
|
#include "video_core/shader/shader_ir.h"
|
|
|
|
namespace VideoCommon::Shader {
|
|
|
|
using Tegra::Shader::HalfPrecision;
|
|
using Tegra::Shader::HalfType;
|
|
using Tegra::Shader::Instruction;
|
|
using Tegra::Shader::OpCode;
|
|
|
|
/// Decodes the HFMA2 (half float fused multiply-add) instruction stored at program_code[pc].
///
/// Operand A is always read from gpr8. Operands B and C are picked according to the opcode
/// variant (CR, RC, RR or IMM_R), unpacked with their half type and optionally negated. The
/// resulting HFma operation is merged with the current contents of gpr0 and written back to
/// gpr0 through bb.
///
/// @param bb Node block passed to SetRegister for the destination register write.
/// @param pc Index into program_code of the instruction to decode.
/// @return pc, unchanged.
u32 ShaderIR::DecodeHfma2(NodeBlock& bb, u32 pc) {
    // Layout: {saturate, type of B, packed B, type of C, packed C}
    using OperandSet = std::tuple<bool, HalfType, Node, HalfType, Node>;

    const Instruction instr = {program_code[pc]};
    const auto opcode = OpCode::Decode(instr);
    const auto opcode_id = opcode->get().GetId();

    // The RR variant reads its precision from the rr sub-layout; every other variant uses the
    // common field. Only HalfPrecision::None is handled.
    if (opcode_id != OpCode::Id::HFMA2_RR) {
        UNIMPLEMENTED_IF(instr.hfma2.precision != HalfPrecision::None);
    } else {
        UNIMPLEMENTED_IF(instr.hfma2.rr.precision != HalfPrecision::None);
    }

    // Negation flags are filled in by the selector below; a variant that does not set one
    // leaves it false.
    bool neg_b = false;
    bool neg_c = false;

    const auto select_operands = [&]() -> OperandSet {
        constexpr auto identity = HalfType::H0_H1;

        switch (opcode_id) {
        case OpCode::Id::HFMA2_CR:
            // B comes from the constant buffer, C from gpr39.
            neg_b = instr.hfma2.negate_b;
            neg_c = instr.hfma2.negate_c;
            return {instr.hfma2.saturate, instr.hfma2.type_b,
                    GetConstBuffer(instr.cbuf34.index, instr.cbuf34.GetOffset()),
                    instr.hfma2.type_reg39, GetRegister(instr.gpr39)};
        case OpCode::Id::HFMA2_RC:
            // B comes from gpr39, C from the constant buffer.
            neg_b = instr.hfma2.negate_b;
            neg_c = instr.hfma2.negate_c;
            return {instr.hfma2.saturate, instr.hfma2.type_reg39, GetRegister(instr.gpr39),
                    instr.hfma2.type_b,
                    GetConstBuffer(instr.cbuf34.index, instr.cbuf34.GetOffset())};
        case OpCode::Id::HFMA2_RR:
            // B comes from gpr20, C from gpr39; flags live in the rr sub-layout.
            neg_b = instr.hfma2.rr.negate_b;
            neg_c = instr.hfma2.rr.negate_c;
            return {instr.hfma2.rr.saturate, instr.hfma2.type_b, GetRegister(instr.gpr20),
                    instr.hfma2.rr.type_c, GetRegister(instr.gpr39)};
        case OpCode::Id::HFMA2_IMM_R:
            // B is the half immediate, C comes from gpr39. Only C can be negated here.
            neg_c = instr.hfma2.negate_c;
            return {instr.hfma2.saturate, identity, UnpackHalfImmediate(instr, true),
                    instr.hfma2.type_reg39, GetRegister(instr.gpr39)};
        default:
            // Any other opcode id falls back to zero immediates for both operands.
            return {false, identity, Immediate(0), identity, Immediate(0)};
        }
    };

    const auto [saturate, type_b, packed_b, type_c, packed_c] = select_operands();
    UNIMPLEMENTED_IF_MSG(saturate, "HFMA2 saturation is not implemented");

    // Unpack each operand first so that negation is applied to the unpacked value.
    const Node operand_a = UnpackHalfFloat(GetRegister(instr.gpr8), instr.hfma2.type_a);
    const Node operand_b = GetOperandAbsNegHalf(UnpackHalfFloat(packed_b, type_b), false, neg_b);
    const Node operand_c = GetOperandAbsNegHalf(UnpackHalfFloat(packed_c, type_c), false, neg_c);

    Node fma = Operation(OperationCode::HFma, PRECISE, operand_a, operand_b, operand_c);
    Node merged = HalfMerge(GetRegister(instr.gpr0), fma, instr.hfma2.merge);
    SetRegister(bb, instr.gpr0, merged);

    return pc;
}
|
|
|
|
} // namespace VideoCommon::Shader
|