8 changed files with 227 additions and 31 deletions
-
2src/shader_recompiler/CMakeLists.txt
-
4src/shader_recompiler/frontend/maxwell/maxwell.inc
-
25src/shader_recompiler/frontend/maxwell/translate/impl/common_funcs.cpp
-
2src/shader_recompiler/frontend/maxwell/translate/impl/common_funcs.h
-
7src/shader_recompiler/frontend/maxwell/translate/impl/impl.h
-
77src/shader_recompiler/frontend/maxwell/translate/impl/logic_operation.cpp
-
117src/shader_recompiler/frontend/maxwell/translate/impl/logic_operation_three_input.cpp
-
24src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp
@ -0,0 +1,77 @@ |
|||||
|
// Copyright 2021 yuzu Emulator Project
|
||||
|
// Licensed under GPLv2 or any later version
|
||||
|
// Refer to the license.txt file included.
|
||||
|
|
||||
|
#include "common/bit_field.h"
|
||||
|
#include "common/common_types.h"
|
||||
|
#include "shader_recompiler/frontend/maxwell/translate/impl/common_funcs.h"
|
||||
|
#include "shader_recompiler/frontend/maxwell/translate/impl/impl.h"
|
||||
|
|
||||
|
namespace Shader::Maxwell { |
||||
|
namespace { |
||||
|
enum class LogicalOp : u64 { |
||||
|
AND, |
||||
|
OR, |
||||
|
XOR, |
||||
|
PASS_B, |
||||
|
}; |
||||
|
|
||||
|
[[nodiscard]] IR::U32 LogicalOperation(IR::IREmitter& ir, const IR::U32& operand_1, |
||||
|
const IR::U32& operand_2, LogicalOp op) { |
||||
|
switch (op) { |
||||
|
case LogicalOp::AND: |
||||
|
return ir.BitwiseAnd(operand_1, operand_2); |
||||
|
case LogicalOp::OR: |
||||
|
return ir.BitwiseOr(operand_1, operand_2); |
||||
|
case LogicalOp::XOR: |
||||
|
return ir.BitwiseXor(operand_1, operand_2); |
||||
|
case LogicalOp::PASS_B: |
||||
|
return operand_2; |
||||
|
default: |
||||
|
throw NotImplementedException("Invalid Logical operation {}", op); |
||||
|
} |
||||
|
} |
||||
|
|
||||
|
void LOP(TranslatorVisitor& v, u64 insn, IR::U32 op_b) { |
||||
|
union { |
||||
|
u64 insn; |
||||
|
BitField<0, 8, IR::Reg> dest_reg; |
||||
|
BitField<8, 8, IR::Reg> src_reg; |
||||
|
BitField<39, 1, u64> neg_a; |
||||
|
BitField<40, 1, u64> neg_b; |
||||
|
BitField<41, 2, LogicalOp> bit_op; |
||||
|
BitField<43, 1, u64> x; |
||||
|
BitField<44, 2, PredicateOp> pred_op; |
||||
|
BitField<48, 3, IR::Pred> pred; |
||||
|
} const lop{insn}; |
||||
|
|
||||
|
if (lop.x != 0) { |
||||
|
throw NotImplementedException("LOP X"); |
||||
|
} |
||||
|
IR::U32 op_a{v.X(lop.src_reg)}; |
||||
|
if (lop.neg_a != 0) { |
||||
|
op_a = v.ir.BitwiseNot(op_a); |
||||
|
} |
||||
|
if (lop.neg_b != 0) { |
||||
|
op_b = v.ir.BitwiseNot(op_b); |
||||
|
} |
||||
|
|
||||
|
const IR::U32 result{LogicalOperation(v.ir, op_a, op_b, lop.bit_op)}; |
||||
|
const IR::U1 pred_result{PredicateOperation(v.ir, result, lop.pred_op)}; |
||||
|
v.X(lop.dest_reg, result); |
||||
|
v.ir.SetPred(lop.pred, pred_result); |
||||
|
} |
||||
|
} // Anonymous namespace
|
||||
|
|
||||
|
void TranslatorVisitor::LOP_reg(u64 insn) { |
||||
|
LOP(*this, insn, GetReg20(insn)); |
||||
|
} |
||||
|
|
||||
|
void TranslatorVisitor::LOP_cbuf(u64 insn) { |
||||
|
LOP(*this, insn, GetCbuf(insn)); |
||||
|
} |
||||
|
|
||||
|
void TranslatorVisitor::LOP_imm(u64 insn) { |
||||
|
LOP(*this, insn, GetImm20(insn)); |
||||
|
} |
||||
|
} // namespace Shader::Maxwell
|
||||
@ -0,0 +1,117 @@ |
|||||
|
// Copyright 2021 yuzu Emulator Project
|
||||
|
// Licensed under GPLv2 or any later version
|
||||
|
// Refer to the license.txt file included.
|
||||
|
|
||||
|
#include "common/bit_field.h"
|
||||
|
#include "common/common_types.h"
|
||||
|
#include "shader_recompiler/frontend/maxwell/translate/impl/common_funcs.h"
|
||||
|
#include "shader_recompiler/frontend/maxwell/translate/impl/impl.h"
|
||||
|
|
||||
|
namespace Shader::Maxwell { |
||||
|
namespace { |
||||
|
// https://forums.developer.nvidia.com/t/reverse-lut-for-lop3-lut/110651
|
||||
|
// Emulate GPU's LOP3.LUT (three-input logic op with 8-bit truth table)
|
||||
|
IR::U32 ApplyLUT(IR::IREmitter& ir, const IR::U32& a, const IR::U32& b, const IR::U32& c, |
||||
|
u64 ttbl) { |
||||
|
IR::U32 r{ir.Imm32(0)}; |
||||
|
const IR::U32 not_a{ir.BitwiseNot(a)}; |
||||
|
const IR::U32 not_b{ir.BitwiseNot(b)}; |
||||
|
const IR::U32 not_c{ir.BitwiseNot(c)}; |
||||
|
if (ttbl & 0x01) { |
||||
|
// r |= ~a & ~b & ~c;
|
||||
|
const auto lhs{ir.BitwiseAnd(not_a, not_b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, not_c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x02) { |
||||
|
// r |= ~a & ~b & c;
|
||||
|
const auto lhs{ir.BitwiseAnd(not_a, not_b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x04) { |
||||
|
// r |= ~a & b & ~c;
|
||||
|
const auto lhs{ir.BitwiseAnd(not_a, b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, not_c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x08) { |
||||
|
// r |= ~a & b & c;
|
||||
|
const auto lhs{ir.BitwiseAnd(not_a, b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x10) { |
||||
|
// r |= a & ~b & ~c;
|
||||
|
const auto lhs{ir.BitwiseAnd(a, not_b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, not_c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x20) { |
||||
|
// r |= a & ~b & c;
|
||||
|
const auto lhs{ir.BitwiseAnd(a, not_b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x40) { |
||||
|
// r |= a & b & ~c;
|
||||
|
const auto lhs{ir.BitwiseAnd(a, b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, not_c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
if (ttbl & 0x80) { |
||||
|
// r |= a & b & c;
|
||||
|
const auto lhs{ir.BitwiseAnd(a, b)}; |
||||
|
const auto rhs{ir.BitwiseAnd(lhs, c)}; |
||||
|
r = ir.BitwiseOr(r, rhs); |
||||
|
} |
||||
|
return r; |
||||
|
} |
||||
|
|
||||
|
IR::U32 LOP3(TranslatorVisitor& v, u64 insn, const IR::U32& op_b, const IR::U32& op_c, u64 lut) { |
||||
|
union { |
||||
|
u64 insn; |
||||
|
BitField<0, 8, IR::Reg> dest_reg; |
||||
|
BitField<8, 8, IR::Reg> src_reg; |
||||
|
} const lop3{insn}; |
||||
|
|
||||
|
const IR::U32 op_a{v.X(lop3.src_reg)}; |
||||
|
const IR::U32 result{ApplyLUT(v.ir, op_a, op_b, op_c, lut)}; |
||||
|
v.X(lop3.dest_reg, result); |
||||
|
return result; |
||||
|
} |
||||
|
|
||||
|
u64 GetLut48(u64 insn) { |
||||
|
union { |
||||
|
u64 raw; |
||||
|
BitField<48, 8, u64> lut; |
||||
|
} const lut{insn}; |
||||
|
return lut.lut; |
||||
|
} |
||||
|
} // Anonymous namespace
|
||||
|
|
||||
|
void TranslatorVisitor::LOP3_reg(u64 insn) { |
||||
|
union { |
||||
|
u64 insn; |
||||
|
BitField<28, 8, u64> lut; |
||||
|
BitField<38, 1, u64> x; |
||||
|
BitField<36, 2, PredicateOp> pred_op; |
||||
|
BitField<48, 3, IR::Pred> pred; |
||||
|
} const lop3{insn}; |
||||
|
|
||||
|
if (lop3.x != 0) { |
||||
|
throw NotImplementedException("LOP3 X"); |
||||
|
} |
||||
|
const IR::U32 result{LOP3(*this, insn, GetReg20(insn), GetReg39(insn), lop3.lut)}; |
||||
|
const IR::U1 pred_result{PredicateOperation(ir, result, lop3.pred_op)}; |
||||
|
ir.SetPred(lop3.pred, pred_result); |
||||
|
} |
||||
|
|
||||
|
void TranslatorVisitor::LOP3_cbuf(u64 insn) { |
||||
|
LOP3(*this, insn, GetCbuf(insn), GetReg39(insn), GetLut48(insn)); |
||||
|
} |
||||
|
|
||||
|
void TranslatorVisitor::LOP3_imm(u64 insn) { |
||||
|
LOP3(*this, insn, GetImm20(insn), GetReg39(insn), GetLut48(insn)); |
||||
|
} |
||||
|
} // namespace Shader::Maxwell
|
||||
Write
Preview
Loading…
Cancel
Save
Reference in new issue