mirror of
https://git.suyu.dev/suyu/dynarmic.git
synced 2026-03-03 17:52:56 +00:00
A32: Implement ASIMD VTBX
This commit is contained in:
@@ -112,7 +112,7 @@ INST(asimd_VRSQRTE, "VRSQRTE", "111100111D11zz11dddd010
|
||||
// Miscellaneous
|
||||
INST(asimd_VEXT, "VEXT", "111100101D11nnnnddddiiiiNQM0mmmm") // ASIMD
|
||||
INST(asimd_VTBL, "VTBL", "111100111D11nnnndddd10zzN0M0mmmm") // ASIMD
|
||||
//INST(asimd_VTBX, "VTBX", "111100111D11nnnndddd10zzN1M0mmmm") // ASIMD
|
||||
INST(asimd_VTBX, "VTBX", "111100111D11nnnndddd10zzN1M0mmmm") // ASIMD
|
||||
//INST(asimd_VDUP_scalar, "VDUP (scalar)", "111100111D11iiiidddd11000QM0mmmm") // ASIMD
|
||||
|
||||
// One register and modified immediate
|
||||
|
||||
@@ -10,6 +10,31 @@
|
||||
|
||||
namespace Dynarmic::A32 {
|
||||
|
||||
// Shared translation for the two table-lookup instructions handled in this file.
//
// The table consists of `len + 1` consecutive extended registers, starting at the
// register ToVector derives from (Vn, N). The indices are read from the register
// derived from (Vm, M) and the 64-bit lookup result is written to the register
// derived from (Vd, D).
//
// `is_vtbl` picks the `defaults` operand passed to VectorTableLookup: an immediate
// zero when true, the current value of the destination register when false.
//
// Returns whatever UnpredictableInstruction() returns when
// RegNumber(first table register) + (len + 1) exceeds 32; otherwise returns true.
static bool TableLookup(ArmTranslatorVisitor& v, bool is_vtbl, bool D, size_t Vn, size_t Vd, size_t len, bool N, bool M, size_t Vm) {
    const size_t table_size = len + 1;
    const auto dest_reg = ToVector(false, Vd, D);
    const auto index_reg = ToVector(false, Vm, M);
    const auto first_table_reg = ToVector(false, Vn, N);

    // Reject encodings whose register list would run past the end of the register file.
    const bool table_overruns = RegNumber(first_table_reg) + table_size > 32;
    if (table_overruns) {
        return v.UnpredictableInstruction();
    }

    // NOTE(review): the emitter calls below are kept in their original sequence
    // (table reads, table, indices, defaults, lookup, write-back); presumably the
    // emitter appends IR in call order, so do not reorder them.
    const auto read_table_regs = [&] {
        std::vector<IR::U64> entries;
        for (size_t offset = 0; offset != table_size; ++offset) {
            entries.emplace_back(v.ir.GetExtendedRegister(first_table_reg + offset));
        }
        return entries;
    };
    const IR::Table table = v.ir.VectorTable(read_table_regs());

    const IR::U64 lookup_indices = v.ir.GetExtendedRegister(index_reg);

    const auto read_defaults = [&]() -> IR::U64 {
        if (is_vtbl) {
            return v.ir.Imm64(0);
        }
        return IR::U64{v.ir.GetExtendedRegister(dest_reg)};
    };
    const IR::U64 defaults = read_defaults();

    const IR::U64 looked_up = v.ir.VectorTableLookup(defaults, table, lookup_indices);
    v.ir.SetExtendedRegister(dest_reg, looked_up);
    return true;
}
|
||||
|
||||
bool ArmTranslatorVisitor::asimd_VEXT(bool D, size_t Vn, size_t Vd, Imm<4> imm4, bool N, bool Q, bool M, size_t Vm) {
|
||||
if (Q && (Common::Bit<0>(Vd) || Common::Bit<0>(Vn) || Common::Bit<0>(Vm))) {
|
||||
return UndefinedInstruction();
|
||||
@@ -33,28 +58,11 @@ bool ArmTranslatorVisitor::asimd_VEXT(bool D, size_t Vn, size_t Vd, Imm<4> imm4,
|
||||
}
|
||||
|
||||
bool ArmTranslatorVisitor::asimd_VTBL(bool D, size_t Vn, size_t Vd, size_t len, bool N, bool M, size_t Vm) {
|
||||
const size_t length = len + 1;
|
||||
const auto d = ToVector(false, Vd, D);
|
||||
const auto m = ToVector(false, Vm, M);
|
||||
const auto n = ToVector(false, Vn, N);
|
||||
return TableLookup(*this, true, D, Vn, Vd, len, N, M, Vm);
|
||||
}
|
||||
|
||||
if (RegNumber(n) + length > 32) {
|
||||
return UnpredictableInstruction();
|
||||
}
|
||||
|
||||
const IR::U64 table0 = ir.GetExtendedRegister(n);
|
||||
const IR::U64 table1 = length >= 2 ? IR::U64{ir.GetExtendedRegister(n + 1)} : ir.Imm64(0);
|
||||
const IR::U64 table2 = length >= 3 ? IR::U64{ir.GetExtendedRegister(n + 2)} : ir.Imm64(0);
|
||||
const IR::U64 table3 = length == 4 ? IR::U64{ir.GetExtendedRegister(n + 3)} : ir.Imm64(0);
|
||||
|
||||
const IR::Table table = ir.VectorTable(length <= 2
|
||||
? std::vector<IR::U128>{ir.Pack2x64To1x128(table0, table1)}
|
||||
: std::vector<IR::U128>{ir.Pack2x64To1x128(table0, table1), ir.Pack2x64To1x128(table2, table3)});
|
||||
const IR::U128 indicies = ir.GetVector(m);
|
||||
const IR::U128 result = ir.VectorTableLookup(ir.ZeroVector(), table, indicies);
|
||||
|
||||
ir.SetVector(d, result);
|
||||
return true;
|
||||
bool ArmTranslatorVisitor::asimd_VTBX(bool D, size_t Vn, size_t Vd, size_t len, bool N, bool M, size_t Vm) {
|
||||
return TableLookup(*this, false, D, Vn, Vd, len, N, M, Vm);
|
||||
}
|
||||
|
||||
} // namespace Dynarmic::A32
|
||||
|
||||
@@ -514,6 +514,7 @@ struct ArmTranslatorVisitor final {
|
||||
// Advanced SIMD miscellaneous
|
||||
bool asimd_VEXT(bool D, size_t Vn, size_t Vd, Imm<4> imm4, bool N, bool Q, bool M, size_t Vm);
|
||||
bool asimd_VTBL(bool D, size_t Vn, size_t Vd, size_t len, bool N, bool M, size_t Vm);
|
||||
bool asimd_VTBX(bool D, size_t Vn, size_t Vd, size_t len, bool N, bool M, size_t Vm);
|
||||
|
||||
// Advanced SIMD load/store structures
|
||||
bool v8_VST_multiple(bool D, Reg n, size_t Vd, Imm<4> type, size_t sz, size_t align, Reg m);
|
||||
|
||||
@@ -1739,14 +1739,26 @@ U128 IREmitter::VectorSub(size_t esize, const U128& a, const U128& b) {
|
||||
UNREACHABLE();
|
||||
}
|
||||
|
||||
// Emits a VectorTable instruction whose entries are 64-bit values.
//
// `values` must hold between one and four entries (asserted). The opcode is always
// given four operands, so a shorter list is padded with value-initialised U64
// entries before the instruction is emitted.
Table IREmitter::VectorTable(std::vector<U64> values) {
    ASSERT(values.size() >= 1 && values.size() <= 4);

    // Pad up to the fixed operand count of the opcode.
    constexpr size_t operand_count = 4;
    values.resize(operand_count);

    return Inst<Table>(Opcode::VectorTable,
                       values[0],
                       values[1],
                       values[2],
                       values[3]);
}
|
||||
|
||||
// Emits a VectorTable instruction whose entries are 128-bit values.
//
// `values` must hold between one and four entries (asserted). The opcode is always
// given four operands, so a shorter list is padded with value-initialised U128
// entries before the instruction is emitted.
Table IREmitter::VectorTable(std::vector<U128> values) {
    ASSERT(values.size() >= 1 && values.size() <= 4);

    // Pad up to the fixed operand count of the opcode.
    constexpr size_t operand_count = 4;
    values.resize(operand_count);

    return Inst<Table>(Opcode::VectorTable,
                       values[0],
                       values[1],
                       values[2],
                       values[3]);
}
|
||||
|
||||
// Emits a 64-bit table lookup (VectorTableLookup64).
//
// `table` must have been built from U64 entries; this is checked by asserting the
// type of the table instruction's first argument. `defaults`, `table` and `indices`
// are passed to the opcode in that order.
U64 IREmitter::VectorTableLookup(const U64& defaults, const Table& table, const U64& indices) {
    // Guard against pairing a 128-bit table with the 64-bit lookup opcode.
    ASSERT(table.GetInst()->GetArg(0).GetType() == Type::U64);

    return Inst<U64>(Opcode::VectorTableLookup64,
                     defaults,
                     table,
                     indices);
}
|
||||
|
||||
// Emits a 128-bit table lookup (VectorTableLookup128).
//
// `table` must have been built from U128 entries; this is checked by asserting the
// type of the table instruction's first argument. `defaults`, `table` and `indices`
// are passed to the opcode in that order.
U128 IREmitter::VectorTableLookup(const U128& defaults, const Table& table, const U128& indices) {
    // Guard against pairing a 64-bit table with the 128-bit lookup opcode.
    ASSERT(table.GetInst()->GetArg(0).GetType() == Type::U128);
    return Inst<U128>(Opcode::VectorTableLookup128, defaults, table, indices);
}
|
||||
|
||||
U128 IREmitter::VectorUnsignedAbsoluteDifference(size_t esize, const U128& a, const U128& b) {
|
||||
|
||||
@@ -297,7 +297,9 @@ public:
|
||||
U128 VectorSignedSaturatedShiftLeft(size_t esize, const U128& a, const U128& b);
|
||||
U128 VectorSignedSaturatedShiftLeftUnsigned(size_t esize, const U128& a, const U128& b);
|
||||
U128 VectorSub(size_t esize, const U128& a, const U128& b);
|
||||
Table VectorTable(std::vector<U64> values);
|
||||
Table VectorTable(std::vector<U128> values);
|
||||
U64 VectorTableLookup(const U64& defaults, const Table& table, const U64& indices);
|
||||
U128 VectorTableLookup(const U128& defaults, const Table& table, const U128& indices);
|
||||
U128 VectorUnsignedAbsoluteDifference(size_t esize, const U128& a, const U128& b);
|
||||
U128 VectorUnsignedRecipEstimate(const U128& a);
|
||||
|
||||
@@ -470,8 +470,9 @@ OPCODE(VectorSub8, U128, U128
|
||||
OPCODE(VectorSub16, U128, U128, U128 )
|
||||
OPCODE(VectorSub32, U128, U128, U128 )
|
||||
OPCODE(VectorSub64, U128, U128, U128 )
|
||||
OPCODE(VectorTable, Table, U128, Opaque, Opaque, Opaque )
|
||||
OPCODE(VectorTableLookup, U128, U128, Table, U128 )
|
||||
OPCODE(VectorTable, Table, Opaque, Opaque, Opaque, Opaque )
|
||||
OPCODE(VectorTableLookup64, U64, U64, Table, U64 )
|
||||
OPCODE(VectorTableLookup128, U128, U128, Table, U128 )
|
||||
OPCODE(VectorUnsignedAbsoluteDifference8, U128, U128, U128 )
|
||||
OPCODE(VectorUnsignedAbsoluteDifference16, U128, U128, U128 )
|
||||
OPCODE(VectorUnsignedAbsoluteDifference32, U128, U128, U128 )
|
||||
|
||||
Reference in New Issue
Block a user