summaryrefslogtreecommitdiff
path: root/src/shader_recompiler/frontend/maxwell/translate/impl
diff options
context:
space:
mode:
Diffstat (limited to 'src/shader_recompiler/frontend/maxwell/translate/impl')
-rw-r--r--src/shader_recompiler/frontend/maxwell/translate/impl/load_store_local_shared.cpp197
-rw-r--r--src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp16
2 files changed, 197 insertions, 16 deletions
diff --git a/src/shader_recompiler/frontend/maxwell/translate/impl/load_store_local_shared.cpp b/src/shader_recompiler/frontend/maxwell/translate/impl/load_store_local_shared.cpp
new file mode 100644
index 000000000..68963c8ea
--- /dev/null
+++ b/src/shader_recompiler/frontend/maxwell/translate/impl/load_store_local_shared.cpp
@@ -0,0 +1,197 @@
1// Copyright 2021 yuzu Emulator Project
2// Licensed under GPLv2 or any later version
3// Refer to the license.txt file included.
4
5#include "common/bit_field.h"
6#include "common/common_types.h"
7#include "shader_recompiler/frontend/maxwell/translate/impl/impl.h"
8
9namespace Shader::Maxwell {
10namespace {
11enum class Size : u64 {
12 U8,
13 S8,
14 U16,
15 S16,
16 B32,
17 B64,
18 B128,
19};
20
21IR::U32 Offset(TranslatorVisitor& v, u64 insn) {
22 union {
23 u64 raw;
24 BitField<8, 8, IR::Reg> offset_reg;
25 BitField<20, 24, u64> absolute_offset;
26 BitField<20, 24, s64> relative_offset;
27 } const encoding{insn};
28
29 if (encoding.offset_reg == IR::Reg::RZ) {
30 return v.ir.Imm32(static_cast<u32>(encoding.absolute_offset));
31 } else {
32 const s32 relative{static_cast<s32>(encoding.relative_offset.Value())};
33 return v.ir.IAdd(v.X(encoding.offset_reg), v.ir.Imm32(relative));
34 }
35}
36
37std::pair<int, bool> GetSize(u64 insn) {
38 union {
39 u64 raw;
40 BitField<48, 3, Size> size;
41 } const encoding{insn};
42
43 const Size nnn = encoding.size;
44 switch (encoding.size) {
45 case Size::U8:
46 return {8, false};
47 case Size::S8:
48 return {8, true};
49 case Size::U16:
50 return {16, false};
51 case Size::S16:
52 return {16, true};
53 case Size::B32:
54 return {32, false};
55 case Size::B64:
56 return {64, false};
57 case Size::B128:
58 return {128, false};
59 default:
60 throw NotImplementedException("Invalid size {}", encoding.size.Value());
61 }
62}
63
64IR::Reg Reg(u64 insn) {
65 union {
66 u64 raw;
67 BitField<0, 8, IR::Reg> reg;
68 } const encoding{insn};
69
70 return encoding.reg;
71}
72
73IR::U32 ByteOffset(IR::IREmitter& ir, const IR::U32& offset) {
74 return ir.BitwiseAnd(ir.ShiftLeftLogical(offset, ir.Imm32(3)), ir.Imm32(24));
75}
76
77IR::U32 ShortOffset(IR::IREmitter& ir, const IR::U32& offset) {
78 return ir.BitwiseAnd(ir.ShiftLeftLogical(offset, ir.Imm32(3)), ir.Imm32(16));
79}
80} // Anonymous namespace
81
82void TranslatorVisitor::LDL(u64 insn) {
83 const IR::U32 offset{Offset(*this, insn)};
84 const IR::U32 word_offset{ir.ShiftRightArithmetic(offset, ir.Imm32(2))};
85
86 const IR::Reg dest{Reg(insn)};
87 const auto [bit_size, is_signed]{GetSize(insn)};
88 switch (bit_size) {
89 case 8: {
90 const IR::U32 bit{ByteOffset(ir, offset)};
91 X(dest, ir.BitFieldExtract(ir.LoadLocal(word_offset), bit, ir.Imm32(8), is_signed));
92 break;
93 }
94 case 16: {
95 const IR::U32 bit{ShortOffset(ir, offset)};
96 X(dest, ir.BitFieldExtract(ir.LoadLocal(word_offset), bit, ir.Imm32(16), is_signed));
97 break;
98 }
99 case 32:
100 case 64:
101 case 128:
102 if (!IR::IsAligned(dest, bit_size / 32)) {
103 throw NotImplementedException("Unaligned destination register {}", dest);
104 }
105 X(dest, ir.LoadLocal(word_offset));
106 for (int i = 1; i < bit_size / 32; ++i) {
107 X(dest + i, ir.LoadLocal(ir.IAdd(word_offset, ir.Imm32(i))));
108 }
109 break;
110 }
111}
112
113void TranslatorVisitor::LDS(u64 insn) {
114 const IR::U32 offset{Offset(*this, insn)};
115 const IR::Reg dest{Reg(insn)};
116 const auto [bit_size, is_signed]{GetSize(insn)};
117 const IR::Value value{ir.LoadShared(bit_size, is_signed, offset)};
118 switch (bit_size) {
119 case 8:
120 case 16:
121 case 32:
122 X(dest, IR::U32{value});
123 break;
124 case 64:
125 case 128:
126 if (!IR::IsAligned(dest, bit_size / 32)) {
127 throw NotImplementedException("Unaligned destination register {}", dest);
128 }
129 for (int element = 0; element < bit_size / 32; ++element) {
130 X(dest + element, IR::U32{ir.CompositeExtract(value, element)});
131 }
132 break;
133 }
134}
135
136void TranslatorVisitor::STL(u64 insn) {
137 const IR::U32 offset{Offset(*this, insn)};
138 const IR::U32 word_offset{ir.ShiftRightArithmetic(offset, ir.Imm32(2))};
139
140 const IR::Reg reg{Reg(insn)};
141 const IR::U32 src{X(reg)};
142 const int bit_size{GetSize(insn).first};
143 switch (bit_size) {
144 case 8: {
145 const IR::U32 bit{ByteOffset(ir, offset)};
146 const IR::U32 value{ir.BitFieldInsert(ir.LoadLocal(word_offset), src, bit, ir.Imm32(8))};
147 ir.WriteLocal(word_offset, value);
148 break;
149 }
150 case 16: {
151 const IR::U32 bit{ShortOffset(ir, offset)};
152 const IR::U32 value{ir.BitFieldInsert(ir.LoadLocal(word_offset), src, bit, ir.Imm32(16))};
153 ir.WriteLocal(word_offset, value);
154 break;
155 }
156 case 32:
157 case 64:
158 case 128:
159 if (!IR::IsAligned(reg, bit_size / 32)) {
160 throw NotImplementedException("Unaligned source register");
161 }
162 ir.WriteLocal(word_offset, src);
163 for (int i = 1; i < bit_size / 32; ++i) {
164 ir.WriteLocal(ir.IAdd(word_offset, ir.Imm32(i)), X(reg + i));
165 }
166 break;
167 }
168}
169
170void TranslatorVisitor::STS(u64 insn) {
171 const IR::U32 offset{Offset(*this, insn)};
172 const IR::Reg reg{Reg(insn)};
173 const int bit_size{GetSize(insn).first};
174 switch (bit_size) {
175 case 8:
176 case 16:
177 case 32:
178 ir.WriteShared(bit_size, offset, X(reg));
179 break;
180 case 64:
181 if (!IR::IsAligned(reg, 2)) {
182 throw NotImplementedException("Unaligned source register {}", reg);
183 }
184 ir.WriteShared(64, offset, ir.CompositeConstruct(X(reg), X(reg + 1)));
185 break;
186 case 128: {
187 if (!IR::IsAligned(reg, 2)) {
188 throw NotImplementedException("Unaligned source register {}", reg);
189 }
190 const IR::Value vector{ir.CompositeConstruct(X(reg), X(reg + 1), X(reg + 2), X(reg + 3))};
191 ir.WriteShared(128, offset, vector);
192 break;
193 }
194 }
195}
196
197} // namespace Shader::Maxwell
diff --git a/src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp b/src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp
index 409216640..b62d8ee2a 100644
--- a/src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp
+++ b/src/shader_recompiler/frontend/maxwell/translate/impl/not_implemented.cpp
@@ -193,14 +193,6 @@ void TranslatorVisitor::LD(u64) {
193 ThrowNotImplemented(Opcode::LD); 193 ThrowNotImplemented(Opcode::LD);
194} 194}
195 195
196void TranslatorVisitor::LDL(u64) {
197 ThrowNotImplemented(Opcode::LDL);
198}
199
200void TranslatorVisitor::LDS(u64) {
201 ThrowNotImplemented(Opcode::LDS);
202}
203
204void TranslatorVisitor::LEPC(u64) { 196void TranslatorVisitor::LEPC(u64) {
205 ThrowNotImplemented(Opcode::LEPC); 197 ThrowNotImplemented(Opcode::LEPC);
206} 198}
@@ -309,18 +301,10 @@ void TranslatorVisitor::ST(u64) {
309 ThrowNotImplemented(Opcode::ST); 301 ThrowNotImplemented(Opcode::ST);
310} 302}
311 303
312void TranslatorVisitor::STL(u64) {
313 ThrowNotImplemented(Opcode::STL);
314}
315
316void TranslatorVisitor::STP(u64) { 304void TranslatorVisitor::STP(u64) {
317 ThrowNotImplemented(Opcode::STP); 305 ThrowNotImplemented(Opcode::STP);
318} 306}
319 307
320void TranslatorVisitor::STS(u64) {
321 ThrowNotImplemented(Opcode::STS);
322}
323
324void TranslatorVisitor::SUATOM_cas(u64) { 308void TranslatorVisitor::SUATOM_cas(u64) {
325 ThrowNotImplemented(Opcode::SUATOM_cas); 309 ThrowNotImplemented(Opcode::SUATOM_cas);
326} 310}