diff options
| author | 2021-07-25 11:39:04 -0700 | |
|---|---|---|
| committer | 2021-07-25 11:39:04 -0700 | |
| commit | 98b26b6e126d4775fdf3f773fe8a8ac808a8ff8f (patch) | |
| tree | 816faa96c2c4d291825063433331a8ea4b3d08f1 /src/shader_recompiler/frontend/ir/ir_emitter.cpp | |
| parent | Merge pull request #6699 from lat9nq/common-threads (diff) | |
| parent | shader: Support out of bound local memory reads and immediate writes (diff) | |
| download | yuzu-98b26b6e126d4775fdf3f773fe8a8ac808a8ff8f.tar.gz yuzu-98b26b6e126d4775fdf3f773fe8a8ac808a8ff8f.tar.xz yuzu-98b26b6e126d4775fdf3f773fe8a8ac808a8ff8f.zip | |
Merge pull request #6585 from ameerj/hades
Shader Decompiler Rewrite
Diffstat (limited to 'src/shader_recompiler/frontend/ir/ir_emitter.cpp')
| -rw-r--r-- | src/shader_recompiler/frontend/ir/ir_emitter.cpp | 2017 |
1 files changed, 2017 insertions, 0 deletions
diff --git a/src/shader_recompiler/frontend/ir/ir_emitter.cpp b/src/shader_recompiler/frontend/ir/ir_emitter.cpp new file mode 100644 index 000000000..13159a68d --- /dev/null +++ b/src/shader_recompiler/frontend/ir/ir_emitter.cpp | |||
| @@ -0,0 +1,2017 @@ | |||
| 1 | // Copyright 2021 yuzu Emulator Project | ||
| 2 | // Licensed under GPLv2 or any later version | ||
| 3 | // Refer to the license.txt file included. | ||
| 4 | |||
| 5 | #include "common/bit_cast.h" | ||
| 6 | #include "shader_recompiler/frontend/ir/ir_emitter.h" | ||
| 7 | #include "shader_recompiler/frontend/ir/value.h" | ||
| 8 | |||
| 9 | namespace Shader::IR { | ||
| 10 | namespace { | ||
| 11 | [[noreturn]] void ThrowInvalidType(Type type) { | ||
| 12 | throw InvalidArgument("Invalid type {}", type); | ||
| 13 | } | ||
| 14 | |||
| 15 | Value MakeLodClampPair(IREmitter& ir, const F32& bias_lod, const F32& lod_clamp) { | ||
| 16 | if (!bias_lod.IsEmpty() && !lod_clamp.IsEmpty()) { | ||
| 17 | return ir.CompositeConstruct(bias_lod, lod_clamp); | ||
| 18 | } else if (!bias_lod.IsEmpty()) { | ||
| 19 | return bias_lod; | ||
| 20 | } else if (!lod_clamp.IsEmpty()) { | ||
| 21 | return lod_clamp; | ||
| 22 | } else { | ||
| 23 | return Value{}; | ||
| 24 | } | ||
| 25 | } | ||
| 26 | } // Anonymous namespace | ||
| 27 | |||
| 28 | U1 IREmitter::Imm1(bool value) const { | ||
| 29 | return U1{Value{value}}; | ||
| 30 | } | ||
| 31 | |||
| 32 | U8 IREmitter::Imm8(u8 value) const { | ||
| 33 | return U8{Value{value}}; | ||
| 34 | } | ||
| 35 | |||
| 36 | U16 IREmitter::Imm16(u16 value) const { | ||
| 37 | return U16{Value{value}}; | ||
| 38 | } | ||
| 39 | |||
| 40 | U32 IREmitter::Imm32(u32 value) const { | ||
| 41 | return U32{Value{value}}; | ||
| 42 | } | ||
| 43 | |||
| 44 | U32 IREmitter::Imm32(s32 value) const { | ||
| 45 | return U32{Value{static_cast<u32>(value)}}; | ||
| 46 | } | ||
| 47 | |||
| 48 | F32 IREmitter::Imm32(f32 value) const { | ||
| 49 | return F32{Value{value}}; | ||
| 50 | } | ||
| 51 | |||
| 52 | U64 IREmitter::Imm64(u64 value) const { | ||
| 53 | return U64{Value{value}}; | ||
| 54 | } | ||
| 55 | |||
| 56 | U64 IREmitter::Imm64(s64 value) const { | ||
| 57 | return U64{Value{static_cast<u64>(value)}}; | ||
| 58 | } | ||
| 59 | |||
| 60 | F64 IREmitter::Imm64(f64 value) const { | ||
| 61 | return F64{Value{value}}; | ||
| 62 | } | ||
| 63 | |||
| 64 | U1 IREmitter::ConditionRef(const U1& value) { | ||
| 65 | return Inst<U1>(Opcode::ConditionRef, value); | ||
| 66 | } | ||
| 67 | |||
| 68 | void IREmitter::Reference(const Value& value) { | ||
| 69 | Inst(Opcode::Reference, value); | ||
| 70 | } | ||
| 71 | |||
| 72 | void IREmitter::PhiMove(IR::Inst& phi, const Value& value) { | ||
| 73 | Inst(Opcode::PhiMove, Value{&phi}, value); | ||
| 74 | } | ||
| 75 | |||
| 76 | void IREmitter::Prologue() { | ||
| 77 | Inst(Opcode::Prologue); | ||
| 78 | } | ||
| 79 | |||
| 80 | void IREmitter::Epilogue() { | ||
| 81 | Inst(Opcode::Epilogue); | ||
| 82 | } | ||
| 83 | |||
| 84 | void IREmitter::DemoteToHelperInvocation() { | ||
| 85 | Inst(Opcode::DemoteToHelperInvocation); | ||
| 86 | } | ||
| 87 | |||
| 88 | void IREmitter::EmitVertex(const U32& stream) { | ||
| 89 | Inst(Opcode::EmitVertex, stream); | ||
| 90 | } | ||
| 91 | |||
| 92 | void IREmitter::EndPrimitive(const U32& stream) { | ||
| 93 | Inst(Opcode::EndPrimitive, stream); | ||
| 94 | } | ||
| 95 | |||
| 96 | void IREmitter::Barrier() { | ||
| 97 | Inst(Opcode::Barrier); | ||
| 98 | } | ||
| 99 | |||
| 100 | void IREmitter::WorkgroupMemoryBarrier() { | ||
| 101 | Inst(Opcode::WorkgroupMemoryBarrier); | ||
| 102 | } | ||
| 103 | |||
| 104 | void IREmitter::DeviceMemoryBarrier() { | ||
| 105 | Inst(Opcode::DeviceMemoryBarrier); | ||
| 106 | } | ||
| 107 | |||
| 108 | U32 IREmitter::GetReg(IR::Reg reg) { | ||
| 109 | return Inst<U32>(Opcode::GetRegister, reg); | ||
| 110 | } | ||
| 111 | |||
| 112 | void IREmitter::SetReg(IR::Reg reg, const U32& value) { | ||
| 113 | Inst(Opcode::SetRegister, reg, value); | ||
| 114 | } | ||
| 115 | |||
| 116 | U1 IREmitter::GetPred(IR::Pred pred, bool is_negated) { | ||
| 117 | if (pred == Pred::PT) { | ||
| 118 | return Imm1(!is_negated); | ||
| 119 | } | ||
| 120 | const U1 value{Inst<U1>(Opcode::GetPred, pred)}; | ||
| 121 | if (is_negated) { | ||
| 122 | return Inst<U1>(Opcode::LogicalNot, value); | ||
| 123 | } else { | ||
| 124 | return value; | ||
| 125 | } | ||
| 126 | } | ||
| 127 | |||
| 128 | void IREmitter::SetPred(IR::Pred pred, const U1& value) { | ||
| 129 | if (pred != IR::Pred::PT) { | ||
| 130 | Inst(Opcode::SetPred, pred, value); | ||
| 131 | } | ||
| 132 | } | ||
| 133 | |||
| 134 | U1 IREmitter::GetGotoVariable(u32 id) { | ||
| 135 | return Inst<U1>(Opcode::GetGotoVariable, id); | ||
| 136 | } | ||
| 137 | |||
| 138 | void IREmitter::SetGotoVariable(u32 id, const U1& value) { | ||
| 139 | Inst(Opcode::SetGotoVariable, id, value); | ||
| 140 | } | ||
| 141 | |||
| 142 | U32 IREmitter::GetIndirectBranchVariable() { | ||
| 143 | return Inst<U32>(Opcode::GetIndirectBranchVariable); | ||
| 144 | } | ||
| 145 | |||
| 146 | void IREmitter::SetIndirectBranchVariable(const U32& value) { | ||
| 147 | Inst(Opcode::SetIndirectBranchVariable, value); | ||
| 148 | } | ||
| 149 | |||
| 150 | U32 IREmitter::GetCbuf(const U32& binding, const U32& byte_offset) { | ||
| 151 | return Inst<U32>(Opcode::GetCbufU32, binding, byte_offset); | ||
| 152 | } | ||
| 153 | |||
| 154 | Value IREmitter::GetCbuf(const U32& binding, const U32& byte_offset, size_t bitsize, | ||
| 155 | bool is_signed) { | ||
| 156 | switch (bitsize) { | ||
| 157 | case 8: | ||
| 158 | return Inst<U32>(is_signed ? Opcode::GetCbufS8 : Opcode::GetCbufU8, binding, byte_offset); | ||
| 159 | case 16: | ||
| 160 | return Inst<U32>(is_signed ? Opcode::GetCbufS16 : Opcode::GetCbufU16, binding, byte_offset); | ||
| 161 | case 32: | ||
| 162 | return Inst<U32>(Opcode::GetCbufU32, binding, byte_offset); | ||
| 163 | case 64: | ||
| 164 | return Inst(Opcode::GetCbufU32x2, binding, byte_offset); | ||
| 165 | default: | ||
| 166 | throw InvalidArgument("Invalid bit size {}", bitsize); | ||
| 167 | } | ||
| 168 | } | ||
| 169 | |||
| 170 | F32 IREmitter::GetFloatCbuf(const U32& binding, const U32& byte_offset) { | ||
| 171 | return Inst<F32>(Opcode::GetCbufF32, binding, byte_offset); | ||
| 172 | } | ||
| 173 | |||
| 174 | U1 IREmitter::GetZFlag() { | ||
| 175 | return Inst<U1>(Opcode::GetZFlag); | ||
| 176 | } | ||
| 177 | |||
| 178 | U1 IREmitter::GetSFlag() { | ||
| 179 | return Inst<U1>(Opcode::GetSFlag); | ||
| 180 | } | ||
| 181 | |||
| 182 | U1 IREmitter::GetCFlag() { | ||
| 183 | return Inst<U1>(Opcode::GetCFlag); | ||
| 184 | } | ||
| 185 | |||
| 186 | U1 IREmitter::GetOFlag() { | ||
| 187 | return Inst<U1>(Opcode::GetOFlag); | ||
| 188 | } | ||
| 189 | |||
| 190 | void IREmitter::SetZFlag(const U1& value) { | ||
| 191 | Inst(Opcode::SetZFlag, value); | ||
| 192 | } | ||
| 193 | |||
| 194 | void IREmitter::SetSFlag(const U1& value) { | ||
| 195 | Inst(Opcode::SetSFlag, value); | ||
| 196 | } | ||
| 197 | |||
| 198 | void IREmitter::SetCFlag(const U1& value) { | ||
| 199 | Inst(Opcode::SetCFlag, value); | ||
| 200 | } | ||
| 201 | |||
| 202 | void IREmitter::SetOFlag(const U1& value) { | ||
| 203 | Inst(Opcode::SetOFlag, value); | ||
| 204 | } | ||
| 205 | |||
| 206 | static U1 GetFlowTest(IREmitter& ir, FlowTest flow_test) { | ||
| 207 | switch (flow_test) { | ||
| 208 | case FlowTest::F: | ||
| 209 | return ir.Imm1(false); | ||
| 210 | case FlowTest::LT: | ||
| 211 | return ir.LogicalXor(ir.LogicalAnd(ir.GetSFlag(), ir.LogicalNot(ir.GetZFlag())), | ||
| 212 | ir.GetOFlag()); | ||
| 213 | case FlowTest::EQ: | ||
| 214 | return ir.LogicalAnd(ir.LogicalNot(ir.GetSFlag()), ir.GetZFlag()); | ||
| 215 | case FlowTest::LE: | ||
| 216 | return ir.LogicalXor(ir.GetSFlag(), ir.LogicalOr(ir.GetZFlag(), ir.GetOFlag())); | ||
| 217 | case FlowTest::GT: | ||
| 218 | return ir.LogicalAnd(ir.LogicalXor(ir.LogicalNot(ir.GetSFlag()), ir.GetOFlag()), | ||
| 219 | ir.LogicalNot(ir.GetZFlag())); | ||
| 220 | case FlowTest::NE: | ||
| 221 | return ir.LogicalNot(ir.GetZFlag()); | ||
| 222 | case FlowTest::GE: | ||
| 223 | return ir.LogicalNot(ir.LogicalXor(ir.GetSFlag(), ir.GetOFlag())); | ||
| 224 | case FlowTest::NUM: | ||
| 225 | return ir.LogicalOr(ir.LogicalNot(ir.GetSFlag()), ir.LogicalNot(ir.GetZFlag())); | ||
| 226 | case FlowTest::NaN: | ||
| 227 | return ir.LogicalAnd(ir.GetSFlag(), ir.GetZFlag()); | ||
| 228 | case FlowTest::LTU: | ||
| 229 | return ir.LogicalXor(ir.GetSFlag(), ir.GetOFlag()); | ||
| 230 | case FlowTest::EQU: | ||
| 231 | return ir.GetZFlag(); | ||
| 232 | case FlowTest::LEU: | ||
| 233 | return ir.LogicalOr(ir.LogicalXor(ir.GetSFlag(), ir.GetOFlag()), ir.GetZFlag()); | ||
| 234 | case FlowTest::GTU: | ||
| 235 | return ir.LogicalXor(ir.LogicalNot(ir.GetSFlag()), | ||
| 236 | ir.LogicalOr(ir.GetZFlag(), ir.GetOFlag())); | ||
| 237 | case FlowTest::NEU: | ||
| 238 | return ir.LogicalOr(ir.GetSFlag(), ir.LogicalNot(ir.GetZFlag())); | ||
| 239 | case FlowTest::GEU: | ||
| 240 | return ir.LogicalXor(ir.LogicalOr(ir.LogicalNot(ir.GetSFlag()), ir.GetZFlag()), | ||
| 241 | ir.GetOFlag()); | ||
| 242 | case FlowTest::T: | ||
| 243 | return ir.Imm1(true); | ||
| 244 | case FlowTest::OFF: | ||
| 245 | return ir.LogicalNot(ir.GetOFlag()); | ||
| 246 | case FlowTest::LO: | ||
| 247 | return ir.LogicalNot(ir.GetCFlag()); | ||
| 248 | case FlowTest::SFF: | ||
| 249 | return ir.LogicalNot(ir.GetSFlag()); | ||
| 250 | case FlowTest::LS: | ||
| 251 | return ir.LogicalOr(ir.GetZFlag(), ir.LogicalNot(ir.GetCFlag())); | ||
| 252 | case FlowTest::HI: | ||
| 253 | return ir.LogicalAnd(ir.GetCFlag(), ir.LogicalNot(ir.GetZFlag())); | ||
| 254 | case FlowTest::SFT: | ||
| 255 | return ir.GetSFlag(); | ||
| 256 | case FlowTest::HS: | ||
| 257 | return ir.GetCFlag(); | ||
| 258 | case FlowTest::OFT: | ||
| 259 | return ir.GetOFlag(); | ||
| 260 | case FlowTest::RLE: | ||
| 261 | return ir.LogicalOr(ir.GetSFlag(), ir.GetZFlag()); | ||
| 262 | case FlowTest::RGT: | ||
| 263 | return ir.LogicalAnd(ir.LogicalNot(ir.GetSFlag()), ir.LogicalNot(ir.GetZFlag())); | ||
| 264 | case FlowTest::FCSM_TR: | ||
| 265 | LOG_WARNING(Shader, "(STUBBED) FCSM_TR"); | ||
| 266 | return ir.Imm1(false); | ||
| 267 | case FlowTest::CSM_TA: | ||
| 268 | case FlowTest::CSM_TR: | ||
| 269 | case FlowTest::CSM_MX: | ||
| 270 | case FlowTest::FCSM_TA: | ||
| 271 | case FlowTest::FCSM_MX: | ||
| 272 | default: | ||
| 273 | throw NotImplementedException("Flow test {}", flow_test); | ||
| 274 | } | ||
| 275 | } | ||
| 276 | |||
| 277 | U1 IREmitter::Condition(IR::Condition cond) { | ||
| 278 | const FlowTest flow_test{cond.GetFlowTest()}; | ||
| 279 | const auto [pred, is_negated]{cond.GetPred()}; | ||
| 280 | if (flow_test == FlowTest::T) { | ||
| 281 | return GetPred(pred, is_negated); | ||
| 282 | } | ||
| 283 | return LogicalAnd(GetPred(pred, is_negated), GetFlowTest(*this, flow_test)); | ||
| 284 | } | ||
| 285 | |||
| 286 | U1 IREmitter::GetFlowTestResult(FlowTest test) { | ||
| 287 | return GetFlowTest(*this, test); | ||
| 288 | } | ||
| 289 | |||
| 290 | F32 IREmitter::GetAttribute(IR::Attribute attribute) { | ||
| 291 | return GetAttribute(attribute, Imm32(0)); | ||
| 292 | } | ||
| 293 | |||
| 294 | F32 IREmitter::GetAttribute(IR::Attribute attribute, const U32& vertex) { | ||
| 295 | return Inst<F32>(Opcode::GetAttribute, attribute, vertex); | ||
| 296 | } | ||
| 297 | |||
| 298 | void IREmitter::SetAttribute(IR::Attribute attribute, const F32& value, const U32& vertex) { | ||
| 299 | Inst(Opcode::SetAttribute, attribute, value, vertex); | ||
| 300 | } | ||
| 301 | |||
| 302 | F32 IREmitter::GetAttributeIndexed(const U32& phys_address) { | ||
| 303 | return GetAttributeIndexed(phys_address, Imm32(0)); | ||
| 304 | } | ||
| 305 | |||
| 306 | F32 IREmitter::GetAttributeIndexed(const U32& phys_address, const U32& vertex) { | ||
| 307 | return Inst<F32>(Opcode::GetAttributeIndexed, phys_address, vertex); | ||
| 308 | } | ||
| 309 | |||
| 310 | void IREmitter::SetAttributeIndexed(const U32& phys_address, const F32& value, const U32& vertex) { | ||
| 311 | Inst(Opcode::SetAttributeIndexed, phys_address, value, vertex); | ||
| 312 | } | ||
| 313 | |||
| 314 | F32 IREmitter::GetPatch(Patch patch) { | ||
| 315 | return Inst<F32>(Opcode::GetPatch, patch); | ||
| 316 | } | ||
| 317 | |||
| 318 | void IREmitter::SetPatch(Patch patch, const F32& value) { | ||
| 319 | Inst(Opcode::SetPatch, patch, value); | ||
| 320 | } | ||
| 321 | |||
| 322 | void IREmitter::SetFragColor(u32 index, u32 component, const F32& value) { | ||
| 323 | Inst(Opcode::SetFragColor, Imm32(index), Imm32(component), value); | ||
| 324 | } | ||
| 325 | |||
| 326 | void IREmitter::SetSampleMask(const U32& value) { | ||
| 327 | Inst(Opcode::SetSampleMask, value); | ||
| 328 | } | ||
| 329 | |||
| 330 | void IREmitter::SetFragDepth(const F32& value) { | ||
| 331 | Inst(Opcode::SetFragDepth, value); | ||
| 332 | } | ||
| 333 | |||
| 334 | U32 IREmitter::WorkgroupIdX() { | ||
| 335 | return U32{CompositeExtract(Inst(Opcode::WorkgroupId), 0)}; | ||
| 336 | } | ||
| 337 | |||
| 338 | U32 IREmitter::WorkgroupIdY() { | ||
| 339 | return U32{CompositeExtract(Inst(Opcode::WorkgroupId), 1)}; | ||
| 340 | } | ||
| 341 | |||
| 342 | U32 IREmitter::WorkgroupIdZ() { | ||
| 343 | return U32{CompositeExtract(Inst(Opcode::WorkgroupId), 2)}; | ||
| 344 | } | ||
| 345 | |||
| 346 | Value IREmitter::LocalInvocationId() { | ||
| 347 | return Inst(Opcode::LocalInvocationId); | ||
| 348 | } | ||
| 349 | |||
| 350 | U32 IREmitter::LocalInvocationIdX() { | ||
| 351 | return U32{CompositeExtract(Inst(Opcode::LocalInvocationId), 0)}; | ||
| 352 | } | ||
| 353 | |||
| 354 | U32 IREmitter::LocalInvocationIdY() { | ||
| 355 | return U32{CompositeExtract(Inst(Opcode::LocalInvocationId), 1)}; | ||
| 356 | } | ||
| 357 | |||
| 358 | U32 IREmitter::LocalInvocationIdZ() { | ||
| 359 | return U32{CompositeExtract(Inst(Opcode::LocalInvocationId), 2)}; | ||
| 360 | } | ||
| 361 | |||
| 362 | U32 IREmitter::InvocationId() { | ||
| 363 | return Inst<U32>(Opcode::InvocationId); | ||
| 364 | } | ||
| 365 | |||
| 366 | U32 IREmitter::SampleId() { | ||
| 367 | return Inst<U32>(Opcode::SampleId); | ||
| 368 | } | ||
| 369 | |||
| 370 | U1 IREmitter::IsHelperInvocation() { | ||
| 371 | return Inst<U1>(Opcode::IsHelperInvocation); | ||
| 372 | } | ||
| 373 | |||
| 374 | F32 IREmitter::YDirection() { | ||
| 375 | return Inst<F32>(Opcode::YDirection); | ||
| 376 | } | ||
| 377 | |||
| 378 | U32 IREmitter::LaneId() { | ||
| 379 | return Inst<U32>(Opcode::LaneId); | ||
| 380 | } | ||
| 381 | |||
| 382 | U32 IREmitter::LoadGlobalU8(const U64& address) { | ||
| 383 | return Inst<U32>(Opcode::LoadGlobalU8, address); | ||
| 384 | } | ||
| 385 | |||
| 386 | U32 IREmitter::LoadGlobalS8(const U64& address) { | ||
| 387 | return Inst<U32>(Opcode::LoadGlobalS8, address); | ||
| 388 | } | ||
| 389 | |||
| 390 | U32 IREmitter::LoadGlobalU16(const U64& address) { | ||
| 391 | return Inst<U32>(Opcode::LoadGlobalU16, address); | ||
| 392 | } | ||
| 393 | |||
| 394 | U32 IREmitter::LoadGlobalS16(const U64& address) { | ||
| 395 | return Inst<U32>(Opcode::LoadGlobalS16, address); | ||
| 396 | } | ||
| 397 | |||
| 398 | U32 IREmitter::LoadGlobal32(const U64& address) { | ||
| 399 | return Inst<U32>(Opcode::LoadGlobal32, address); | ||
| 400 | } | ||
| 401 | |||
| 402 | Value IREmitter::LoadGlobal64(const U64& address) { | ||
| 403 | return Inst<Value>(Opcode::LoadGlobal64, address); | ||
| 404 | } | ||
| 405 | |||
| 406 | Value IREmitter::LoadGlobal128(const U64& address) { | ||
| 407 | return Inst<Value>(Opcode::LoadGlobal128, address); | ||
| 408 | } | ||
| 409 | |||
| 410 | void IREmitter::WriteGlobalU8(const U64& address, const U32& value) { | ||
| 411 | Inst(Opcode::WriteGlobalU8, address, value); | ||
| 412 | } | ||
| 413 | |||
| 414 | void IREmitter::WriteGlobalS8(const U64& address, const U32& value) { | ||
| 415 | Inst(Opcode::WriteGlobalS8, address, value); | ||
| 416 | } | ||
| 417 | |||
| 418 | void IREmitter::WriteGlobalU16(const U64& address, const U32& value) { | ||
| 419 | Inst(Opcode::WriteGlobalU16, address, value); | ||
| 420 | } | ||
| 421 | |||
| 422 | void IREmitter::WriteGlobalS16(const U64& address, const U32& value) { | ||
| 423 | Inst(Opcode::WriteGlobalS16, address, value); | ||
| 424 | } | ||
| 425 | |||
| 426 | void IREmitter::WriteGlobal32(const U64& address, const U32& value) { | ||
| 427 | Inst(Opcode::WriteGlobal32, address, value); | ||
| 428 | } | ||
| 429 | |||
| 430 | void IREmitter::WriteGlobal64(const U64& address, const IR::Value& vector) { | ||
| 431 | Inst(Opcode::WriteGlobal64, address, vector); | ||
| 432 | } | ||
| 433 | |||
| 434 | void IREmitter::WriteGlobal128(const U64& address, const IR::Value& vector) { | ||
| 435 | Inst(Opcode::WriteGlobal128, address, vector); | ||
| 436 | } | ||
| 437 | |||
| 438 | U32 IREmitter::LoadLocal(const IR::U32& word_offset) { | ||
| 439 | return Inst<U32>(Opcode::LoadLocal, word_offset); | ||
| 440 | } | ||
| 441 | |||
| 442 | void IREmitter::WriteLocal(const IR::U32& word_offset, const IR::U32& value) { | ||
| 443 | Inst(Opcode::WriteLocal, word_offset, value); | ||
| 444 | } | ||
| 445 | |||
| 446 | Value IREmitter::LoadShared(int bit_size, bool is_signed, const IR::U32& offset) { | ||
| 447 | switch (bit_size) { | ||
| 448 | case 8: | ||
| 449 | return Inst(is_signed ? Opcode::LoadSharedS8 : Opcode::LoadSharedU8, offset); | ||
| 450 | case 16: | ||
| 451 | return Inst(is_signed ? Opcode::LoadSharedS16 : Opcode::LoadSharedU16, offset); | ||
| 452 | case 32: | ||
| 453 | return Inst(Opcode::LoadSharedU32, offset); | ||
| 454 | case 64: | ||
| 455 | return Inst(Opcode::LoadSharedU64, offset); | ||
| 456 | case 128: | ||
| 457 | return Inst(Opcode::LoadSharedU128, offset); | ||
| 458 | } | ||
| 459 | throw InvalidArgument("Invalid bit size {}", bit_size); | ||
| 460 | } | ||
| 461 | |||
| 462 | void IREmitter::WriteShared(int bit_size, const IR::U32& offset, const IR::Value& value) { | ||
| 463 | switch (bit_size) { | ||
| 464 | case 8: | ||
| 465 | Inst(Opcode::WriteSharedU8, offset, value); | ||
| 466 | break; | ||
| 467 | case 16: | ||
| 468 | Inst(Opcode::WriteSharedU16, offset, value); | ||
| 469 | break; | ||
| 470 | case 32: | ||
| 471 | Inst(Opcode::WriteSharedU32, offset, value); | ||
| 472 | break; | ||
| 473 | case 64: | ||
| 474 | Inst(Opcode::WriteSharedU64, offset, value); | ||
| 475 | break; | ||
| 476 | case 128: | ||
| 477 | Inst(Opcode::WriteSharedU128, offset, value); | ||
| 478 | break; | ||
| 479 | default: | ||
| 480 | throw InvalidArgument("Invalid bit size {}", bit_size); | ||
| 481 | } | ||
| 482 | } | ||
| 483 | |||
| 484 | U1 IREmitter::GetZeroFromOp(const Value& op) { | ||
| 485 | return Inst<U1>(Opcode::GetZeroFromOp, op); | ||
| 486 | } | ||
| 487 | |||
| 488 | U1 IREmitter::GetSignFromOp(const Value& op) { | ||
| 489 | return Inst<U1>(Opcode::GetSignFromOp, op); | ||
| 490 | } | ||
| 491 | |||
| 492 | U1 IREmitter::GetCarryFromOp(const Value& op) { | ||
| 493 | return Inst<U1>(Opcode::GetCarryFromOp, op); | ||
| 494 | } | ||
| 495 | |||
| 496 | U1 IREmitter::GetOverflowFromOp(const Value& op) { | ||
| 497 | return Inst<U1>(Opcode::GetOverflowFromOp, op); | ||
| 498 | } | ||
| 499 | |||
| 500 | U1 IREmitter::GetSparseFromOp(const Value& op) { | ||
| 501 | return Inst<U1>(Opcode::GetSparseFromOp, op); | ||
| 502 | } | ||
| 503 | |||
| 504 | U1 IREmitter::GetInBoundsFromOp(const Value& op) { | ||
| 505 | return Inst<U1>(Opcode::GetInBoundsFromOp, op); | ||
| 506 | } | ||
| 507 | |||
| 508 | F16F32F64 IREmitter::FPAdd(const F16F32F64& a, const F16F32F64& b, FpControl control) { | ||
| 509 | if (a.Type() != b.Type()) { | ||
| 510 | throw InvalidArgument("Mismatching types {} and {}", a.Type(), b.Type()); | ||
| 511 | } | ||
| 512 | switch (a.Type()) { | ||
| 513 | case Type::F16: | ||
| 514 | return Inst<F16>(Opcode::FPAdd16, Flags{control}, a, b); | ||
| 515 | case Type::F32: | ||
| 516 | return Inst<F32>(Opcode::FPAdd32, Flags{control}, a, b); | ||
| 517 | case Type::F64: | ||
| 518 | return Inst<F64>(Opcode::FPAdd64, Flags{control}, a, b); | ||
| 519 | default: | ||
| 520 | ThrowInvalidType(a.Type()); | ||
| 521 | } | ||
| 522 | } | ||
| 523 | |||
| 524 | Value IREmitter::CompositeConstruct(const Value& e1, const Value& e2) { | ||
| 525 | if (e1.Type() != e2.Type()) { | ||
| 526 | throw InvalidArgument("Mismatching types {} and {}", e1.Type(), e2.Type()); | ||
| 527 | } | ||
| 528 | switch (e1.Type()) { | ||
| 529 | case Type::U32: | ||
| 530 | return Inst(Opcode::CompositeConstructU32x2, e1, e2); | ||
| 531 | case Type::F16: | ||
| 532 | return Inst(Opcode::CompositeConstructF16x2, e1, e2); | ||
| 533 | case Type::F32: | ||
| 534 | return Inst(Opcode::CompositeConstructF32x2, e1, e2); | ||
| 535 | case Type::F64: | ||
| 536 | return Inst(Opcode::CompositeConstructF64x2, e1, e2); | ||
| 537 | default: | ||
| 538 | ThrowInvalidType(e1.Type()); | ||
| 539 | } | ||
| 540 | } | ||
| 541 | |||
| 542 | Value IREmitter::CompositeConstruct(const Value& e1, const Value& e2, const Value& e3) { | ||
| 543 | if (e1.Type() != e2.Type() || e1.Type() != e3.Type()) { | ||
| 544 | throw InvalidArgument("Mismatching types {}, {}, and {}", e1.Type(), e2.Type(), e3.Type()); | ||
| 545 | } | ||
| 546 | switch (e1.Type()) { | ||
| 547 | case Type::U32: | ||
| 548 | return Inst(Opcode::CompositeConstructU32x3, e1, e2, e3); | ||
| 549 | case Type::F16: | ||
| 550 | return Inst(Opcode::CompositeConstructF16x3, e1, e2, e3); | ||
| 551 | case Type::F32: | ||
| 552 | return Inst(Opcode::CompositeConstructF32x3, e1, e2, e3); | ||
| 553 | case Type::F64: | ||
| 554 | return Inst(Opcode::CompositeConstructF64x3, e1, e2, e3); | ||
| 555 | default: | ||
| 556 | ThrowInvalidType(e1.Type()); | ||
| 557 | } | ||
| 558 | } | ||
| 559 | |||
| 560 | Value IREmitter::CompositeConstruct(const Value& e1, const Value& e2, const Value& e3, | ||
| 561 | const Value& e4) { | ||
| 562 | if (e1.Type() != e2.Type() || e1.Type() != e3.Type() || e1.Type() != e4.Type()) { | ||
| 563 | throw InvalidArgument("Mismatching types {}, {}, {}, and {}", e1.Type(), e2.Type(), | ||
| 564 | e3.Type(), e4.Type()); | ||
| 565 | } | ||
| 566 | switch (e1.Type()) { | ||
| 567 | case Type::U32: | ||
| 568 | return Inst(Opcode::CompositeConstructU32x4, e1, e2, e3, e4); | ||
| 569 | case Type::F16: | ||
| 570 | return Inst(Opcode::CompositeConstructF16x4, e1, e2, e3, e4); | ||
| 571 | case Type::F32: | ||
| 572 | return Inst(Opcode::CompositeConstructF32x4, e1, e2, e3, e4); | ||
| 573 | case Type::F64: | ||
| 574 | return Inst(Opcode::CompositeConstructF64x4, e1, e2, e3, e4); | ||
| 575 | default: | ||
| 576 | ThrowInvalidType(e1.Type()); | ||
| 577 | } | ||
| 578 | } | ||
| 579 | |||
| 580 | Value IREmitter::CompositeExtract(const Value& vector, size_t element) { | ||
| 581 | const auto read{[&](Opcode opcode, size_t limit) -> Value { | ||
| 582 | if (element >= limit) { | ||
| 583 | throw InvalidArgument("Out of bounds element {}", element); | ||
| 584 | } | ||
| 585 | return Inst(opcode, vector, Value{static_cast<u32>(element)}); | ||
| 586 | }}; | ||
| 587 | switch (vector.Type()) { | ||
| 588 | case Type::U32x2: | ||
| 589 | return read(Opcode::CompositeExtractU32x2, 2); | ||
| 590 | case Type::U32x3: | ||
| 591 | return read(Opcode::CompositeExtractU32x3, 3); | ||
| 592 | case Type::U32x4: | ||
| 593 | return read(Opcode::CompositeExtractU32x4, 4); | ||
| 594 | case Type::F16x2: | ||
| 595 | return read(Opcode::CompositeExtractF16x2, 2); | ||
| 596 | case Type::F16x3: | ||
| 597 | return read(Opcode::CompositeExtractF16x3, 3); | ||
| 598 | case Type::F16x4: | ||
| 599 | return read(Opcode::CompositeExtractF16x4, 4); | ||
| 600 | case Type::F32x2: | ||
| 601 | return read(Opcode::CompositeExtractF32x2, 2); | ||
| 602 | case Type::F32x3: | ||
| 603 | return read(Opcode::CompositeExtractF32x3, 3); | ||
| 604 | case Type::F32x4: | ||
| 605 | return read(Opcode::CompositeExtractF32x4, 4); | ||
| 606 | case Type::F64x2: | ||
| 607 | return read(Opcode::CompositeExtractF64x2, 2); | ||
| 608 | case Type::F64x3: | ||
| 609 | return read(Opcode::CompositeExtractF64x3, 3); | ||
| 610 | case Type::F64x4: | ||
| 611 | return read(Opcode::CompositeExtractF64x4, 4); | ||
| 612 | default: | ||
| 613 | ThrowInvalidType(vector.Type()); | ||
| 614 | } | ||
| 615 | } | ||
| 616 | |||
| 617 | Value IREmitter::CompositeInsert(const Value& vector, const Value& object, size_t element) { | ||
| 618 | const auto insert{[&](Opcode opcode, size_t limit) { | ||
| 619 | if (element >= limit) { | ||
| 620 | throw InvalidArgument("Out of bounds element {}", element); | ||
| 621 | } | ||
| 622 | return Inst(opcode, vector, object, Value{static_cast<u32>(element)}); | ||
| 623 | }}; | ||
| 624 | switch (vector.Type()) { | ||
| 625 | case Type::U32x2: | ||
| 626 | return insert(Opcode::CompositeInsertU32x2, 2); | ||
| 627 | case Type::U32x3: | ||
| 628 | return insert(Opcode::CompositeInsertU32x3, 3); | ||
| 629 | case Type::U32x4: | ||
| 630 | return insert(Opcode::CompositeInsertU32x4, 4); | ||
| 631 | case Type::F16x2: | ||
| 632 | return insert(Opcode::CompositeInsertF16x2, 2); | ||
| 633 | case Type::F16x3: | ||
| 634 | return insert(Opcode::CompositeInsertF16x3, 3); | ||
| 635 | case Type::F16x4: | ||
| 636 | return insert(Opcode::CompositeInsertF16x4, 4); | ||
| 637 | case Type::F32x2: | ||
| 638 | return insert(Opcode::CompositeInsertF32x2, 2); | ||
| 639 | case Type::F32x3: | ||
| 640 | return insert(Opcode::CompositeInsertF32x3, 3); | ||
| 641 | case Type::F32x4: | ||
| 642 | return insert(Opcode::CompositeInsertF32x4, 4); | ||
| 643 | case Type::F64x2: | ||
| 644 | return insert(Opcode::CompositeInsertF64x2, 2); | ||
| 645 | case Type::F64x3: | ||
| 646 | return insert(Opcode::CompositeInsertF64x3, 3); | ||
| 647 | case Type::F64x4: | ||
| 648 | return insert(Opcode::CompositeInsertF64x4, 4); | ||
| 649 | default: | ||
| 650 | ThrowInvalidType(vector.Type()); | ||
| 651 | } | ||
| 652 | } | ||
| 653 | |||
| 654 | Value IREmitter::Select(const U1& condition, const Value& true_value, const Value& false_value) { | ||
| 655 | if (true_value.Type() != false_value.Type()) { | ||
| 656 | throw InvalidArgument("Mismatching types {} and {}", true_value.Type(), false_value.Type()); | ||
| 657 | } | ||
| 658 | switch (true_value.Type()) { | ||
| 659 | case Type::U1: | ||
| 660 | return Inst(Opcode::SelectU1, condition, true_value, false_value); | ||
| 661 | case Type::U8: | ||
| 662 | return Inst(Opcode::SelectU8, condition, true_value, false_value); | ||
| 663 | case Type::U16: | ||
| 664 | return Inst(Opcode::SelectU16, condition, true_value, false_value); | ||
| 665 | case Type::U32: | ||
| 666 | return Inst(Opcode::SelectU32, condition, true_value, false_value); | ||
| 667 | case Type::U64: | ||
| 668 | return Inst(Opcode::SelectU64, condition, true_value, false_value); | ||
| 669 | case Type::F32: | ||
| 670 | return Inst(Opcode::SelectF32, condition, true_value, false_value); | ||
| 671 | case Type::F64: | ||
| 672 | return Inst(Opcode::SelectF64, condition, true_value, false_value); | ||
| 673 | default: | ||
| 674 | throw InvalidArgument("Invalid type {}", true_value.Type()); | ||
| 675 | } | ||
| 676 | } | ||
| 677 | |||
| 678 | template <> | ||
| 679 | IR::U32 IREmitter::BitCast<IR::U32, IR::F32>(const IR::F32& value) { | ||
| 680 | return Inst<IR::U32>(Opcode::BitCastU32F32, value); | ||
| 681 | } | ||
| 682 | |||
| 683 | template <> | ||
| 684 | IR::F32 IREmitter::BitCast<IR::F32, IR::U32>(const IR::U32& value) { | ||
| 685 | return Inst<IR::F32>(Opcode::BitCastF32U32, value); | ||
| 686 | } | ||
| 687 | |||
| 688 | template <> | ||
| 689 | IR::U16 IREmitter::BitCast<IR::U16, IR::F16>(const IR::F16& value) { | ||
| 690 | return Inst<IR::U16>(Opcode::BitCastU16F16, value); | ||
| 691 | } | ||
| 692 | |||
| 693 | template <> | ||
| 694 | IR::F16 IREmitter::BitCast<IR::F16, IR::U16>(const IR::U16& value) { | ||
| 695 | return Inst<IR::F16>(Opcode::BitCastF16U16, value); | ||
| 696 | } | ||
| 697 | |||
| 698 | template <> | ||
| 699 | IR::U64 IREmitter::BitCast<IR::U64, IR::F64>(const IR::F64& value) { | ||
| 700 | return Inst<IR::U64>(Opcode::BitCastU64F64, value); | ||
| 701 | } | ||
| 702 | |||
| 703 | template <> | ||
| 704 | IR::F64 IREmitter::BitCast<IR::F64, IR::U64>(const IR::U64& value) { | ||
| 705 | return Inst<IR::F64>(Opcode::BitCastF64U64, value); | ||
| 706 | } | ||
| 707 | |||
| 708 | U64 IREmitter::PackUint2x32(const Value& vector) { | ||
| 709 | return Inst<U64>(Opcode::PackUint2x32, vector); | ||
| 710 | } | ||
| 711 | |||
| 712 | Value IREmitter::UnpackUint2x32(const U64& value) { | ||
| 713 | return Inst<Value>(Opcode::UnpackUint2x32, value); | ||
| 714 | } | ||
| 715 | |||
| 716 | U32 IREmitter::PackFloat2x16(const Value& vector) { | ||
| 717 | return Inst<U32>(Opcode::PackFloat2x16, vector); | ||
| 718 | } | ||
| 719 | |||
| 720 | Value IREmitter::UnpackFloat2x16(const U32& value) { | ||
| 721 | return Inst(Opcode::UnpackFloat2x16, value); | ||
| 722 | } | ||
| 723 | |||
| 724 | U32 IREmitter::PackHalf2x16(const Value& vector) { | ||
| 725 | return Inst<U32>(Opcode::PackHalf2x16, vector); | ||
| 726 | } | ||
| 727 | |||
| 728 | Value IREmitter::UnpackHalf2x16(const U32& value) { | ||
| 729 | return Inst(Opcode::UnpackHalf2x16, value); | ||
| 730 | } | ||
| 731 | |||
| 732 | F64 IREmitter::PackDouble2x32(const Value& vector) { | ||
| 733 | return Inst<F64>(Opcode::PackDouble2x32, vector); | ||
| 734 | } | ||
| 735 | |||
| 736 | Value IREmitter::UnpackDouble2x32(const F64& value) { | ||
| 737 | return Inst<Value>(Opcode::UnpackDouble2x32, value); | ||
| 738 | } | ||
| 739 | |||
| 740 | F16F32F64 IREmitter::FPMul(const F16F32F64& a, const F16F32F64& b, FpControl control) { | ||
| 741 | if (a.Type() != b.Type()) { | ||
| 742 | throw InvalidArgument("Mismatching types {} and {}", a.Type(), b.Type()); | ||
| 743 | } | ||
| 744 | switch (a.Type()) { | ||
| 745 | case Type::F16: | ||
| 746 | return Inst<F16>(Opcode::FPMul16, Flags{control}, a, b); | ||
| 747 | case Type::F32: | ||
| 748 | return Inst<F32>(Opcode::FPMul32, Flags{control}, a, b); | ||
| 749 | case Type::F64: | ||
| 750 | return Inst<F64>(Opcode::FPMul64, Flags{control}, a, b); | ||
| 751 | default: | ||
| 752 | ThrowInvalidType(a.Type()); | ||
| 753 | } | ||
| 754 | } | ||
| 755 | |||
| 756 | F16F32F64 IREmitter::FPFma(const F16F32F64& a, const F16F32F64& b, const F16F32F64& c, | ||
| 757 | FpControl control) { | ||
| 758 | if (a.Type() != b.Type() || a.Type() != c.Type()) { | ||
| 759 | throw InvalidArgument("Mismatching types {}, {}, and {}", a.Type(), b.Type(), c.Type()); | ||
| 760 | } | ||
| 761 | switch (a.Type()) { | ||
| 762 | case Type::F16: | ||
| 763 | return Inst<F16>(Opcode::FPFma16, Flags{control}, a, b, c); | ||
| 764 | case Type::F32: | ||
| 765 | return Inst<F32>(Opcode::FPFma32, Flags{control}, a, b, c); | ||
| 766 | case Type::F64: | ||
| 767 | return Inst<F64>(Opcode::FPFma64, Flags{control}, a, b, c); | ||
| 768 | default: | ||
| 769 | ThrowInvalidType(a.Type()); | ||
| 770 | } | ||
| 771 | } | ||
| 772 | |||
| 773 | F16F32F64 IREmitter::FPAbs(const F16F32F64& value) { | ||
| 774 | switch (value.Type()) { | ||
| 775 | case Type::F16: | ||
| 776 | return Inst<F16>(Opcode::FPAbs16, value); | ||
| 777 | case Type::F32: | ||
| 778 | return Inst<F32>(Opcode::FPAbs32, value); | ||
| 779 | case Type::F64: | ||
| 780 | return Inst<F64>(Opcode::FPAbs64, value); | ||
| 781 | default: | ||
| 782 | ThrowInvalidType(value.Type()); | ||
| 783 | } | ||
| 784 | } | ||
| 785 | |||
| 786 | F16F32F64 IREmitter::FPNeg(const F16F32F64& value) { | ||
| 787 | switch (value.Type()) { | ||
| 788 | case Type::F16: | ||
| 789 | return Inst<F16>(Opcode::FPNeg16, value); | ||
| 790 | case Type::F32: | ||
| 791 | return Inst<F32>(Opcode::FPNeg32, value); | ||
| 792 | case Type::F64: | ||
| 793 | return Inst<F64>(Opcode::FPNeg64, value); | ||
| 794 | default: | ||
| 795 | ThrowInvalidType(value.Type()); | ||
| 796 | } | ||
| 797 | } | ||
| 798 | |||
| 799 | F16F32F64 IREmitter::FPAbsNeg(const F16F32F64& value, bool abs, bool neg) { | ||
| 800 | F16F32F64 result{value}; | ||
| 801 | if (abs) { | ||
| 802 | result = FPAbs(result); | ||
| 803 | } | ||
| 804 | if (neg) { | ||
| 805 | result = FPNeg(result); | ||
| 806 | } | ||
| 807 | return result; | ||
| 808 | } | ||
| 809 | |||
| 810 | F32 IREmitter::FPCos(const F32& value) { | ||
| 811 | return Inst<F32>(Opcode::FPCos, value); | ||
| 812 | } | ||
| 813 | |||
| 814 | F32 IREmitter::FPSin(const F32& value) { | ||
| 815 | return Inst<F32>(Opcode::FPSin, value); | ||
| 816 | } | ||
| 817 | |||
| 818 | F32 IREmitter::FPExp2(const F32& value) { | ||
| 819 | return Inst<F32>(Opcode::FPExp2, value); | ||
| 820 | } | ||
| 821 | |||
| 822 | F32 IREmitter::FPLog2(const F32& value) { | ||
| 823 | return Inst<F32>(Opcode::FPLog2, value); | ||
| 824 | } | ||
| 825 | |||
| 826 | F32F64 IREmitter::FPRecip(const F32F64& value) { | ||
| 827 | switch (value.Type()) { | ||
| 828 | case Type::F32: | ||
| 829 | return Inst<F32>(Opcode::FPRecip32, value); | ||
| 830 | case Type::F64: | ||
| 831 | return Inst<F64>(Opcode::FPRecip64, value); | ||
| 832 | default: | ||
| 833 | ThrowInvalidType(value.Type()); | ||
| 834 | } | ||
| 835 | } | ||
| 836 | |||
| 837 | F32F64 IREmitter::FPRecipSqrt(const F32F64& value) { | ||
| 838 | switch (value.Type()) { | ||
| 839 | case Type::F32: | ||
| 840 | return Inst<F32>(Opcode::FPRecipSqrt32, value); | ||
| 841 | case Type::F64: | ||
| 842 | return Inst<F64>(Opcode::FPRecipSqrt64, value); | ||
| 843 | default: | ||
| 844 | ThrowInvalidType(value.Type()); | ||
| 845 | } | ||
| 846 | } | ||
| 847 | |||
| 848 | F32 IREmitter::FPSqrt(const F32& value) { | ||
| 849 | return Inst<F32>(Opcode::FPSqrt, value); | ||
| 850 | } | ||
| 851 | |||
| 852 | F16F32F64 IREmitter::FPSaturate(const F16F32F64& value) { | ||
| 853 | switch (value.Type()) { | ||
| 854 | case Type::F16: | ||
| 855 | return Inst<F16>(Opcode::FPSaturate16, value); | ||
| 856 | case Type::F32: | ||
| 857 | return Inst<F32>(Opcode::FPSaturate32, value); | ||
| 858 | case Type::F64: | ||
| 859 | return Inst<F64>(Opcode::FPSaturate64, value); | ||
| 860 | default: | ||
| 861 | ThrowInvalidType(value.Type()); | ||
| 862 | } | ||
| 863 | } | ||
| 864 | |||
| 865 | F16F32F64 IREmitter::FPClamp(const F16F32F64& value, const F16F32F64& min_value, | ||
| 866 | const F16F32F64& max_value) { | ||
| 867 | if (value.Type() != min_value.Type() || value.Type() != max_value.Type()) { | ||
| 868 | throw InvalidArgument("Mismatching types {}, {}, and {}", value.Type(), min_value.Type(), | ||
| 869 | max_value.Type()); | ||
| 870 | } | ||
| 871 | switch (value.Type()) { | ||
| 872 | case Type::F16: | ||
| 873 | return Inst<F16>(Opcode::FPClamp16, value, min_value, max_value); | ||
| 874 | case Type::F32: | ||
| 875 | return Inst<F32>(Opcode::FPClamp32, value, min_value, max_value); | ||
| 876 | case Type::F64: | ||
| 877 | return Inst<F64>(Opcode::FPClamp64, value, min_value, max_value); | ||
| 878 | default: | ||
| 879 | ThrowInvalidType(value.Type()); | ||
| 880 | } | ||
| 881 | } | ||
| 882 | |||
| 883 | F16F32F64 IREmitter::FPRoundEven(const F16F32F64& value, FpControl control) { | ||
| 884 | switch (value.Type()) { | ||
| 885 | case Type::F16: | ||
| 886 | return Inst<F16>(Opcode::FPRoundEven16, Flags{control}, value); | ||
| 887 | case Type::F32: | ||
| 888 | return Inst<F32>(Opcode::FPRoundEven32, Flags{control}, value); | ||
| 889 | case Type::F64: | ||
| 890 | return Inst<F64>(Opcode::FPRoundEven64, Flags{control}, value); | ||
| 891 | default: | ||
| 892 | ThrowInvalidType(value.Type()); | ||
| 893 | } | ||
| 894 | } | ||
| 895 | |||
| 896 | F16F32F64 IREmitter::FPFloor(const F16F32F64& value, FpControl control) { | ||
| 897 | switch (value.Type()) { | ||
| 898 | case Type::F16: | ||
| 899 | return Inst<F16>(Opcode::FPFloor16, Flags{control}, value); | ||
| 900 | case Type::F32: | ||
| 901 | return Inst<F32>(Opcode::FPFloor32, Flags{control}, value); | ||
| 902 | case Type::F64: | ||
| 903 | return Inst<F64>(Opcode::FPFloor64, Flags{control}, value); | ||
| 904 | default: | ||
| 905 | ThrowInvalidType(value.Type()); | ||
| 906 | } | ||
| 907 | } | ||
| 908 | |||
| 909 | F16F32F64 IREmitter::FPCeil(const F16F32F64& value, FpControl control) { | ||
| 910 | switch (value.Type()) { | ||
| 911 | case Type::F16: | ||
| 912 | return Inst<F16>(Opcode::FPCeil16, Flags{control}, value); | ||
| 913 | case Type::F32: | ||
| 914 | return Inst<F32>(Opcode::FPCeil32, Flags{control}, value); | ||
| 915 | case Type::F64: | ||
| 916 | return Inst<F64>(Opcode::FPCeil64, Flags{control}, value); | ||
| 917 | default: | ||
| 918 | ThrowInvalidType(value.Type()); | ||
| 919 | } | ||
| 920 | } | ||
| 921 | |||
| 922 | F16F32F64 IREmitter::FPTrunc(const F16F32F64& value, FpControl control) { | ||
| 923 | switch (value.Type()) { | ||
| 924 | case Type::F16: | ||
| 925 | return Inst<F16>(Opcode::FPTrunc16, Flags{control}, value); | ||
| 926 | case Type::F32: | ||
| 927 | return Inst<F32>(Opcode::FPTrunc32, Flags{control}, value); | ||
| 928 | case Type::F64: | ||
| 929 | return Inst<F64>(Opcode::FPTrunc64, Flags{control}, value); | ||
| 930 | default: | ||
| 931 | ThrowInvalidType(value.Type()); | ||
| 932 | } | ||
| 933 | } | ||
| 934 | |||
| 935 | U1 IREmitter::FPEqual(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, bool ordered) { | ||
| 936 | if (lhs.Type() != rhs.Type()) { | ||
| 937 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 938 | } | ||
| 939 | switch (lhs.Type()) { | ||
| 940 | case Type::F16: | ||
| 941 | return Inst<U1>(ordered ? Opcode::FPOrdEqual16 : Opcode::FPUnordEqual16, Flags{control}, | ||
| 942 | lhs, rhs); | ||
| 943 | case Type::F32: | ||
| 944 | return Inst<U1>(ordered ? Opcode::FPOrdEqual32 : Opcode::FPUnordEqual32, Flags{control}, | ||
| 945 | lhs, rhs); | ||
| 946 | case Type::F64: | ||
| 947 | return Inst<U1>(ordered ? Opcode::FPOrdEqual64 : Opcode::FPUnordEqual64, Flags{control}, | ||
| 948 | lhs, rhs); | ||
| 949 | default: | ||
| 950 | ThrowInvalidType(lhs.Type()); | ||
| 951 | } | ||
| 952 | } | ||
| 953 | |||
| 954 | U1 IREmitter::FPNotEqual(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, | ||
| 955 | bool ordered) { | ||
| 956 | if (lhs.Type() != rhs.Type()) { | ||
| 957 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 958 | } | ||
| 959 | switch (lhs.Type()) { | ||
| 960 | case Type::F16: | ||
| 961 | return Inst<U1>(ordered ? Opcode::FPOrdNotEqual16 : Opcode::FPUnordNotEqual16, | ||
| 962 | Flags{control}, lhs, rhs); | ||
| 963 | case Type::F32: | ||
| 964 | return Inst<U1>(ordered ? Opcode::FPOrdNotEqual32 : Opcode::FPUnordNotEqual32, | ||
| 965 | Flags{control}, lhs, rhs); | ||
| 966 | case Type::F64: | ||
| 967 | return Inst<U1>(ordered ? Opcode::FPOrdNotEqual64 : Opcode::FPUnordNotEqual64, | ||
| 968 | Flags{control}, lhs, rhs); | ||
| 969 | default: | ||
| 970 | ThrowInvalidType(lhs.Type()); | ||
| 971 | } | ||
| 972 | } | ||
| 973 | |||
| 974 | U1 IREmitter::FPLessThan(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, | ||
| 975 | bool ordered) { | ||
| 976 | if (lhs.Type() != rhs.Type()) { | ||
| 977 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 978 | } | ||
| 979 | switch (lhs.Type()) { | ||
| 980 | case Type::F16: | ||
| 981 | return Inst<U1>(ordered ? Opcode::FPOrdLessThan16 : Opcode::FPUnordLessThan16, | ||
| 982 | Flags{control}, lhs, rhs); | ||
| 983 | case Type::F32: | ||
| 984 | return Inst<U1>(ordered ? Opcode::FPOrdLessThan32 : Opcode::FPUnordLessThan32, | ||
| 985 | Flags{control}, lhs, rhs); | ||
| 986 | case Type::F64: | ||
| 987 | return Inst<U1>(ordered ? Opcode::FPOrdLessThan64 : Opcode::FPUnordLessThan64, | ||
| 988 | Flags{control}, lhs, rhs); | ||
| 989 | default: | ||
| 990 | ThrowInvalidType(lhs.Type()); | ||
| 991 | } | ||
| 992 | } | ||
| 993 | |||
| 994 | U1 IREmitter::FPGreaterThan(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, | ||
| 995 | bool ordered) { | ||
| 996 | if (lhs.Type() != rhs.Type()) { | ||
| 997 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 998 | } | ||
| 999 | switch (lhs.Type()) { | ||
| 1000 | case Type::F16: | ||
| 1001 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThan16 : Opcode::FPUnordGreaterThan16, | ||
| 1002 | Flags{control}, lhs, rhs); | ||
| 1003 | case Type::F32: | ||
| 1004 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThan32 : Opcode::FPUnordGreaterThan32, | ||
| 1005 | Flags{control}, lhs, rhs); | ||
| 1006 | case Type::F64: | ||
| 1007 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThan64 : Opcode::FPUnordGreaterThan64, | ||
| 1008 | Flags{control}, lhs, rhs); | ||
| 1009 | default: | ||
| 1010 | ThrowInvalidType(lhs.Type()); | ||
| 1011 | } | ||
| 1012 | } | ||
| 1013 | |||
| 1014 | U1 IREmitter::FPLessThanEqual(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, | ||
| 1015 | bool ordered) { | ||
| 1016 | if (lhs.Type() != rhs.Type()) { | ||
| 1017 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1018 | } | ||
| 1019 | switch (lhs.Type()) { | ||
| 1020 | case Type::F16: | ||
| 1021 | return Inst<U1>(ordered ? Opcode::FPOrdLessThanEqual16 : Opcode::FPUnordLessThanEqual16, | ||
| 1022 | Flags{control}, lhs, rhs); | ||
| 1023 | case Type::F32: | ||
| 1024 | return Inst<U1>(ordered ? Opcode::FPOrdLessThanEqual32 : Opcode::FPUnordLessThanEqual32, | ||
| 1025 | Flags{control}, lhs, rhs); | ||
| 1026 | case Type::F64: | ||
| 1027 | return Inst<U1>(ordered ? Opcode::FPOrdLessThanEqual64 : Opcode::FPUnordLessThanEqual64, | ||
| 1028 | Flags{control}, lhs, rhs); | ||
| 1029 | default: | ||
| 1030 | ThrowInvalidType(lhs.Type()); | ||
| 1031 | } | ||
| 1032 | } | ||
| 1033 | |||
| 1034 | U1 IREmitter::FPGreaterThanEqual(const F16F32F64& lhs, const F16F32F64& rhs, FpControl control, | ||
| 1035 | bool ordered) { | ||
| 1036 | if (lhs.Type() != rhs.Type()) { | ||
| 1037 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1038 | } | ||
| 1039 | switch (lhs.Type()) { | ||
| 1040 | case Type::F16: | ||
| 1041 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThanEqual16 | ||
| 1042 | : Opcode::FPUnordGreaterThanEqual16, | ||
| 1043 | Flags{control}, lhs, rhs); | ||
| 1044 | case Type::F32: | ||
| 1045 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThanEqual32 | ||
| 1046 | : Opcode::FPUnordGreaterThanEqual32, | ||
| 1047 | Flags{control}, lhs, rhs); | ||
| 1048 | case Type::F64: | ||
| 1049 | return Inst<U1>(ordered ? Opcode::FPOrdGreaterThanEqual64 | ||
| 1050 | : Opcode::FPUnordGreaterThanEqual64, | ||
| 1051 | Flags{control}, lhs, rhs); | ||
| 1052 | default: | ||
| 1053 | ThrowInvalidType(lhs.Type()); | ||
| 1054 | } | ||
| 1055 | } | ||
| 1056 | |||
| 1057 | U1 IREmitter::FPIsNan(const F16F32F64& value) { | ||
| 1058 | switch (value.Type()) { | ||
| 1059 | case Type::F16: | ||
| 1060 | return Inst<U1>(Opcode::FPIsNan16, value); | ||
| 1061 | case Type::F32: | ||
| 1062 | return Inst<U1>(Opcode::FPIsNan32, value); | ||
| 1063 | case Type::F64: | ||
| 1064 | return Inst<U1>(Opcode::FPIsNan64, value); | ||
| 1065 | default: | ||
| 1066 | ThrowInvalidType(value.Type()); | ||
| 1067 | } | ||
| 1068 | } | ||
| 1069 | |||
| 1070 | U1 IREmitter::FPOrdered(const F16F32F64& lhs, const F16F32F64& rhs) { | ||
| 1071 | if (lhs.Type() != rhs.Type()) { | ||
| 1072 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1073 | } | ||
| 1074 | return LogicalAnd(LogicalNot(FPIsNan(lhs)), LogicalNot(FPIsNan(rhs))); | ||
| 1075 | } | ||
| 1076 | |||
| 1077 | U1 IREmitter::FPUnordered(const F16F32F64& lhs, const F16F32F64& rhs) { | ||
| 1078 | if (lhs.Type() != rhs.Type()) { | ||
| 1079 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1080 | } | ||
| 1081 | return LogicalOr(FPIsNan(lhs), FPIsNan(rhs)); | ||
| 1082 | } | ||
| 1083 | |||
| 1084 | F32F64 IREmitter::FPMax(const F32F64& lhs, const F32F64& rhs, FpControl control) { | ||
| 1085 | if (lhs.Type() != rhs.Type()) { | ||
| 1086 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1087 | } | ||
| 1088 | switch (lhs.Type()) { | ||
| 1089 | case Type::F32: | ||
| 1090 | return Inst<F32>(Opcode::FPMax32, Flags{control}, lhs, rhs); | ||
| 1091 | case Type::F64: | ||
| 1092 | return Inst<F64>(Opcode::FPMax64, Flags{control}, lhs, rhs); | ||
| 1093 | default: | ||
| 1094 | ThrowInvalidType(lhs.Type()); | ||
| 1095 | } | ||
| 1096 | } | ||
| 1097 | |||
| 1098 | F32F64 IREmitter::FPMin(const F32F64& lhs, const F32F64& rhs, FpControl control) { | ||
| 1099 | if (lhs.Type() != rhs.Type()) { | ||
| 1100 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1101 | } | ||
| 1102 | switch (lhs.Type()) { | ||
| 1103 | case Type::F32: | ||
| 1104 | return Inst<F32>(Opcode::FPMin32, Flags{control}, lhs, rhs); | ||
| 1105 | case Type::F64: | ||
| 1106 | return Inst<F64>(Opcode::FPMin64, Flags{control}, lhs, rhs); | ||
| 1107 | default: | ||
| 1108 | ThrowInvalidType(lhs.Type()); | ||
| 1109 | } | ||
| 1110 | } | ||
| 1111 | |||
| 1112 | U32U64 IREmitter::IAdd(const U32U64& a, const U32U64& b) { | ||
| 1113 | if (a.Type() != b.Type()) { | ||
| 1114 | throw InvalidArgument("Mismatching types {} and {}", a.Type(), b.Type()); | ||
| 1115 | } | ||
| 1116 | switch (a.Type()) { | ||
| 1117 | case Type::U32: | ||
| 1118 | return Inst<U32>(Opcode::IAdd32, a, b); | ||
| 1119 | case Type::U64: | ||
| 1120 | return Inst<U64>(Opcode::IAdd64, a, b); | ||
| 1121 | default: | ||
| 1122 | ThrowInvalidType(a.Type()); | ||
| 1123 | } | ||
| 1124 | } | ||
| 1125 | |||
| 1126 | U32U64 IREmitter::ISub(const U32U64& a, const U32U64& b) { | ||
| 1127 | if (a.Type() != b.Type()) { | ||
| 1128 | throw InvalidArgument("Mismatching types {} and {}", a.Type(), b.Type()); | ||
| 1129 | } | ||
| 1130 | switch (a.Type()) { | ||
| 1131 | case Type::U32: | ||
| 1132 | return Inst<U32>(Opcode::ISub32, a, b); | ||
| 1133 | case Type::U64: | ||
| 1134 | return Inst<U64>(Opcode::ISub64, a, b); | ||
| 1135 | default: | ||
| 1136 | ThrowInvalidType(a.Type()); | ||
| 1137 | } | ||
| 1138 | } | ||
| 1139 | |||
| 1140 | U32 IREmitter::IMul(const U32& a, const U32& b) { | ||
| 1141 | return Inst<U32>(Opcode::IMul32, a, b); | ||
| 1142 | } | ||
| 1143 | |||
| 1144 | U32U64 IREmitter::INeg(const U32U64& value) { | ||
| 1145 | switch (value.Type()) { | ||
| 1146 | case Type::U32: | ||
| 1147 | return Inst<U32>(Opcode::INeg32, value); | ||
| 1148 | case Type::U64: | ||
| 1149 | return Inst<U64>(Opcode::INeg64, value); | ||
| 1150 | default: | ||
| 1151 | ThrowInvalidType(value.Type()); | ||
| 1152 | } | ||
| 1153 | } | ||
| 1154 | |||
| 1155 | U32 IREmitter::IAbs(const U32& value) { | ||
| 1156 | return Inst<U32>(Opcode::IAbs32, value); | ||
| 1157 | } | ||
| 1158 | |||
| 1159 | U32U64 IREmitter::ShiftLeftLogical(const U32U64& base, const U32& shift) { | ||
| 1160 | switch (base.Type()) { | ||
| 1161 | case Type::U32: | ||
| 1162 | return Inst<U32>(Opcode::ShiftLeftLogical32, base, shift); | ||
| 1163 | case Type::U64: | ||
| 1164 | return Inst<U64>(Opcode::ShiftLeftLogical64, base, shift); | ||
| 1165 | default: | ||
| 1166 | ThrowInvalidType(base.Type()); | ||
| 1167 | } | ||
| 1168 | } | ||
| 1169 | |||
| 1170 | U32U64 IREmitter::ShiftRightLogical(const U32U64& base, const U32& shift) { | ||
| 1171 | switch (base.Type()) { | ||
| 1172 | case Type::U32: | ||
| 1173 | return Inst<U32>(Opcode::ShiftRightLogical32, base, shift); | ||
| 1174 | case Type::U64: | ||
| 1175 | return Inst<U64>(Opcode::ShiftRightLogical64, base, shift); | ||
| 1176 | default: | ||
| 1177 | ThrowInvalidType(base.Type()); | ||
| 1178 | } | ||
| 1179 | } | ||
| 1180 | |||
| 1181 | U32U64 IREmitter::ShiftRightArithmetic(const U32U64& base, const U32& shift) { | ||
| 1182 | switch (base.Type()) { | ||
| 1183 | case Type::U32: | ||
| 1184 | return Inst<U32>(Opcode::ShiftRightArithmetic32, base, shift); | ||
| 1185 | case Type::U64: | ||
| 1186 | return Inst<U64>(Opcode::ShiftRightArithmetic64, base, shift); | ||
| 1187 | default: | ||
| 1188 | ThrowInvalidType(base.Type()); | ||
| 1189 | } | ||
| 1190 | } | ||
| 1191 | |||
| 1192 | U32 IREmitter::BitwiseAnd(const U32& a, const U32& b) { | ||
| 1193 | return Inst<U32>(Opcode::BitwiseAnd32, a, b); | ||
| 1194 | } | ||
| 1195 | |||
| 1196 | U32 IREmitter::BitwiseOr(const U32& a, const U32& b) { | ||
| 1197 | return Inst<U32>(Opcode::BitwiseOr32, a, b); | ||
| 1198 | } | ||
| 1199 | |||
| 1200 | U32 IREmitter::BitwiseXor(const U32& a, const U32& b) { | ||
| 1201 | return Inst<U32>(Opcode::BitwiseXor32, a, b); | ||
| 1202 | } | ||
| 1203 | |||
| 1204 | U32 IREmitter::BitFieldInsert(const U32& base, const U32& insert, const U32& offset, | ||
| 1205 | const U32& count) { | ||
| 1206 | return Inst<U32>(Opcode::BitFieldInsert, base, insert, offset, count); | ||
| 1207 | } | ||
| 1208 | |||
| 1209 | U32 IREmitter::BitFieldExtract(const U32& base, const U32& offset, const U32& count, | ||
| 1210 | bool is_signed) { | ||
| 1211 | return Inst<U32>(is_signed ? Opcode::BitFieldSExtract : Opcode::BitFieldUExtract, base, offset, | ||
| 1212 | count); | ||
| 1213 | } | ||
| 1214 | |||
| 1215 | U32 IREmitter::BitReverse(const U32& value) { | ||
| 1216 | return Inst<U32>(Opcode::BitReverse32, value); | ||
| 1217 | } | ||
| 1218 | |||
| 1219 | U32 IREmitter::BitCount(const U32& value) { | ||
| 1220 | return Inst<U32>(Opcode::BitCount32, value); | ||
| 1221 | } | ||
| 1222 | |||
| 1223 | U32 IREmitter::BitwiseNot(const U32& value) { | ||
| 1224 | return Inst<U32>(Opcode::BitwiseNot32, value); | ||
| 1225 | } | ||
| 1226 | |||
| 1227 | U32 IREmitter::FindSMsb(const U32& value) { | ||
| 1228 | return Inst<U32>(Opcode::FindSMsb32, value); | ||
| 1229 | } | ||
| 1230 | |||
| 1231 | U32 IREmitter::FindUMsb(const U32& value) { | ||
| 1232 | return Inst<U32>(Opcode::FindUMsb32, value); | ||
| 1233 | } | ||
| 1234 | |||
| 1235 | U32 IREmitter::SMin(const U32& a, const U32& b) { | ||
| 1236 | return Inst<U32>(Opcode::SMin32, a, b); | ||
| 1237 | } | ||
| 1238 | |||
| 1239 | U32 IREmitter::UMin(const U32& a, const U32& b) { | ||
| 1240 | return Inst<U32>(Opcode::UMin32, a, b); | ||
| 1241 | } | ||
| 1242 | |||
| 1243 | U32 IREmitter::IMin(const U32& a, const U32& b, bool is_signed) { | ||
| 1244 | return is_signed ? SMin(a, b) : UMin(a, b); | ||
| 1245 | } | ||
| 1246 | |||
| 1247 | U32 IREmitter::SMax(const U32& a, const U32& b) { | ||
| 1248 | return Inst<U32>(Opcode::SMax32, a, b); | ||
| 1249 | } | ||
| 1250 | |||
| 1251 | U32 IREmitter::UMax(const U32& a, const U32& b) { | ||
| 1252 | return Inst<U32>(Opcode::UMax32, a, b); | ||
| 1253 | } | ||
| 1254 | |||
| 1255 | U32 IREmitter::IMax(const U32& a, const U32& b, bool is_signed) { | ||
| 1256 | return is_signed ? SMax(a, b) : UMax(a, b); | ||
| 1257 | } | ||
| 1258 | |||
| 1259 | U32 IREmitter::SClamp(const U32& value, const U32& min, const U32& max) { | ||
| 1260 | return Inst<U32>(Opcode::SClamp32, value, min, max); | ||
| 1261 | } | ||
| 1262 | |||
| 1263 | U32 IREmitter::UClamp(const U32& value, const U32& min, const U32& max) { | ||
| 1264 | return Inst<U32>(Opcode::UClamp32, value, min, max); | ||
| 1265 | } | ||
| 1266 | |||
| 1267 | U1 IREmitter::ILessThan(const U32& lhs, const U32& rhs, bool is_signed) { | ||
| 1268 | return Inst<U1>(is_signed ? Opcode::SLessThan : Opcode::ULessThan, lhs, rhs); | ||
| 1269 | } | ||
| 1270 | |||
| 1271 | U1 IREmitter::IEqual(const U32U64& lhs, const U32U64& rhs) { | ||
| 1272 | if (lhs.Type() != rhs.Type()) { | ||
| 1273 | throw InvalidArgument("Mismatching types {} and {}", lhs.Type(), rhs.Type()); | ||
| 1274 | } | ||
| 1275 | switch (lhs.Type()) { | ||
| 1276 | case Type::U32: | ||
| 1277 | return Inst<U1>(Opcode::IEqual, lhs, rhs); | ||
| 1278 | case Type::U64: { | ||
| 1279 | // Manually compare the unpacked values | ||
| 1280 | const Value lhs_vector{UnpackUint2x32(lhs)}; | ||
| 1281 | const Value rhs_vector{UnpackUint2x32(rhs)}; | ||
| 1282 | return LogicalAnd(IEqual(IR::U32{CompositeExtract(lhs_vector, 0)}, | ||
| 1283 | IR::U32{CompositeExtract(rhs_vector, 0)}), | ||
| 1284 | IEqual(IR::U32{CompositeExtract(lhs_vector, 1)}, | ||
| 1285 | IR::U32{CompositeExtract(rhs_vector, 1)})); | ||
| 1286 | } | ||
| 1287 | default: | ||
| 1288 | ThrowInvalidType(lhs.Type()); | ||
| 1289 | } | ||
| 1290 | } | ||
| 1291 | |||
| 1292 | U1 IREmitter::ILessThanEqual(const U32& lhs, const U32& rhs, bool is_signed) { | ||
| 1293 | return Inst<U1>(is_signed ? Opcode::SLessThanEqual : Opcode::ULessThanEqual, lhs, rhs); | ||
| 1294 | } | ||
| 1295 | |||
| 1296 | U1 IREmitter::IGreaterThan(const U32& lhs, const U32& rhs, bool is_signed) { | ||
| 1297 | return Inst<U1>(is_signed ? Opcode::SGreaterThan : Opcode::UGreaterThan, lhs, rhs); | ||
| 1298 | } | ||
| 1299 | |||
| 1300 | U1 IREmitter::INotEqual(const U32& lhs, const U32& rhs) { | ||
| 1301 | return Inst<U1>(Opcode::INotEqual, lhs, rhs); | ||
| 1302 | } | ||
| 1303 | |||
| 1304 | U1 IREmitter::IGreaterThanEqual(const U32& lhs, const U32& rhs, bool is_signed) { | ||
| 1305 | return Inst<U1>(is_signed ? Opcode::SGreaterThanEqual : Opcode::UGreaterThanEqual, lhs, rhs); | ||
| 1306 | } | ||
| 1307 | |||
| 1308 | U32 IREmitter::SharedAtomicIAdd(const U32& pointer_offset, const U32& value) { | ||
| 1309 | return Inst<U32>(Opcode::SharedAtomicIAdd32, pointer_offset, value); | ||
| 1310 | } | ||
| 1311 | |||
| 1312 | U32 IREmitter::SharedAtomicSMin(const U32& pointer_offset, const U32& value) { | ||
| 1313 | return Inst<U32>(Opcode::SharedAtomicSMin32, pointer_offset, value); | ||
| 1314 | } | ||
| 1315 | |||
| 1316 | U32 IREmitter::SharedAtomicUMin(const U32& pointer_offset, const U32& value) { | ||
| 1317 | return Inst<U32>(Opcode::SharedAtomicUMin32, pointer_offset, value); | ||
| 1318 | } | ||
| 1319 | |||
| 1320 | U32 IREmitter::SharedAtomicIMin(const U32& pointer_offset, const U32& value, bool is_signed) { | ||
| 1321 | return is_signed ? SharedAtomicSMin(pointer_offset, value) | ||
| 1322 | : SharedAtomicUMin(pointer_offset, value); | ||
| 1323 | } | ||
| 1324 | |||
| 1325 | U32 IREmitter::SharedAtomicSMax(const U32& pointer_offset, const U32& value) { | ||
| 1326 | return Inst<U32>(Opcode::SharedAtomicSMax32, pointer_offset, value); | ||
| 1327 | } | ||
| 1328 | |||
| 1329 | U32 IREmitter::SharedAtomicUMax(const U32& pointer_offset, const U32& value) { | ||
| 1330 | return Inst<U32>(Opcode::SharedAtomicUMax32, pointer_offset, value); | ||
| 1331 | } | ||
| 1332 | |||
| 1333 | U32 IREmitter::SharedAtomicIMax(const U32& pointer_offset, const U32& value, bool is_signed) { | ||
| 1334 | return is_signed ? SharedAtomicSMax(pointer_offset, value) | ||
| 1335 | : SharedAtomicUMax(pointer_offset, value); | ||
| 1336 | } | ||
| 1337 | |||
| 1338 | U32 IREmitter::SharedAtomicInc(const U32& pointer_offset, const U32& value) { | ||
| 1339 | return Inst<U32>(Opcode::SharedAtomicInc32, pointer_offset, value); | ||
| 1340 | } | ||
| 1341 | |||
| 1342 | U32 IREmitter::SharedAtomicDec(const U32& pointer_offset, const U32& value) { | ||
| 1343 | return Inst<U32>(Opcode::SharedAtomicDec32, pointer_offset, value); | ||
| 1344 | } | ||
| 1345 | |||
| 1346 | U32 IREmitter::SharedAtomicAnd(const U32& pointer_offset, const U32& value) { | ||
| 1347 | return Inst<U32>(Opcode::SharedAtomicAnd32, pointer_offset, value); | ||
| 1348 | } | ||
| 1349 | |||
| 1350 | U32 IREmitter::SharedAtomicOr(const U32& pointer_offset, const U32& value) { | ||
| 1351 | return Inst<U32>(Opcode::SharedAtomicOr32, pointer_offset, value); | ||
| 1352 | } | ||
| 1353 | |||
| 1354 | U32 IREmitter::SharedAtomicXor(const U32& pointer_offset, const U32& value) { | ||
| 1355 | return Inst<U32>(Opcode::SharedAtomicXor32, pointer_offset, value); | ||
| 1356 | } | ||
| 1357 | |||
| 1358 | U32U64 IREmitter::SharedAtomicExchange(const U32& pointer_offset, const U32U64& value) { | ||
| 1359 | switch (value.Type()) { | ||
| 1360 | case Type::U32: | ||
| 1361 | return Inst<U32>(Opcode::SharedAtomicExchange32, pointer_offset, value); | ||
| 1362 | case Type::U64: | ||
| 1363 | return Inst<U64>(Opcode::SharedAtomicExchange64, pointer_offset, value); | ||
| 1364 | default: | ||
| 1365 | ThrowInvalidType(pointer_offset.Type()); | ||
| 1366 | } | ||
| 1367 | } | ||
| 1368 | |||
| 1369 | U32U64 IREmitter::GlobalAtomicIAdd(const U64& pointer_offset, const U32U64& value) { | ||
| 1370 | switch (value.Type()) { | ||
| 1371 | case Type::U32: | ||
| 1372 | return Inst<U32>(Opcode::GlobalAtomicIAdd32, pointer_offset, value); | ||
| 1373 | case Type::U64: | ||
| 1374 | return Inst<U64>(Opcode::GlobalAtomicIAdd64, pointer_offset, value); | ||
| 1375 | default: | ||
| 1376 | ThrowInvalidType(value.Type()); | ||
| 1377 | } | ||
| 1378 | } | ||
| 1379 | |||
| 1380 | U32U64 IREmitter::GlobalAtomicSMin(const U64& pointer_offset, const U32U64& value) { | ||
| 1381 | switch (value.Type()) { | ||
| 1382 | case Type::U32: | ||
| 1383 | return Inst<U32>(Opcode::GlobalAtomicSMin32, pointer_offset, value); | ||
| 1384 | case Type::U64: | ||
| 1385 | return Inst<U64>(Opcode::GlobalAtomicSMin64, pointer_offset, value); | ||
| 1386 | default: | ||
| 1387 | ThrowInvalidType(value.Type()); | ||
| 1388 | } | ||
| 1389 | } | ||
| 1390 | |||
| 1391 | U32U64 IREmitter::GlobalAtomicUMin(const U64& pointer_offset, const U32U64& value) { | ||
| 1392 | switch (value.Type()) { | ||
| 1393 | case Type::U32: | ||
| 1394 | return Inst<U32>(Opcode::GlobalAtomicUMin32, pointer_offset, value); | ||
| 1395 | case Type::U64: | ||
| 1396 | return Inst<U64>(Opcode::GlobalAtomicUMin64, pointer_offset, value); | ||
| 1397 | default: | ||
| 1398 | ThrowInvalidType(value.Type()); | ||
| 1399 | } | ||
| 1400 | } | ||
| 1401 | |||
| 1402 | U32U64 IREmitter::GlobalAtomicIMin(const U64& pointer_offset, const U32U64& value, bool is_signed) { | ||
| 1403 | return is_signed ? GlobalAtomicSMin(pointer_offset, value) | ||
| 1404 | : GlobalAtomicUMin(pointer_offset, value); | ||
| 1405 | } | ||
| 1406 | |||
| 1407 | U32U64 IREmitter::GlobalAtomicSMax(const U64& pointer_offset, const U32U64& value) { | ||
| 1408 | switch (value.Type()) { | ||
| 1409 | case Type::U32: | ||
| 1410 | return Inst<U32>(Opcode::GlobalAtomicSMax32, pointer_offset, value); | ||
| 1411 | case Type::U64: | ||
| 1412 | return Inst<U64>(Opcode::GlobalAtomicSMax64, pointer_offset, value); | ||
| 1413 | default: | ||
| 1414 | ThrowInvalidType(value.Type()); | ||
| 1415 | } | ||
| 1416 | } | ||
| 1417 | |||
| 1418 | U32U64 IREmitter::GlobalAtomicUMax(const U64& pointer_offset, const U32U64& value) { | ||
| 1419 | switch (value.Type()) { | ||
| 1420 | case Type::U32: | ||
| 1421 | return Inst<U32>(Opcode::GlobalAtomicUMax32, pointer_offset, value); | ||
| 1422 | case Type::U64: | ||
| 1423 | return Inst<U64>(Opcode::GlobalAtomicUMax64, pointer_offset, value); | ||
| 1424 | default: | ||
| 1425 | ThrowInvalidType(value.Type()); | ||
| 1426 | } | ||
| 1427 | } | ||
| 1428 | |||
| 1429 | U32U64 IREmitter::GlobalAtomicIMax(const U64& pointer_offset, const U32U64& value, bool is_signed) { | ||
| 1430 | return is_signed ? GlobalAtomicSMax(pointer_offset, value) | ||
| 1431 | : GlobalAtomicUMax(pointer_offset, value); | ||
| 1432 | } | ||
| 1433 | |||
| 1434 | U32 IREmitter::GlobalAtomicInc(const U64& pointer_offset, const U32& value) { | ||
| 1435 | return Inst<U32>(Opcode::GlobalAtomicInc32, pointer_offset, value); | ||
| 1436 | } | ||
| 1437 | |||
| 1438 | U32 IREmitter::GlobalAtomicDec(const U64& pointer_offset, const U32& value) { | ||
| 1439 | return Inst<U32>(Opcode::GlobalAtomicDec32, pointer_offset, value); | ||
| 1440 | } | ||
| 1441 | |||
| 1442 | U32U64 IREmitter::GlobalAtomicAnd(const U64& pointer_offset, const U32U64& value) { | ||
| 1443 | switch (value.Type()) { | ||
| 1444 | case Type::U32: | ||
| 1445 | return Inst<U32>(Opcode::GlobalAtomicAnd32, pointer_offset, value); | ||
| 1446 | case Type::U64: | ||
| 1447 | return Inst<U64>(Opcode::GlobalAtomicAnd64, pointer_offset, value); | ||
| 1448 | default: | ||
| 1449 | ThrowInvalidType(value.Type()); | ||
| 1450 | } | ||
| 1451 | } | ||
| 1452 | |||
| 1453 | U32U64 IREmitter::GlobalAtomicOr(const U64& pointer_offset, const U32U64& value) { | ||
| 1454 | switch (value.Type()) { | ||
| 1455 | case Type::U32: | ||
| 1456 | return Inst<U32>(Opcode::GlobalAtomicOr32, pointer_offset, value); | ||
| 1457 | case Type::U64: | ||
| 1458 | return Inst<U64>(Opcode::GlobalAtomicOr64, pointer_offset, value); | ||
| 1459 | default: | ||
| 1460 | ThrowInvalidType(value.Type()); | ||
| 1461 | } | ||
| 1462 | } | ||
| 1463 | |||
| 1464 | U32U64 IREmitter::GlobalAtomicXor(const U64& pointer_offset, const U32U64& value) { | ||
| 1465 | switch (value.Type()) { | ||
| 1466 | case Type::U32: | ||
| 1467 | return Inst<U32>(Opcode::GlobalAtomicXor32, pointer_offset, value); | ||
| 1468 | case Type::U64: | ||
| 1469 | return Inst<U64>(Opcode::GlobalAtomicXor64, pointer_offset, value); | ||
| 1470 | default: | ||
| 1471 | ThrowInvalidType(value.Type()); | ||
| 1472 | } | ||
| 1473 | } | ||
| 1474 | |||
| 1475 | U32U64 IREmitter::GlobalAtomicExchange(const U64& pointer_offset, const U32U64& value) { | ||
| 1476 | switch (value.Type()) { | ||
| 1477 | case Type::U32: | ||
| 1478 | return Inst<U32>(Opcode::GlobalAtomicExchange32, pointer_offset, value); | ||
| 1479 | case Type::U64: | ||
| 1480 | return Inst<U64>(Opcode::GlobalAtomicExchange64, pointer_offset, value); | ||
| 1481 | default: | ||
| 1482 | ThrowInvalidType(pointer_offset.Type()); | ||
| 1483 | } | ||
| 1484 | } | ||
| 1485 | |||
| 1486 | F32 IREmitter::GlobalAtomicF32Add(const U64& pointer_offset, const Value& value, | ||
| 1487 | const FpControl control) { | ||
| 1488 | return Inst<F32>(Opcode::GlobalAtomicAddF32, Flags{control}, pointer_offset, value); | ||
| 1489 | } | ||
| 1490 | |||
| 1491 | Value IREmitter::GlobalAtomicF16x2Add(const U64& pointer_offset, const Value& value, | ||
| 1492 | const FpControl control) { | ||
| 1493 | return Inst(Opcode::GlobalAtomicAddF16x2, Flags{control}, pointer_offset, value); | ||
| 1494 | } | ||
| 1495 | |||
| 1496 | Value IREmitter::GlobalAtomicF16x2Min(const U64& pointer_offset, const Value& value, | ||
| 1497 | const FpControl control) { | ||
| 1498 | return Inst(Opcode::GlobalAtomicMinF16x2, Flags{control}, pointer_offset, value); | ||
| 1499 | } | ||
| 1500 | |||
| 1501 | Value IREmitter::GlobalAtomicF16x2Max(const U64& pointer_offset, const Value& value, | ||
| 1502 | const FpControl control) { | ||
| 1503 | return Inst(Opcode::GlobalAtomicMaxF16x2, Flags{control}, pointer_offset, value); | ||
| 1504 | } | ||
| 1505 | |||
| 1506 | U1 IREmitter::LogicalOr(const U1& a, const U1& b) { | ||
| 1507 | return Inst<U1>(Opcode::LogicalOr, a, b); | ||
| 1508 | } | ||
| 1509 | |||
| 1510 | U1 IREmitter::LogicalAnd(const U1& a, const U1& b) { | ||
| 1511 | return Inst<U1>(Opcode::LogicalAnd, a, b); | ||
| 1512 | } | ||
| 1513 | |||
| 1514 | U1 IREmitter::LogicalXor(const U1& a, const U1& b) { | ||
| 1515 | return Inst<U1>(Opcode::LogicalXor, a, b); | ||
| 1516 | } | ||
| 1517 | |||
| 1518 | U1 IREmitter::LogicalNot(const U1& value) { | ||
| 1519 | return Inst<U1>(Opcode::LogicalNot, value); | ||
| 1520 | } | ||
| 1521 | |||
| 1522 | U32U64 IREmitter::ConvertFToS(size_t bitsize, const F16F32F64& value) { | ||
| 1523 | switch (bitsize) { | ||
| 1524 | case 16: | ||
| 1525 | switch (value.Type()) { | ||
| 1526 | case Type::F16: | ||
| 1527 | return Inst<U32>(Opcode::ConvertS16F16, value); | ||
| 1528 | case Type::F32: | ||
| 1529 | return Inst<U32>(Opcode::ConvertS16F32, value); | ||
| 1530 | case Type::F64: | ||
| 1531 | return Inst<U32>(Opcode::ConvertS16F64, value); | ||
| 1532 | default: | ||
| 1533 | ThrowInvalidType(value.Type()); | ||
| 1534 | } | ||
| 1535 | case 32: | ||
| 1536 | switch (value.Type()) { | ||
| 1537 | case Type::F16: | ||
| 1538 | return Inst<U32>(Opcode::ConvertS32F16, value); | ||
| 1539 | case Type::F32: | ||
| 1540 | return Inst<U32>(Opcode::ConvertS32F32, value); | ||
| 1541 | case Type::F64: | ||
| 1542 | return Inst<U32>(Opcode::ConvertS32F64, value); | ||
| 1543 | default: | ||
| 1544 | ThrowInvalidType(value.Type()); | ||
| 1545 | } | ||
| 1546 | case 64: | ||
| 1547 | switch (value.Type()) { | ||
| 1548 | case Type::F16: | ||
| 1549 | return Inst<U64>(Opcode::ConvertS64F16, value); | ||
| 1550 | case Type::F32: | ||
| 1551 | return Inst<U64>(Opcode::ConvertS64F32, value); | ||
| 1552 | case Type::F64: | ||
| 1553 | return Inst<U64>(Opcode::ConvertS64F64, value); | ||
| 1554 | default: | ||
| 1555 | ThrowInvalidType(value.Type()); | ||
| 1556 | } | ||
| 1557 | default: | ||
| 1558 | throw InvalidArgument("Invalid destination bitsize {}", bitsize); | ||
| 1559 | } | ||
| 1560 | } | ||
| 1561 | |||
| 1562 | U32U64 IREmitter::ConvertFToU(size_t bitsize, const F16F32F64& value) { | ||
| 1563 | switch (bitsize) { | ||
| 1564 | case 16: | ||
| 1565 | switch (value.Type()) { | ||
| 1566 | case Type::F16: | ||
| 1567 | return Inst<U32>(Opcode::ConvertU16F16, value); | ||
| 1568 | case Type::F32: | ||
| 1569 | return Inst<U32>(Opcode::ConvertU16F32, value); | ||
| 1570 | case Type::F64: | ||
| 1571 | return Inst<U32>(Opcode::ConvertU16F64, value); | ||
| 1572 | default: | ||
| 1573 | ThrowInvalidType(value.Type()); | ||
| 1574 | } | ||
| 1575 | case 32: | ||
| 1576 | switch (value.Type()) { | ||
| 1577 | case Type::F16: | ||
| 1578 | return Inst<U32>(Opcode::ConvertU32F16, value); | ||
| 1579 | case Type::F32: | ||
| 1580 | return Inst<U32>(Opcode::ConvertU32F32, value); | ||
| 1581 | case Type::F64: | ||
| 1582 | return Inst<U32>(Opcode::ConvertU32F64, value); | ||
| 1583 | default: | ||
| 1584 | ThrowInvalidType(value.Type()); | ||
| 1585 | } | ||
| 1586 | case 64: | ||
| 1587 | switch (value.Type()) { | ||
| 1588 | case Type::F16: | ||
| 1589 | return Inst<U64>(Opcode::ConvertU64F16, value); | ||
| 1590 | case Type::F32: | ||
| 1591 | return Inst<U64>(Opcode::ConvertU64F32, value); | ||
| 1592 | case Type::F64: | ||
| 1593 | return Inst<U64>(Opcode::ConvertU64F64, value); | ||
| 1594 | default: | ||
| 1595 | ThrowInvalidType(value.Type()); | ||
| 1596 | } | ||
| 1597 | default: | ||
| 1598 | throw InvalidArgument("Invalid destination bitsize {}", bitsize); | ||
| 1599 | } | ||
| 1600 | } | ||
| 1601 | |||
| 1602 | U32U64 IREmitter::ConvertFToI(size_t bitsize, bool is_signed, const F16F32F64& value) { | ||
| 1603 | return is_signed ? ConvertFToS(bitsize, value) : ConvertFToU(bitsize, value); | ||
| 1604 | } | ||
| 1605 | |||
| 1606 | F16F32F64 IREmitter::ConvertSToF(size_t dest_bitsize, size_t src_bitsize, const Value& value, | ||
| 1607 | FpControl control) { | ||
| 1608 | switch (dest_bitsize) { | ||
| 1609 | case 16: | ||
| 1610 | switch (src_bitsize) { | ||
| 1611 | case 8: | ||
| 1612 | return Inst<F16>(Opcode::ConvertF16S8, Flags{control}, value); | ||
| 1613 | case 16: | ||
| 1614 | return Inst<F16>(Opcode::ConvertF16S16, Flags{control}, value); | ||
| 1615 | case 32: | ||
| 1616 | return Inst<F16>(Opcode::ConvertF16S32, Flags{control}, value); | ||
| 1617 | case 64: | ||
| 1618 | return Inst<F16>(Opcode::ConvertF16S64, Flags{control}, value); | ||
| 1619 | } | ||
| 1620 | break; | ||
| 1621 | case 32: | ||
| 1622 | switch (src_bitsize) { | ||
| 1623 | case 8: | ||
| 1624 | return Inst<F32>(Opcode::ConvertF32S8, Flags{control}, value); | ||
| 1625 | case 16: | ||
| 1626 | return Inst<F32>(Opcode::ConvertF32S16, Flags{control}, value); | ||
| 1627 | case 32: | ||
| 1628 | return Inst<F32>(Opcode::ConvertF32S32, Flags{control}, value); | ||
| 1629 | case 64: | ||
| 1630 | return Inst<F32>(Opcode::ConvertF32S64, Flags{control}, value); | ||
| 1631 | } | ||
| 1632 | break; | ||
| 1633 | case 64: | ||
| 1634 | switch (src_bitsize) { | ||
| 1635 | case 8: | ||
| 1636 | return Inst<F64>(Opcode::ConvertF64S8, Flags{control}, value); | ||
| 1637 | case 16: | ||
| 1638 | return Inst<F64>(Opcode::ConvertF64S16, Flags{control}, value); | ||
| 1639 | case 32: | ||
| 1640 | return Inst<F64>(Opcode::ConvertF64S32, Flags{control}, value); | ||
| 1641 | case 64: | ||
| 1642 | return Inst<F64>(Opcode::ConvertF64S64, Flags{control}, value); | ||
| 1643 | } | ||
| 1644 | break; | ||
| 1645 | } | ||
| 1646 | throw InvalidArgument("Invalid bit size combination dst={} src={}", dest_bitsize, src_bitsize); | ||
| 1647 | } | ||
| 1648 | |||
| 1649 | F16F32F64 IREmitter::ConvertUToF(size_t dest_bitsize, size_t src_bitsize, const Value& value, | ||
| 1650 | FpControl control) { | ||
| 1651 | switch (dest_bitsize) { | ||
| 1652 | case 16: | ||
| 1653 | switch (src_bitsize) { | ||
| 1654 | case 8: | ||
| 1655 | return Inst<F16>(Opcode::ConvertF16U8, Flags{control}, value); | ||
| 1656 | case 16: | ||
| 1657 | return Inst<F16>(Opcode::ConvertF16U16, Flags{control}, value); | ||
| 1658 | case 32: | ||
| 1659 | return Inst<F16>(Opcode::ConvertF16U32, Flags{control}, value); | ||
| 1660 | case 64: | ||
| 1661 | return Inst<F16>(Opcode::ConvertF16U64, Flags{control}, value); | ||
| 1662 | } | ||
| 1663 | break; | ||
| 1664 | case 32: | ||
| 1665 | switch (src_bitsize) { | ||
| 1666 | case 8: | ||
| 1667 | return Inst<F32>(Opcode::ConvertF32U8, Flags{control}, value); | ||
| 1668 | case 16: | ||
| 1669 | return Inst<F32>(Opcode::ConvertF32U16, Flags{control}, value); | ||
| 1670 | case 32: | ||
| 1671 | return Inst<F32>(Opcode::ConvertF32U32, Flags{control}, value); | ||
| 1672 | case 64: | ||
| 1673 | return Inst<F32>(Opcode::ConvertF32U64, Flags{control}, value); | ||
| 1674 | } | ||
| 1675 | break; | ||
| 1676 | case 64: | ||
| 1677 | switch (src_bitsize) { | ||
| 1678 | case 8: | ||
| 1679 | return Inst<F64>(Opcode::ConvertF64U8, Flags{control}, value); | ||
| 1680 | case 16: | ||
| 1681 | return Inst<F64>(Opcode::ConvertF64U16, Flags{control}, value); | ||
| 1682 | case 32: | ||
| 1683 | return Inst<F64>(Opcode::ConvertF64U32, Flags{control}, value); | ||
| 1684 | case 64: | ||
| 1685 | return Inst<F64>(Opcode::ConvertF64U64, Flags{control}, value); | ||
| 1686 | } | ||
| 1687 | break; | ||
| 1688 | } | ||
| 1689 | throw InvalidArgument("Invalid bit size combination dst={} src={}", dest_bitsize, src_bitsize); | ||
| 1690 | } | ||
| 1691 | |||
| 1692 | F16F32F64 IREmitter::ConvertIToF(size_t dest_bitsize, size_t src_bitsize, bool is_signed, | ||
| 1693 | const Value& value, FpControl control) { | ||
| 1694 | return is_signed ? ConvertSToF(dest_bitsize, src_bitsize, value, control) | ||
| 1695 | : ConvertUToF(dest_bitsize, src_bitsize, value, control); | ||
| 1696 | } | ||
| 1697 | |||
| 1698 | U32U64 IREmitter::UConvert(size_t result_bitsize, const U32U64& value) { | ||
| 1699 | switch (result_bitsize) { | ||
| 1700 | case 32: | ||
| 1701 | switch (value.Type()) { | ||
| 1702 | case Type::U32: | ||
| 1703 | // Nothing to do | ||
| 1704 | return value; | ||
| 1705 | case Type::U64: | ||
| 1706 | return Inst<U32>(Opcode::ConvertU32U64, value); | ||
| 1707 | default: | ||
| 1708 | break; | ||
| 1709 | } | ||
| 1710 | break; | ||
| 1711 | case 64: | ||
| 1712 | switch (value.Type()) { | ||
| 1713 | case Type::U32: | ||
| 1714 | return Inst<U64>(Opcode::ConvertU64U32, value); | ||
| 1715 | case Type::U64: | ||
| 1716 | // Nothing to do | ||
| 1717 | return value; | ||
| 1718 | default: | ||
| 1719 | break; | ||
| 1720 | } | ||
| 1721 | } | ||
| 1722 | throw NotImplementedException("Conversion from {} to {} bits", value.Type(), result_bitsize); | ||
| 1723 | } | ||
| 1724 | |||
| 1725 | F16F32F64 IREmitter::FPConvert(size_t result_bitsize, const F16F32F64& value, FpControl control) { | ||
| 1726 | switch (result_bitsize) { | ||
| 1727 | case 16: | ||
| 1728 | switch (value.Type()) { | ||
| 1729 | case Type::F16: | ||
| 1730 | // Nothing to do | ||
| 1731 | return value; | ||
| 1732 | case Type::F32: | ||
| 1733 | return Inst<F16>(Opcode::ConvertF16F32, Flags{control}, value); | ||
| 1734 | case Type::F64: | ||
| 1735 | throw LogicError("Illegal conversion from F64 to F16"); | ||
| 1736 | default: | ||
| 1737 | break; | ||
| 1738 | } | ||
| 1739 | break; | ||
| 1740 | case 32: | ||
| 1741 | switch (value.Type()) { | ||
| 1742 | case Type::F16: | ||
| 1743 | return Inst<F32>(Opcode::ConvertF32F16, Flags{control}, value); | ||
| 1744 | case Type::F32: | ||
| 1745 | // Nothing to do | ||
| 1746 | return value; | ||
| 1747 | case Type::F64: | ||
| 1748 | return Inst<F32>(Opcode::ConvertF32F64, Flags{control}, value); | ||
| 1749 | default: | ||
| 1750 | break; | ||
| 1751 | } | ||
| 1752 | break; | ||
| 1753 | case 64: | ||
| 1754 | switch (value.Type()) { | ||
| 1755 | case Type::F16: | ||
| 1756 | throw LogicError("Illegal conversion from F16 to F64"); | ||
| 1757 | case Type::F32: | ||
| 1758 | return Inst<F64>(Opcode::ConvertF64F32, Flags{control}, value); | ||
| 1759 | case Type::F64: | ||
| 1760 | // Nothing to do | ||
| 1761 | return value; | ||
| 1762 | default: | ||
| 1763 | break; | ||
| 1764 | } | ||
| 1765 | break; | ||
| 1766 | } | ||
| 1767 | throw NotImplementedException("Conversion from {} to {} bits", value.Type(), result_bitsize); | ||
| 1768 | } | ||
| 1769 | |||
| 1770 | Value IREmitter::ImageSampleImplicitLod(const Value& handle, const Value& coords, const F32& bias, | ||
| 1771 | const Value& offset, const F32& lod_clamp, | ||
| 1772 | TextureInstInfo info) { | ||
| 1773 | const Value bias_lc{MakeLodClampPair(*this, bias, lod_clamp)}; | ||
| 1774 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleImplicitLod | ||
| 1775 | : Opcode::BindlessImageSampleImplicitLod}; | ||
| 1776 | return Inst(op, Flags{info}, handle, coords, bias_lc, offset); | ||
| 1777 | } | ||
| 1778 | |||
| 1779 | Value IREmitter::ImageSampleExplicitLod(const Value& handle, const Value& coords, const F32& lod, | ||
| 1780 | const Value& offset, TextureInstInfo info) { | ||
| 1781 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleExplicitLod | ||
| 1782 | : Opcode::BindlessImageSampleExplicitLod}; | ||
| 1783 | return Inst(op, Flags{info}, handle, coords, lod, offset); | ||
| 1784 | } | ||
| 1785 | |||
| 1786 | F32 IREmitter::ImageSampleDrefImplicitLod(const Value& handle, const Value& coords, const F32& dref, | ||
| 1787 | const F32& bias, const Value& offset, | ||
| 1788 | const F32& lod_clamp, TextureInstInfo info) { | ||
| 1789 | const Value bias_lc{MakeLodClampPair(*this, bias, lod_clamp)}; | ||
| 1790 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleDrefImplicitLod | ||
| 1791 | : Opcode::BindlessImageSampleDrefImplicitLod}; | ||
| 1792 | return Inst<F32>(op, Flags{info}, handle, coords, dref, bias_lc, offset); | ||
| 1793 | } | ||
| 1794 | |||
| 1795 | F32 IREmitter::ImageSampleDrefExplicitLod(const Value& handle, const Value& coords, const F32& dref, | ||
| 1796 | const F32& lod, const Value& offset, | ||
| 1797 | TextureInstInfo info) { | ||
| 1798 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageSampleDrefExplicitLod | ||
| 1799 | : Opcode::BindlessImageSampleDrefExplicitLod}; | ||
| 1800 | return Inst<F32>(op, Flags{info}, handle, coords, dref, lod, offset); | ||
| 1801 | } | ||
| 1802 | |||
| 1803 | Value IREmitter::ImageGather(const Value& handle, const Value& coords, const Value& offset, | ||
| 1804 | const Value& offset2, TextureInstInfo info) { | ||
| 1805 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageGather : Opcode::BindlessImageGather}; | ||
| 1806 | return Inst(op, Flags{info}, handle, coords, offset, offset2); | ||
| 1807 | } | ||
| 1808 | |||
| 1809 | Value IREmitter::ImageGatherDref(const Value& handle, const Value& coords, const Value& offset, | ||
| 1810 | const Value& offset2, const F32& dref, TextureInstInfo info) { | ||
| 1811 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageGatherDref | ||
| 1812 | : Opcode::BindlessImageGatherDref}; | ||
| 1813 | return Inst(op, Flags{info}, handle, coords, offset, offset2, dref); | ||
| 1814 | } | ||
| 1815 | |||
| 1816 | Value IREmitter::ImageFetch(const Value& handle, const Value& coords, const Value& offset, | ||
| 1817 | const U32& lod, const U32& multisampling, TextureInstInfo info) { | ||
| 1818 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageFetch : Opcode::BindlessImageFetch}; | ||
| 1819 | return Inst(op, Flags{info}, handle, coords, offset, lod, multisampling); | ||
| 1820 | } | ||
| 1821 | |||
| 1822 | Value IREmitter::ImageQueryDimension(const Value& handle, const IR::U32& lod) { | ||
| 1823 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageQueryDimensions | ||
| 1824 | : Opcode::BindlessImageQueryDimensions}; | ||
| 1825 | return Inst(op, handle, lod); | ||
| 1826 | } | ||
| 1827 | |||
| 1828 | Value IREmitter::ImageQueryLod(const Value& handle, const Value& coords, TextureInstInfo info) { | ||
| 1829 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageQueryLod | ||
| 1830 | : Opcode::BindlessImageQueryLod}; | ||
| 1831 | return Inst(op, Flags{info}, handle, coords); | ||
| 1832 | } | ||
| 1833 | |||
| 1834 | Value IREmitter::ImageGradient(const Value& handle, const Value& coords, const Value& derivates, | ||
| 1835 | const Value& offset, const F32& lod_clamp, TextureInstInfo info) { | ||
| 1836 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageGradient | ||
| 1837 | : Opcode::BindlessImageGradient}; | ||
| 1838 | return Inst(op, Flags{info}, handle, coords, derivates, offset, lod_clamp); | ||
| 1839 | } | ||
| 1840 | |||
| 1841 | Value IREmitter::ImageRead(const Value& handle, const Value& coords, TextureInstInfo info) { | ||
| 1842 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageRead : Opcode::BindlessImageRead}; | ||
| 1843 | return Inst(op, Flags{info}, handle, coords); | ||
| 1844 | } | ||
| 1845 | |||
| 1846 | void IREmitter::ImageWrite(const Value& handle, const Value& coords, const Value& color, | ||
| 1847 | TextureInstInfo info) { | ||
| 1848 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageWrite : Opcode::BindlessImageWrite}; | ||
| 1849 | Inst(op, Flags{info}, handle, coords, color); | ||
| 1850 | } | ||
| 1851 | |||
| 1852 | Value IREmitter::ImageAtomicIAdd(const Value& handle, const Value& coords, const Value& value, | ||
| 1853 | TextureInstInfo info) { | ||
| 1854 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicIAdd32 | ||
| 1855 | : Opcode::BindlessImageAtomicIAdd32}; | ||
| 1856 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1857 | } | ||
| 1858 | |||
| 1859 | Value IREmitter::ImageAtomicSMin(const Value& handle, const Value& coords, const Value& value, | ||
| 1860 | TextureInstInfo info) { | ||
| 1861 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicSMin32 | ||
| 1862 | : Opcode::BindlessImageAtomicSMin32}; | ||
| 1863 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1864 | } | ||
| 1865 | |||
| 1866 | Value IREmitter::ImageAtomicUMin(const Value& handle, const Value& coords, const Value& value, | ||
| 1867 | TextureInstInfo info) { | ||
| 1868 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicUMin32 | ||
| 1869 | : Opcode::BindlessImageAtomicUMin32}; | ||
| 1870 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1871 | } | ||
| 1872 | |||
| 1873 | Value IREmitter::ImageAtomicIMin(const Value& handle, const Value& coords, const Value& value, | ||
| 1874 | bool is_signed, TextureInstInfo info) { | ||
| 1875 | return is_signed ? ImageAtomicSMin(handle, coords, value, info) | ||
| 1876 | : ImageAtomicUMin(handle, coords, value, info); | ||
| 1877 | } | ||
| 1878 | |||
| 1879 | Value IREmitter::ImageAtomicSMax(const Value& handle, const Value& coords, const Value& value, | ||
| 1880 | TextureInstInfo info) { | ||
| 1881 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicSMax32 | ||
| 1882 | : Opcode::BindlessImageAtomicSMax32}; | ||
| 1883 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1884 | } | ||
| 1885 | |||
| 1886 | Value IREmitter::ImageAtomicUMax(const Value& handle, const Value& coords, const Value& value, | ||
| 1887 | TextureInstInfo info) { | ||
| 1888 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicUMax32 | ||
| 1889 | : Opcode::BindlessImageAtomicUMax32}; | ||
| 1890 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1891 | } | ||
| 1892 | |||
| 1893 | Value IREmitter::ImageAtomicIMax(const Value& handle, const Value& coords, const Value& value, | ||
| 1894 | bool is_signed, TextureInstInfo info) { | ||
| 1895 | return is_signed ? ImageAtomicSMax(handle, coords, value, info) | ||
| 1896 | : ImageAtomicUMax(handle, coords, value, info); | ||
| 1897 | } | ||
| 1898 | |||
| 1899 | Value IREmitter::ImageAtomicInc(const Value& handle, const Value& coords, const Value& value, | ||
| 1900 | TextureInstInfo info) { | ||
| 1901 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicInc32 | ||
| 1902 | : Opcode::BindlessImageAtomicInc32}; | ||
| 1903 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1904 | } | ||
| 1905 | |||
| 1906 | Value IREmitter::ImageAtomicDec(const Value& handle, const Value& coords, const Value& value, | ||
| 1907 | TextureInstInfo info) { | ||
| 1908 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicDec32 | ||
| 1909 | : Opcode::BindlessImageAtomicDec32}; | ||
| 1910 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1911 | } | ||
| 1912 | |||
| 1913 | Value IREmitter::ImageAtomicAnd(const Value& handle, const Value& coords, const Value& value, | ||
| 1914 | TextureInstInfo info) { | ||
| 1915 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicAnd32 | ||
| 1916 | : Opcode::BindlessImageAtomicAnd32}; | ||
| 1917 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1918 | } | ||
| 1919 | |||
| 1920 | Value IREmitter::ImageAtomicOr(const Value& handle, const Value& coords, const Value& value, | ||
| 1921 | TextureInstInfo info) { | ||
| 1922 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicOr32 | ||
| 1923 | : Opcode::BindlessImageAtomicOr32}; | ||
| 1924 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1925 | } | ||
| 1926 | |||
| 1927 | Value IREmitter::ImageAtomicXor(const Value& handle, const Value& coords, const Value& value, | ||
| 1928 | TextureInstInfo info) { | ||
| 1929 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicXor32 | ||
| 1930 | : Opcode::BindlessImageAtomicXor32}; | ||
| 1931 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1932 | } | ||
| 1933 | |||
| 1934 | Value IREmitter::ImageAtomicExchange(const Value& handle, const Value& coords, const Value& value, | ||
| 1935 | TextureInstInfo info) { | ||
| 1936 | const Opcode op{handle.IsImmediate() ? Opcode::BoundImageAtomicExchange32 | ||
| 1937 | : Opcode::BindlessImageAtomicExchange32}; | ||
| 1938 | return Inst(op, Flags{info}, handle, coords, value); | ||
| 1939 | } | ||
| 1940 | |||
| 1941 | U1 IREmitter::VoteAll(const U1& value) { | ||
| 1942 | return Inst<U1>(Opcode::VoteAll, value); | ||
| 1943 | } | ||
| 1944 | |||
| 1945 | U1 IREmitter::VoteAny(const U1& value) { | ||
| 1946 | return Inst<U1>(Opcode::VoteAny, value); | ||
| 1947 | } | ||
| 1948 | |||
| 1949 | U1 IREmitter::VoteEqual(const U1& value) { | ||
| 1950 | return Inst<U1>(Opcode::VoteEqual, value); | ||
| 1951 | } | ||
| 1952 | |||
| 1953 | U32 IREmitter::SubgroupBallot(const U1& value) { | ||
| 1954 | return Inst<U32>(Opcode::SubgroupBallot, value); | ||
| 1955 | } | ||
| 1956 | |||
| 1957 | U32 IREmitter::SubgroupEqMask() { | ||
| 1958 | return Inst<U32>(Opcode::SubgroupEqMask); | ||
| 1959 | } | ||
| 1960 | |||
| 1961 | U32 IREmitter::SubgroupLtMask() { | ||
| 1962 | return Inst<U32>(Opcode::SubgroupLtMask); | ||
| 1963 | } | ||
| 1964 | |||
| 1965 | U32 IREmitter::SubgroupLeMask() { | ||
| 1966 | return Inst<U32>(Opcode::SubgroupLeMask); | ||
| 1967 | } | ||
| 1968 | |||
| 1969 | U32 IREmitter::SubgroupGtMask() { | ||
| 1970 | return Inst<U32>(Opcode::SubgroupGtMask); | ||
| 1971 | } | ||
| 1972 | |||
| 1973 | U32 IREmitter::SubgroupGeMask() { | ||
| 1974 | return Inst<U32>(Opcode::SubgroupGeMask); | ||
| 1975 | } | ||
| 1976 | |||
| 1977 | U32 IREmitter::ShuffleIndex(const IR::U32& value, const IR::U32& index, const IR::U32& clamp, | ||
| 1978 | const IR::U32& seg_mask) { | ||
| 1979 | return Inst<U32>(Opcode::ShuffleIndex, value, index, clamp, seg_mask); | ||
| 1980 | } | ||
| 1981 | |||
| 1982 | U32 IREmitter::ShuffleUp(const IR::U32& value, const IR::U32& index, const IR::U32& clamp, | ||
| 1983 | const IR::U32& seg_mask) { | ||
| 1984 | return Inst<U32>(Opcode::ShuffleUp, value, index, clamp, seg_mask); | ||
| 1985 | } | ||
| 1986 | |||
| 1987 | U32 IREmitter::ShuffleDown(const IR::U32& value, const IR::U32& index, const IR::U32& clamp, | ||
| 1988 | const IR::U32& seg_mask) { | ||
| 1989 | return Inst<U32>(Opcode::ShuffleDown, value, index, clamp, seg_mask); | ||
| 1990 | } | ||
| 1991 | |||
| 1992 | U32 IREmitter::ShuffleButterfly(const IR::U32& value, const IR::U32& index, const IR::U32& clamp, | ||
| 1993 | const IR::U32& seg_mask) { | ||
| 1994 | return Inst<U32>(Opcode::ShuffleButterfly, value, index, clamp, seg_mask); | ||
| 1995 | } | ||
| 1996 | |||
| 1997 | F32 IREmitter::FSwizzleAdd(const F32& a, const F32& b, const U32& swizzle, FpControl control) { | ||
| 1998 | return Inst<F32>(Opcode::FSwizzleAdd, Flags{control}, a, b, swizzle); | ||
| 1999 | } | ||
| 2000 | |||
| 2001 | F32 IREmitter::DPdxFine(const F32& a) { | ||
| 2002 | return Inst<F32>(Opcode::DPdxFine, a); | ||
| 2003 | } | ||
| 2004 | |||
| 2005 | F32 IREmitter::DPdyFine(const F32& a) { | ||
| 2006 | return Inst<F32>(Opcode::DPdyFine, a); | ||
| 2007 | } | ||
| 2008 | |||
| 2009 | F32 IREmitter::DPdxCoarse(const F32& a) { | ||
| 2010 | return Inst<F32>(Opcode::DPdxCoarse, a); | ||
| 2011 | } | ||
| 2012 | |||
| 2013 | F32 IREmitter::DPdyCoarse(const F32& a) { | ||
| 2014 | return Inst<F32>(Opcode::DPdyCoarse, a); | ||
| 2015 | } | ||
| 2016 | |||
| 2017 | } // namespace Shader::IR | ||