reg_alloc: Emit AVX instructions where able

Smaller codesize.
This commit is contained in:
MerryMage 2018-09-28 21:12:48 +01:00
parent aedd32aa20
commit c6a6271f86

View File

@ -17,6 +17,15 @@
namespace Dynarmic::BackendX64 { namespace Dynarmic::BackendX64 {
#define MAYBE_AVX(OPCODE, ...) \
[&] { \
if (code.DoesCpuSupport(Xbyak::util::Cpu::tAVX)) { \
code.v##OPCODE(__VA_ARGS__); \
} else { \
code.OPCODE(__VA_ARGS__); \
} \
}()
static u64 ImmediateToU64(const IR::Value& imm) { static u64 ImmediateToU64(const IR::Value& imm) {
switch (imm.GetType()) { switch (imm.GetType()) {
case IR::Type::U1: case IR::Type::U1:
@ -506,9 +515,9 @@ HostLoc RegAlloc::LoadImmediate(IR::Value imm, HostLoc host_loc) {
Xbyak::Xmm reg = HostLocToXmm(host_loc); Xbyak::Xmm reg = HostLocToXmm(host_loc);
u64 imm_value = ImmediateToU64(imm); u64 imm_value = ImmediateToU64(imm);
if (imm_value == 0) if (imm_value == 0)
code.pxor(reg, reg); MAYBE_AVX(xorps, reg, reg);
else else
code.movdqa(reg, code.MConst(code.xword, imm_value)); // TODO: movaps/movapd more appropriate sometimes MAYBE_AVX(movaps, reg, code.MConst(code.xword, imm_value));
return host_loc; return host_loc;
} }
@ -594,7 +603,7 @@ const HostLocInfo& RegAlloc::LocInfo(HostLoc loc) const {
void RegAlloc::EmitMove(size_t bit_width, HostLoc to, HostLoc from) { void RegAlloc::EmitMove(size_t bit_width, HostLoc to, HostLoc from) {
if (HostLocIsXMM(to) && HostLocIsXMM(from)) { if (HostLocIsXMM(to) && HostLocIsXMM(from)) {
code.movaps(HostLocToXmm(to), HostLocToXmm(from)); MAYBE_AVX(movaps, HostLocToXmm(to), HostLocToXmm(from));
} else if (HostLocIsGPR(to) && HostLocIsGPR(from)) { } else if (HostLocIsGPR(to) && HostLocIsGPR(from)) {
ASSERT(bit_width != 128); ASSERT(bit_width != 128);
if (bit_width == 64) { if (bit_width == 64) {
@ -605,31 +614,31 @@ void RegAlloc::EmitMove(size_t bit_width, HostLoc to, HostLoc from) {
} else if (HostLocIsXMM(to) && HostLocIsGPR(from)) { } else if (HostLocIsXMM(to) && HostLocIsGPR(from)) {
ASSERT(bit_width != 128); ASSERT(bit_width != 128);
if (bit_width == 64) { if (bit_width == 64) {
code.movq(HostLocToXmm(to), HostLocToReg64(from)); MAYBE_AVX(movq, HostLocToXmm(to), HostLocToReg64(from));
} else { } else {
code.movd(HostLocToXmm(to), HostLocToReg64(from).cvt32()); MAYBE_AVX(movd, HostLocToXmm(to), HostLocToReg64(from).cvt32());
} }
} else if (HostLocIsGPR(to) && HostLocIsXMM(from)) { } else if (HostLocIsGPR(to) && HostLocIsXMM(from)) {
ASSERT(bit_width != 128); ASSERT(bit_width != 128);
if (bit_width == 64) { if (bit_width == 64) {
code.movq(HostLocToReg64(to), HostLocToXmm(from)); MAYBE_AVX(movq, HostLocToReg64(to), HostLocToXmm(from));
} else { } else {
code.movd(HostLocToReg64(to).cvt32(), HostLocToXmm(from)); MAYBE_AVX(movd, HostLocToReg64(to).cvt32(), HostLocToXmm(from));
} }
} else if (HostLocIsXMM(to) && HostLocIsSpill(from)) { } else if (HostLocIsXMM(to) && HostLocIsSpill(from)) {
Xbyak::Address spill_addr = spill_to_addr(from); Xbyak::Address spill_addr = spill_to_addr(from);
ASSERT(spill_addr.getBit() >= bit_width); ASSERT(spill_addr.getBit() >= bit_width);
switch (bit_width) { switch (bit_width) {
case 128: case 128:
code.movaps(HostLocToXmm(to), spill_addr); MAYBE_AVX(movaps, HostLocToXmm(to), spill_addr);
break; break;
case 64: case 64:
code.movsd(HostLocToXmm(to), spill_addr); MAYBE_AVX(movsd, HostLocToXmm(to), spill_addr);
break; break;
case 32: case 32:
case 16: case 16:
case 8: case 8:
code.movss(HostLocToXmm(to), spill_addr); MAYBE_AVX(movss, HostLocToXmm(to), spill_addr);
break; break;
default: default:
UNREACHABLE(); UNREACHABLE();
@ -639,15 +648,15 @@ void RegAlloc::EmitMove(size_t bit_width, HostLoc to, HostLoc from) {
ASSERT(spill_addr.getBit() >= bit_width); ASSERT(spill_addr.getBit() >= bit_width);
switch (bit_width) { switch (bit_width) {
case 128: case 128:
code.movaps(spill_addr, HostLocToXmm(from)); MAYBE_AVX(movaps, spill_addr, HostLocToXmm(from));
break; break;
case 64: case 64:
code.movsd(spill_addr, HostLocToXmm(from)); MAYBE_AVX(movsd, spill_addr, HostLocToXmm(from));
break; break;
case 32: case 32:
case 16: case 16:
case 8: case 8:
code.movss(spill_addr, HostLocToXmm(from)); MAYBE_AVX(movss, spill_addr, HostLocToXmm(from));
break; break;
default: default:
UNREACHABLE(); UNREACHABLE();