// Mirror of https://github.com/PCSX2/pcsx2.git (synced 2025-12-16 04:08:48 +00:00).
// Original file: 456 lines, 21 KiB, C++.
// SPDX-FileCopyrightText: 2002-2025 PCSX2 Dev Team
|
|
// SPDX-License-Identifier: GPL-3.0+
|
|
|
|
#include "codegen_tests.h"
|
|
#include <gtest/gtest.h>
|
|
#include <common/emitter/x86emitter.h>
|
|
#include <cstdio>
|
|
|
|
using namespace x86Emitter;
|
|
|
|
// Encoding checks for the MOV family: xMOV, xMOV64 and xMOVSX.
// Each CODEGEN_TEST pairs an emitter call with the hex bytes it is expected to emit.
// NOTE(review): CODEGEN_TEST and `base` are not defined in this file; presumably they
// come from codegen_tests.h -- confirm there.
TEST(CodegenTests, MOVTest)
{
	// Register destinations loaded from zero or from another register.
	// Loading zero is expected to come out as a 32-bit xor (opcode 31), not a mov.
	CODEGEN_TEST(xMOV(rax, 0), "31 c0");
	CODEGEN_TEST(xMOV(rax, rcx), "48 89 c8");
	CODEGEN_TEST(xMOV(eax, ecx), "89 c8");
	CODEGEN_TEST(xMOV(r8, 0), "45 31 c0");
	CODEGEN_TEST(xMOV(rax, r8), "4c 89 c0");
	CODEGEN_TEST(xMOV(r8, rax), "49 89 c0");
	CODEGEN_TEST(xMOV(r8, r9), "4d 89 c8");

	// Loads and stores through a plain base register.
	CODEGEN_TEST(xMOV(rax, ptr64[rcx]), "48 8b 01");
	CODEGEN_TEST(xMOV(eax, ptr32[rcx]), "8b 01");
	CODEGEN_TEST(xMOV(ptr64[rax], rcx), "48 89 08");
	CODEGEN_TEST(xMOV(ptr32[rax], ecx), "89 08");
	CODEGEN_TEST(xMOV(rax, ptr64[r8]), "49 8b 00");
	CODEGEN_TEST(xMOV(ptr64[r8], rax), "49 89 00");
	CODEGEN_TEST(xMOV(r8, ptr64[r9]), "4d 8b 01");
	CODEGEN_TEST(xMOV(ptr64[r8], r9), "4d 89 08");

	// Loads and stores through base + index*scale + 8-bit displacement (SIB byte).
	CODEGEN_TEST(xMOV(rax, ptr64[rbx*4+3+rcx]), "48 8b 44 99 03");
	CODEGEN_TEST(xMOV(ptr64[rbx*4+3+rax], rcx), "48 89 4c 98 03");
	CODEGEN_TEST(xMOV(eax, ptr32[rbx*4+3+rcx]), "8b 44 99 03");
	CODEGEN_TEST(xMOV(ptr32[rbx*4+3+rax], ecx), "89 4c 98 03");
	CODEGEN_TEST(xMOV(r8, ptr64[r10*4+3+r9]), "4f 8b 44 91 03");
	CODEGEN_TEST(xMOV(ptr64[r9*4+3+r8], r10), "4f 89 54 88 03");

	// Immediate stores to memory.
	CODEGEN_TEST(xMOV(ptr64[r8], 0), "49 c7 00 00 00 00 00");
	CODEGEN_TEST(xMOV(ptr32[rax], 0), "c7 00 00 00 00 00");
	CODEGEN_TEST(xMOV(ptr32[rbx*4+3+rax], -1), "c7 44 98 03 ff ff ff ff");

	// Immediate loads into registers: 0xffffffff is expected as a 5-byte 32-bit mov,
	// -1 as a sign-extended imm32, and xMOV64 as the full 10-byte imm64 form.
	CODEGEN_TEST(xMOV(rax, 0xffffffff), "b8 ff ff ff ff");
	CODEGEN_TEST(xMOV(r8, -1), "49 c7 c0 ff ff ff ff");
	CODEGEN_TEST(xMOV64(rax, 0x1234567890), "48 b8 90 78 56 34 12 00 00 00");
	CODEGEN_TEST(xMOV64(r8, 0x1234567890), "49 b8 90 78 56 34 12 00 00 00");

	// RIP-relative store. The expected displacement f6 ff ff ff (-10) equals the negated
	// length of this 10-byte instruction, which is consistent with `base` being the
	// address the instruction is emitted at -- TODO confirm against codegen_tests.h.
	CODEGEN_TEST(xMOV(ptr32[base], 0x12), "c7 05 f6 ff ff ff 12 00 00 00");

	// Sign-extending moves (0f bf for a 16-bit source, opcode 63 for a 32-bit source).
	CODEGEN_TEST(xMOVSX(eax, dx), "0f bf c2");
	CODEGEN_TEST(xMOVSX(rax, r8d), "49 63 c0");
	CODEGEN_TEST(xMOVSX(rax, ebx), "48 63 c3");
}
|
|
|
|
// Encoding checks for xLEA, xLoadFarAddr and xLEA_Writeback.
// Several cases expect the emitter to substitute a shorter mov for the lea.
TEST(CodegenTests, LEATest)
{
	// A bare base register is expected to collapse into a register-to-register mov.
	CODEGEN_TEST(xLEA(rax, ptr[rcx]), "48 89 c8"); // Converted to mov rax, rcx
	CODEGEN_TEST(xLEA(eax, ptr[rcx]), "89 c8"); // Converted to mov eax, ecx
	CODEGEN_TEST(xLEA(rax, ptr[r8]), "4c 89 c0"); // Converted to mov rax, r8
	CODEGEN_TEST(xLEA(r8, ptr[r9]), "4d 89 c8"); // Converted to mov r8, r9

	// base + index*scale + displacement keeps the real lea opcode (8d).
	CODEGEN_TEST(xLEA(rax, ptr[rbx*4+3+rcx]), "48 8d 44 99 03");
	CODEGEN_TEST(xLEA(eax, ptr32[rbx*4+3+rcx]), "8d 44 99 03");
	CODEGEN_TEST(xLEA(r8, ptr[r10*4+3+r9]), "4f 8d 44 91 03");

	// `base` is expected as a RIP-relative lea (displacement -7 for a 7-byte instruction).
	CODEGEN_TEST(xLEA(r8, ptr[base]), "4c 8d 05 f9 ff ff ff");
	CODEGEN_TEST(xLoadFarAddr(r8, base), "4c 8d 05 f9 ff ff ff");

	// Absolute addresses: the 64-bit constant is expected as a 10-byte mov imm64,
	// the small constant as a 5-byte mov imm32.
	CODEGEN_TEST(xLoadFarAddr(r8, (void*)0xff00001234567890), "49 b8 90 78 56 34 12 00 00 ff");
	CODEGEN_TEST(xLEA(rax, ptr[(void*)0x1234]), "b8 34 12 00 00"); // Converted to mov rax, 0x1234
	CODEGEN_TEST(xLoadFarAddr(rax, (void*)0x1234), "b8 34 12 00 00");

	// NOTE(review): the cd cd cd 0d displacement looks like a placeholder to be patched
	// later -- confirm against the xLEA_Writeback implementation.
	CODEGEN_TEST(xLEA_Writeback(rbx), "48 8d 1d cd cd cd 0d");
}
|
|
|
|
// Encoding checks for xPUSH with register, immediate and memory operands.
TEST(CodegenTests, PUSHTest)
{
	// Register operands; r8 needs a REX prefix (41).
	CODEGEN_TEST(xPUSH(rax), "50");
	CODEGEN_TEST(xPUSH(r8), "41 50");

	// Immediates: 0x1234 is expected in the imm32 form (68), 0x12 in the imm8 form (6a).
	CODEGEN_TEST(xPUSH(0x1234), "68 34 12 00 00");
	CODEGEN_TEST(xPUSH(0x12), "6a 12");

	// Memory operands through a plain base register.
	CODEGEN_TEST(xPUSH(ptr64[rax]), "ff 30");
	CODEGEN_TEST(xPUSH(ptr64[r8]), "41 ff 30");

	// Memory operands through base + index*scale + displacement, covering every
	// combination of low/extended base and index registers.
	CODEGEN_TEST(xPUSH(ptr64[rax*2+3+rbx]), "ff 74 43 03");
	CODEGEN_TEST(xPUSH(ptr64[rax*2+3+r8]), "41 ff 74 40 03");
	CODEGEN_TEST(xPUSH(ptr64[r9*4+3+r8]), "43 ff 74 88 03");
	CODEGEN_TEST(xPUSH(ptr64[r8*4+3+rax]), "42 ff 74 80 03");
	CODEGEN_TEST(xPUSH(ptr64[rax*8+0x1234+rbx]), "ff b4 c3 34 12 00 00");

	// `base` is expected RIP-relative; a constant address as SIB-encoded disp32.
	CODEGEN_TEST(xPUSH(ptr64[base]), "ff 35 fa ff ff ff");
	CODEGEN_TEST(xPUSH(ptr64[(void*)0x1234]), "ff 34 25 34 12 00 00");
}
|
|
|
|
// Encoding checks for xPOP with register and memory operands.
// The memory cases use the same addressing forms as PUSHTest.
TEST(CodegenTests, POPTest)
{
	// Register operands; r8 needs a REX prefix (41).
	CODEGEN_TEST(xPOP(rax), "58");
	CODEGEN_TEST(xPOP(r8), "41 58");

	// Memory operands through a plain base register.
	CODEGEN_TEST(xPOP(ptr64[rax]), "8f 00");
	CODEGEN_TEST(xPOP(ptr64[r8]), "41 8f 00");

	// Memory operands through base + index*scale + displacement.
	CODEGEN_TEST(xPOP(ptr64[rax*2+3+rbx]), "8f 44 43 03");
	CODEGEN_TEST(xPOP(ptr64[rax*2+3+r8]), "41 8f 44 40 03");
	CODEGEN_TEST(xPOP(ptr64[r9*4+3+r8]), "43 8f 44 88 03");
	CODEGEN_TEST(xPOP(ptr64[r8*4+3+rax]), "42 8f 44 80 03");
	CODEGEN_TEST(xPOP(ptr64[rax*8+0x1234+rbx]), "8f 84 c3 34 12 00 00");

	// `base` is expected RIP-relative; a constant address as SIB-encoded disp32.
	CODEGEN_TEST(xPOP(ptr64[base]), "8f 05 fa ff ff ff");
	CODEGEN_TEST(xPOP(ptr64[(void*)0x1234]), "8f 04 25 34 12 00 00");
}
|
|
|
|
// Encoding checks for integer arithmetic: xINC, xDEC, xADD, xSUB, xMUL and xDIV.
TEST(CodegenTests, MathTest)
{
	// Increment / decrement on registers.
	CODEGEN_TEST(xINC(eax), "ff c0");
	CODEGEN_TEST(xDEC(rax), "48 ff c8");
	CODEGEN_TEST(xINC(r8), "49 ff c0");

	// Addition with register and immediate sources. Small immediates are expected in the
	// sign-extended imm8 form (83); rax/eax with an imm32 use the short accumulator opcode (05).
	CODEGEN_TEST(xADD(r8, r9), "4d 01 c8");
	CODEGEN_TEST(xADD(r8, 0x12), "49 83 c0 12");
	CODEGEN_TEST(xADD(rax, 0x1234), "48 05 34 12 00 00");

	// Addition into RIP-relative memory. The expected displacement accounts for the
	// trailing immediate: -7 with an imm8, -10 with an imm32.
	CODEGEN_TEST(xADD(ptr8[base], 1), "80 05 f9 ff ff ff 01");
	CODEGEN_TEST(xADD(ptr32[base], -0x60), "83 05 f9 ff ff ff a0");
	CODEGEN_TEST(xADD(ptr32[base], 0x1234), "81 05 f6 ff ff ff 34 12 00 00");

	CODEGEN_TEST(xADD(eax, ebx), "01 d8");
	CODEGEN_TEST(xADD(eax, 0x1234), "05 34 12 00 00");

	// Addition with base + index*scale + displacement memory operands.
	CODEGEN_TEST(xADD(r8, ptr64[r10*4+3+r9]), "4f 03 44 91 03");
	CODEGEN_TEST(xADD(ptr64[r9*4+3+r8], r10), "4f 01 54 88 03");
	CODEGEN_TEST(xADD(eax, ptr32[rbx*4+3+rcx]), "03 44 99 03");
	CODEGEN_TEST(xADD(ptr32[rax*4+3+rbx], ecx), "01 4c 83 03");

	// Subtraction.
	CODEGEN_TEST(xSUB(r8, 0x12), "49 83 e8 12");
	CODEGEN_TEST(xSUB(rax, 0x1234), "48 2d 34 12 00 00");
	CODEGEN_TEST(xSUB(eax, ptr32[rcx*4+rax]), "2b 04 88");

	// The expected bytes use f7 /5 and f7 /7, i.e. the signed imul / idiv forms.
	CODEGEN_TEST(xMUL(ptr32[base]), "f7 2d fa ff ff ff");
	CODEGEN_TEST(xMUL(ptr32[(void*)0x1234]), "f7 2c 25 34 12 00 00");
	CODEGEN_TEST(xDIV(ecx), "f7 f9");
}
|
|
|
|
// Encoding checks for shifts (xSHR, xSAR, xSHL) and bitwise logic (xAND, xXOR, xOR, xNOT).
TEST(CodegenTests, BitwiseTest)
{
	// Shifts by the count in cl (opcode d3).
	CODEGEN_TEST(xSHR(r8, cl), "49 d3 e8");
	CODEGEN_TEST(xSHR(rax, cl), "48 d3 e8");
	CODEGEN_TEST(xSHR(ecx, cl), "d3 e9");

	// Shifts by an immediate: a count of 1 is expected in the dedicated short form (d1),
	// any other count in the imm8 form (c1).
	CODEGEN_TEST(xSAR(r8, 1), "49 d1 f8");
	CODEGEN_TEST(xSAR(rax, 60), "48 c1 f8 3c");
	CODEGEN_TEST(xSAR(eax, 30), "c1 f8 1e");
	CODEGEN_TEST(xSHL(ebx, 30), "c1 e3 1e");
	CODEGEN_TEST(xSHL(ptr32[base], 4), "c1 25 f9 ff ff ff 04");

	// Two-operand logic with register and memory sources.
	CODEGEN_TEST(xAND(r8, r9), "4d 21 c8");
	CODEGEN_TEST(xXOR(rax, ptr64[r10]), "49 33 02");
	CODEGEN_TEST(xOR(esi, ptr32[rax+rbx]), "0b 34 18");

	// Bitwise NOT on register and memory operands.
	CODEGEN_TEST(xNOT(r8), "49 f7 d0");
	CODEGEN_TEST(xNOT(ptr64[rax]), "48 f7 10");
	CODEGEN_TEST(xNOT(ptr32[rbx]), "f7 13");
}
|
|
|
|
// Encoding checks for indirect jumps (xJMP) and conditional jumps (xJA, xJB).
TEST(CodegenTests, JmpTest)
{
	// Indirect jumps through a register or a memory operand (ff /4).
	CODEGEN_TEST(xJMP(r8), "41 ff e0");
	CODEGEN_TEST(xJMP(rdi), "ff e7");
	CODEGEN_TEST(xJMP(ptr64[rax]), "ff 20");

	// Conditional jumps: a target at `base` is expected in the 2-byte rel8 form
	// (displacement -2), a target 0xFFFF bytes below it in the 6-byte rel32 form.
	CODEGEN_TEST(xJA(base), "77 fe");
	CODEGEN_TEST(xJB((char*)base - 0xFFFF), "0f 82 fb ff fe ff");
}
|
|
|
|
// Encoding checks for the SIMD helpers when the emitter is in legacy-SSE mode.
// The test clears x86Emitter::use_avx first; it does not restore the previous value.
TEST(CodegenTests, SSETest)
{
	x86Emitter::use_avx = false;

	// Conversions between integer, single-precision and double-precision values.
	CODEGEN_TEST(xCVTDQ2PD(xmm0, ptr64[rax]), "f3 0f e6 00");
	CODEGEN_TEST(xCVTDQ2PS(xmm0, xmm8), "41 0f 5b c0");
	CODEGEN_TEST(xCVTPD2DQ(xmm8, ptr128[r8]), "f2 45 0f e6 00");
	CODEGEN_TEST(xCVTPD2PS(xmm1, xmm7), "66 0f 5a cf");
	CODEGEN_TEST(xCVTSD2SI(rax, xmm1), "f2 48 0f 2d c1");
	CODEGEN_TEST(xCVTSD2SI(esi, ptr64[rax]), "f2 0f 2d 30");
	CODEGEN_TEST(xCVTSD2SS(xmm3, xmm4), "f2 0f 5a dc");
	CODEGEN_TEST(xCVTSI2SS(xmm8, ecx), "f3 44 0f 2a c1");
	CODEGEN_TEST(xCVTSI2SS(xmm3, ptr32[r8]), "f3 41 0f 2a 18");
	CODEGEN_TEST(xCVTSI2SS(xmm3, ptr64[r8]), "f3 49 0f 2a 18");
	CODEGEN_TEST(xCVTSS2SD(xmm8, xmm7), "f3 44 0f 5a c7");
	CODEGEN_TEST(xCVTSS2SD(xmm4, ptr32[rcx]), "f3 0f 5a 21");
	CODEGEN_TEST(xCVTSS2SI(eax, xmm4), "f3 0f 2d c4");
	CODEGEN_TEST(xCVTSS2SI(rcx, ptr32[rax]), "f3 48 0f 2d 08");
	CODEGEN_TEST(xCVTTPD2DQ(xmm4, xmm7), "66 0f e6 e7");
	CODEGEN_TEST(xCVTTPS2DQ(xmm5, xmm3), "f3 0f 5b eb");
	CODEGEN_TEST(xCVTTSD2SI(rdx, xmm4), "f2 48 0f 2c d4");
	CODEGEN_TEST(xCVTTSS2SI(ecx, xmm3), "f3 0f 2c cb");

	// Packed shifts, with the count taken from a register/memory operand or an immediate.
	CODEGEN_TEST(xPSLL.W(xmm8, ptr[r8]), "66 45 0f f1 00");
	CODEGEN_TEST(xPSLL.D(xmm0, xmm1), "66 0f f2 c1");
	CODEGEN_TEST(xPSLL.Q(xmm4, ptr[rcx]), "66 0f f3 21");
	CODEGEN_TEST(xPSLL.W(xmm5, 2), "66 0f 71 f5 02");
	CODEGEN_TEST(xPSLL.D(xmm6, 3), "66 0f 72 f6 03");
	CODEGEN_TEST(xPSLL.Q(xmm7, 4), "66 0f 73 f7 04");
	CODEGEN_TEST(xPSLL.DQ(xmm8, 5), "66 41 0f 73 f8 05");
	CODEGEN_TEST(xPSRA.W(xmm4, xmm2), "66 0f e1 e2");
	CODEGEN_TEST(xPSRA.D(xmm5, ptr[rdi]), "66 0f e2 2f");
	CODEGEN_TEST(xPSRA.W(xmm4, 3), "66 0f 71 e4 03");
	CODEGEN_TEST(xPSRA.D(xmm5, 7), "66 0f 72 e5 07");
	CODEGEN_TEST(xPSRL.W(xmm8, ptr[r8]), "66 45 0f d1 00");
	CODEGEN_TEST(xPSRL.D(xmm0, xmm1), "66 0f d2 c1");
	CODEGEN_TEST(xPSRL.Q(xmm4, ptr[rcx]), "66 0f d3 21");
	CODEGEN_TEST(xPSRL.W(xmm5, 2), "66 0f 71 d5 02");
	CODEGEN_TEST(xPSRL.D(xmm6, 3), "66 0f 72 d6 03");
	CODEGEN_TEST(xPSRL.Q(xmm7, 4), "66 0f 73 d7 04");
	CODEGEN_TEST(xPSRL.DQ(xmm8, 5), "66 41 0f 73 d8 05");

	// Packed integer add, subtract and multiply.
	CODEGEN_TEST(xPADD.B(xmm1, xmm8), "66 41 0f fc c8");
	CODEGEN_TEST(xPADD.W(xmm4, xmm7), "66 0f fd e7");
	CODEGEN_TEST(xPADD.D(xmm2, ptr[rcx]), "66 0f fe 11");
	CODEGEN_TEST(xPADD.Q(xmm8, xmm2), "66 44 0f d4 c2");
	CODEGEN_TEST(xPADD.SB(xmm9, xmm8), "66 45 0f ec c8");
	CODEGEN_TEST(xPADD.SW(xmm2, ptr[r8]), "66 41 0f ed 10");
	CODEGEN_TEST(xPADD.USB(xmm3, xmm3), "66 0f dc db");
	CODEGEN_TEST(xPADD.USW(xmm2, xmm9), "66 41 0f dd d1");
	CODEGEN_TEST(xPSUB.B(xmm1, xmm8), "66 41 0f f8 c8");
	CODEGEN_TEST(xPSUB.W(xmm4, xmm7), "66 0f f9 e7");
	CODEGEN_TEST(xPSUB.D(xmm2, ptr[rcx]), "66 0f fa 11");
	CODEGEN_TEST(xPSUB.Q(xmm8, xmm2), "66 44 0f fb c2");
	CODEGEN_TEST(xPSUB.SB(xmm9, xmm8), "66 45 0f e8 c8");
	CODEGEN_TEST(xPSUB.SW(xmm2, ptr[r8]), "66 41 0f e9 10");
	CODEGEN_TEST(xPSUB.USB(xmm3, xmm3), "66 0f d8 db");
	CODEGEN_TEST(xPSUB.USW(xmm2, xmm9), "66 41 0f d9 d1");
	CODEGEN_TEST(xPMUL.LW(xmm2, xmm8), "66 41 0f d5 d0");
	CODEGEN_TEST(xPMUL.HW(xmm9, ptr[r9]), "66 45 0f e5 09");
	CODEGEN_TEST(xPMUL.HUW(xmm4, xmm3), "66 0f e4 e3");
	CODEGEN_TEST(xPMUL.UDQ(xmm1, xmm7), "66 0f f4 cf");
	CODEGEN_TEST(xPMUL.HRSW(xmm2, xmm4), "66 0f 38 0b d4");
	CODEGEN_TEST(xPMUL.LD(xmm1, xmm8), "66 41 0f 38 40 c8");
	CODEGEN_TEST(xPMUL.DQ(xmm4, xmm9), "66 41 0f 38 28 e1");

	// Floating-point reciprocal, square root and and-not.
	CODEGEN_TEST(xRSQRT.PS(xmm0, xmm8), "41 0f 52 c0");
	CODEGEN_TEST(xRSQRT.SS(xmm4, ptr[r9]), "f3 41 0f 52 21");
	CODEGEN_TEST(xRCP.PS(xmm4, ptr[rcx]), "0f 53 21");
	CODEGEN_TEST(xRCP.SS(xmm5, xmm8), "f3 41 0f 53 e8");
	CODEGEN_TEST(xSQRT.PS(xmm4, xmm2), "0f 51 e2");
	CODEGEN_TEST(xSQRT.SS(xmm5, xmm1), "f3 0f 51 e9");
	CODEGEN_TEST(xSQRT.PD(xmm7, ptr[rdi]), "66 0f 51 3f");
	CODEGEN_TEST(xSQRT.SD(xmm5, xmm2), "f2 0f 51 ea");
	CODEGEN_TEST(xANDN.PS(xmm6, ptr[rdi]), "0f 55 37");
	CODEGEN_TEST(xANDN.PD(xmm3, xmm8), "66 41 0f 55 d8");

	// Packed absolute value, sign and multiply-add.
	CODEGEN_TEST(xPABS.B(xmm0, xmm2), "66 0f 38 1c c2");
	CODEGEN_TEST(xPABS.W(xmm4, xmm8), "66 41 0f 38 1d e0");
	CODEGEN_TEST(xPABS.D(xmm6, ptr[rax]), "66 0f 38 1e 30");
	CODEGEN_TEST(xPSIGN.B(xmm0, xmm2), "66 0f 38 08 c2");
	CODEGEN_TEST(xPSIGN.W(xmm4, xmm8), "66 41 0f 38 09 e0");
	CODEGEN_TEST(xPSIGN.D(xmm2, ptr[r8]), "66 41 0f 38 0a 10");
	CODEGEN_TEST(xPMADD.WD(xmm0, xmm8), "66 41 0f f5 c0");
	CODEGEN_TEST(xPMADD.UBSW(xmm0, xmm8), "66 41 0f 38 04 c0");

	// Register/memory moves, blends and element insert/extract.
	CODEGEN_TEST(xMOVAPS(xmm0, xmm1), "0f 28 c1");
	CODEGEN_TEST(xMOVAPS(xmm8, xmm9), "45 0f 28 c1");
	CODEGEN_TEST(xMOVUPS(xmm8, ptr128[r8+r9]), "47 0f 10 04 08");
	CODEGEN_TEST(xMOVAPS(ptr128[rax+r9], xmm8), "46 0f 29 04 08");
	CODEGEN_TEST(xBLEND.PS(xmm0, xmm1, 0x55), "66 0f 3a 0c c1 55");
	CODEGEN_TEST(xBLEND.PD(xmm8, xmm9, 0xaa), "66 45 0f 3a 0d c1 aa");
	CODEGEN_TEST(xPBLEND.W(xmm0, xmm1, 0x55), "66 0f 3a 0e c1 55");
	CODEGEN_TEST(xPBLEND.VB(xmm1, xmm2), "66 0f 38 10 ca");
	CODEGEN_TEST(xEXTRACTPS(ptr32[base], xmm1, 2), "66 0f 3a 17 0d f6 ff ff ff 02");
	CODEGEN_TEST(xMOVD(eax, xmm1), "66 0f 7e c8");
	CODEGEN_TEST(xMOVD(eax, xmm10), "66 44 0f 7e d0");
	CODEGEN_TEST(xMOVD(rax, xmm1), "66 48 0f 7e c8");
	CODEGEN_TEST(xMOVD(r10, xmm1), "66 49 0f 7e ca");
	CODEGEN_TEST(xMOVD(rax, xmm10), "66 4c 0f 7e d0");
	CODEGEN_TEST(xMOVD(r10, xmm10), "66 4d 0f 7e d2");
	CODEGEN_TEST(xPINSR.B(xmm0, ebx, 1), "66 0f 3a 20 c3 01");
	CODEGEN_TEST(xPINSR.W(xmm0, ebx, 1), "66 0f c4 c3 01");
	CODEGEN_TEST(xPINSR.D(xmm0, ebx, 1), "66 0f 3a 22 c3 01");
	CODEGEN_TEST(xPINSR.Q(xmm0, rbx, 1), "66 48 0f 3a 22 c3 01");
	CODEGEN_TEST(xPEXTR.B(ebx, xmm0, 1), "66 0f 3a 14 c3 01");
	// Unlike the 0f 3a extract forms, opcode 0f c5 carries the GPR destination in
	// ModRM.reg and the XMM source in ModRM.rm, so ebx <- xmm0 is d8 (11 011 000).
	// The previous expectation c3 decodes as pextrw eax, xmm3, 1.
	CODEGEN_TEST(xPEXTR.W(ebx, xmm0, 1), "66 0f c5 d8 01");
	CODEGEN_TEST(xPEXTR.D(ebx, xmm0, 1), "66 0f 3a 16 c3 01");
	CODEGEN_TEST(xPEXTR.Q(rbx, xmm0, 1), "66 48 0f 3a 16 c3 01");
	CODEGEN_TEST(xPEXTR.Q(ptr64[rax], xmm0, 1), "66 48 0f 3a 16 00 01");
}
|
|
|
|
// Encoding checks for the SIMD helpers when the emitter is in AVX mode (128-bit operands).
// The test sets x86Emitter::use_avx first; it does not restore the previous value.
// The first half repeats the calls from SSETest and expects VEX-prefixed (c5 / c4) bytes;
// the second half covers the explicit three-operand xV* helpers.
TEST(CodegenTests, AVXTest)
{
	x86Emitter::use_avx = true;

	// Conversions between integer, single-precision and double-precision values.
	CODEGEN_TEST(xCVTDQ2PD(xmm0, ptr64[rax]), "c5 fa e6 00");
	CODEGEN_TEST(xCVTDQ2PS(xmm0, xmm8), "c4 c1 78 5b c0");
	CODEGEN_TEST(xCVTPD2DQ(xmm8, ptr128[r8]), "c4 41 7b e6 00");
	CODEGEN_TEST(xCVTPD2PS(xmm1, xmm7), "c5 f9 5a cf");
	CODEGEN_TEST(xCVTSD2SI(rax, xmm1), "c4 e1 fb 2d c1");
	CODEGEN_TEST(xCVTSD2SI(esi, ptr64[rax]), "c5 fb 2d 30");
	CODEGEN_TEST(xCVTSD2SS(xmm3, xmm4), "c5 e3 5a dc");
	CODEGEN_TEST(xCVTSI2SS(xmm8, ecx), "c5 3a 2a c1");
	CODEGEN_TEST(xCVTSI2SS(xmm3, ptr32[r8]), "c4 c1 62 2a 18");
	CODEGEN_TEST(xCVTSI2SS(xmm3, ptr64[r8]), "c4 c1 e2 2a 18");
	CODEGEN_TEST(xCVTSS2SD(xmm8, xmm7), "c5 3a 5a c7");
	CODEGEN_TEST(xCVTSS2SD(xmm4, ptr32[rcx]), "c5 da 5a 21");
	CODEGEN_TEST(xCVTSS2SI(eax, xmm4), "c5 fa 2d c4");
	CODEGEN_TEST(xCVTSS2SI(rcx, ptr32[rax]), "c4 e1 fa 2d 08");
	CODEGEN_TEST(xCVTTPD2DQ(xmm4, xmm7), "c5 f9 e6 e7");
	CODEGEN_TEST(xCVTTPS2DQ(xmm5, xmm3), "c5 fa 5b eb");
	CODEGEN_TEST(xCVTTSD2SI(rdx, xmm4), "c4 e1 fb 2c d4");
	CODEGEN_TEST(xCVTTSS2SI(ecx, xmm3), "c5 fa 2c cb");

	// Packed shifts, with the count taken from a register/memory operand or an immediate.
	CODEGEN_TEST(xPSLL.W(xmm8, ptr[r8]), "c4 41 39 f1 00");
	CODEGEN_TEST(xPSLL.D(xmm0, xmm1), "c5 f9 f2 c1");
	CODEGEN_TEST(xPSLL.Q(xmm4, ptr[rcx]), "c5 d9 f3 21");
	CODEGEN_TEST(xPSLL.W(xmm5, 2), "c5 d1 71 f5 02");
	CODEGEN_TEST(xPSLL.D(xmm6, 3), "c5 c9 72 f6 03");
	CODEGEN_TEST(xPSLL.Q(xmm7, 4), "c5 c1 73 f7 04");
	CODEGEN_TEST(xPSLL.DQ(xmm8, 5), "c4 c1 39 73 f8 05");
	CODEGEN_TEST(xPSRA.W(xmm4, xmm2), "c5 d9 e1 e2");
	CODEGEN_TEST(xPSRA.D(xmm5, ptr[rdi]), "c5 d1 e2 2f");
	CODEGEN_TEST(xPSRA.W(xmm4, 3), "c5 d9 71 e4 03");
	CODEGEN_TEST(xPSRA.D(xmm5, 7), "c5 d1 72 e5 07");
	CODEGEN_TEST(xPSRL.W(xmm8, ptr[r8]), "c4 41 39 d1 00");
	CODEGEN_TEST(xPSRL.D(xmm0, xmm1), "c5 f9 d2 c1");
	CODEGEN_TEST(xPSRL.Q(xmm4, ptr[rcx]), "c5 d9 d3 21");
	CODEGEN_TEST(xPSRL.W(xmm5, 2), "c5 d1 71 d5 02");
	CODEGEN_TEST(xPSRL.D(xmm6, 3), "c5 c9 72 d6 03");
	CODEGEN_TEST(xPSRL.Q(xmm7, 4), "c5 c1 73 d7 04");
	CODEGEN_TEST(xPSRL.DQ(xmm8, 5), "c4 c1 39 73 d8 05");

	// Packed integer add, subtract and multiply. For commutative operations whose second
	// operand is xmm8+, the expected bytes have the sources swapped ("=>" comments) so the
	// shorter 2-byte VEX prefix can be used; non-commutative ones keep the 3-byte prefix.
	CODEGEN_TEST(xPADD.B(xmm1, xmm8), "c5 b9 fc c9"); // => vpaddb xmm1, xmm8, xmm1
	CODEGEN_TEST(xPADD.W(xmm4, xmm7), "c5 d9 fd e7");
	CODEGEN_TEST(xPADD.D(xmm2, ptr[rcx]), "c5 e9 fe 11");
	CODEGEN_TEST(xPADD.Q(xmm8, xmm2), "c5 39 d4 c2");
	CODEGEN_TEST(xPADD.SB(xmm9, xmm8), "c4 41 31 ec c8");
	CODEGEN_TEST(xPADD.SW(xmm2, ptr[r8]), "c4 c1 69 ed 10");
	CODEGEN_TEST(xPADD.USB(xmm3, xmm3), "c5 e1 dc db");
	CODEGEN_TEST(xPADD.USW(xmm2, xmm9), "c5 b1 dd d2"); // => vpaddusw xmm2, xmm9, xmm2
	CODEGEN_TEST(xPSUB.B(xmm1, xmm8), "c4 c1 71 f8 c8");
	CODEGEN_TEST(xPSUB.W(xmm4, xmm7), "c5 d9 f9 e7");
	CODEGEN_TEST(xPSUB.D(xmm2, ptr[rcx]), "c5 e9 fa 11");
	CODEGEN_TEST(xPSUB.Q(xmm8, xmm2), "c5 39 fb c2");
	CODEGEN_TEST(xPSUB.SB(xmm9, xmm8), "c4 41 31 e8 c8");
	CODEGEN_TEST(xPSUB.SW(xmm2, ptr[r8]), "c4 c1 69 e9 10");
	CODEGEN_TEST(xPSUB.USB(xmm3, xmm3), "c5 e1 d8 db");
	CODEGEN_TEST(xPSUB.USW(xmm2, xmm9), "c4 c1 69 d9 d1");
	CODEGEN_TEST(xPMUL.LW(xmm2, xmm8), "c5 b9 d5 d2"); // => vpmullw xmm2, xmm8, xmm2
	CODEGEN_TEST(xPMUL.HW(xmm9, ptr[r9]), "c4 41 31 e5 09");
	CODEGEN_TEST(xPMUL.HUW(xmm4, xmm3), "c5 d9 e4 e3");
	CODEGEN_TEST(xPMUL.UDQ(xmm1, xmm7), "c5 f1 f4 cf");
	CODEGEN_TEST(xPMUL.HRSW(xmm2, xmm4), "c4 e2 69 0b d4");
	CODEGEN_TEST(xPMUL.LD(xmm1, xmm8), "c4 c2 71 40 c8");
	CODEGEN_TEST(xPMUL.DQ(xmm4, xmm9), "c4 c2 59 28 e1");

	// Floating-point reciprocal, square root and and-not.
	CODEGEN_TEST(xRSQRT.PS(xmm0, xmm8), "c4 c1 78 52 c0");
	CODEGEN_TEST(xRSQRT.SS(xmm4, ptr[r9]), "c4 c1 5a 52 21");
	CODEGEN_TEST(xRCP.PS(xmm4, ptr[rcx]), "c5 f8 53 21");
	CODEGEN_TEST(xRCP.SS(xmm5, xmm8), "c4 c1 52 53 e8");
	CODEGEN_TEST(xSQRT.PS(xmm4, xmm2), "c5 f8 51 e2");
	CODEGEN_TEST(xSQRT.SS(xmm5, xmm1), "c5 d2 51 e9");
	CODEGEN_TEST(xSQRT.PD(xmm7, ptr[rdi]), "c5 f9 51 3f");
	CODEGEN_TEST(xSQRT.SD(xmm5, xmm2), "c5 d3 51 ea");
	CODEGEN_TEST(xANDN.PS(xmm6, ptr[rdi]), "c5 c8 55 37");
	CODEGEN_TEST(xANDN.PD(xmm3, xmm8), "c4 c1 61 55 d8");

	// Packed absolute value, sign and multiply-add.
	CODEGEN_TEST(xPABS.B(xmm0, xmm2), "c4 e2 79 1c c2");
	CODEGEN_TEST(xPABS.W(xmm4, xmm8), "c4 c2 79 1d e0");
	CODEGEN_TEST(xPABS.D(xmm6, ptr[rax]), "c4 e2 79 1e 30");
	CODEGEN_TEST(xPSIGN.B(xmm0, xmm2), "c4 e2 79 08 c2");
	CODEGEN_TEST(xPSIGN.W(xmm4, xmm8), "c4 c2 59 09 e0");
	CODEGEN_TEST(xPSIGN.D(xmm2, ptr[r8]), "c4 c2 69 0a 10");
	CODEGEN_TEST(xPMADD.WD(xmm0, xmm8), "c5 b9 f5 c0"); // => vpmaddwd xmm0, xmm8, xmm0
	CODEGEN_TEST(xPMADD.UBSW(xmm0, xmm8), "c4 c2 79 04 c0");

	// Explicit VEX moves.
	CODEGEN_TEST(xVMOVAPS(xmm0, xmm1), "c5 f8 28 c1");
	CODEGEN_TEST(xVMOVAPS(xmm0, ptr32[rdi]), "c5 f8 28 07");
	CODEGEN_TEST(xVMOVAPS(ptr32[rdi], xmm0), "c5 f8 29 07");
	CODEGEN_TEST(xVMOVUPS(xmm0, ptr32[rdi]), "c5 f8 10 07");
	CODEGEN_TEST(xVMOVUPS(ptr32[rdi], xmm0), "c5 f8 11 07");

	// Three-operand floating-point arithmetic; the PS/PD/SS/SD variants differ only in
	// the low two bits of the second VEX byte (f0 / f1 / f2 / f3).
	CODEGEN_TEST(xVADD.PS(xmm0, xmm1, xmm2), "c5 f0 58 c2");
	CODEGEN_TEST(xVADD.PD(xmm0, xmm1, xmm2), "c5 f1 58 c2");
	CODEGEN_TEST(xVADD.SS(xmm0, xmm1, xmm2), "c5 f2 58 c2");
	CODEGEN_TEST(xVADD.SD(xmm0, xmm1, xmm2), "c5 f3 58 c2");
	CODEGEN_TEST(xVSUB.PS(xmm0, xmm1, xmm2), "c5 f0 5c c2");
	CODEGEN_TEST(xVSUB.PD(xmm0, xmm1, xmm2), "c5 f1 5c c2");
	CODEGEN_TEST(xVSUB.SS(xmm0, xmm1, xmm2), "c5 f2 5c c2");
	CODEGEN_TEST(xVSUB.SD(xmm0, xmm1, xmm2), "c5 f3 5c c2");
	CODEGEN_TEST(xVMUL.PS(xmm0, xmm1, xmm2), "c5 f0 59 c2");
	CODEGEN_TEST(xVMUL.PD(xmm0, xmm1, xmm2), "c5 f1 59 c2");
	CODEGEN_TEST(xVMUL.SS(xmm0, xmm1, xmm2), "c5 f2 59 c2");
	CODEGEN_TEST(xVMUL.SD(xmm0, xmm1, xmm2), "c5 f3 59 c2");
	CODEGEN_TEST(xVDIV.PS(xmm0, xmm1, xmm2), "c5 f0 5e c2");
	CODEGEN_TEST(xVDIV.PD(xmm0, xmm1, xmm2), "c5 f1 5e c2");
	CODEGEN_TEST(xVDIV.SS(xmm0, xmm1, xmm2), "c5 f2 5e c2");
	CODEGEN_TEST(xVDIV.SD(xmm0, xmm1, xmm2), "c5 f3 5e c2");

	// Don't need to test all variants, since they just change the condition immediate.
	CODEGEN_TEST(xVCMP.EQ.PS(xmm0, xmm1, xmm2), "c5 f0 c2 c2 00");
	CODEGEN_TEST(xVCMP.EQ.PD(xmm0, xmm1, xmm2), "c5 f1 c2 c2 00");
	CODEGEN_TEST(xVCMP.EQ.SS(xmm0, xmm1, xmm2), "c5 f2 c2 c2 00");
	CODEGEN_TEST(xVCMP.EQ.SD(xmm0, xmm1, xmm2), "c5 f3 c2 c2 00");
	CODEGEN_TEST(xVCMP.LE.PS(xmm0, xmm1, xmm2), "c5 f0 c2 c2 02");
	CODEGEN_TEST(xVCMP.LE.PD(xmm0, xmm1, xmm2), "c5 f1 c2 c2 02");
	CODEGEN_TEST(xVCMP.LE.SS(xmm0, xmm1, xmm2), "c5 f2 c2 c2 02");
	CODEGEN_TEST(xVCMP.LE.SD(xmm0, xmm1, xmm2), "c5 f3 c2 c2 02");

	// Packed integer compares.
	CODEGEN_TEST(xVPCMP.EQB(xmm0, xmm1, xmm2), "c5 f1 74 c2");
	CODEGEN_TEST(xVPCMP.EQW(xmm0, xmm1, xmm2), "c5 f1 75 c2");
	CODEGEN_TEST(xVPCMP.EQD(xmm0, xmm1, xmm2), "c5 f1 76 c2");
	CODEGEN_TEST(xVPCMP.GTB(xmm0, xmm1, xmm2), "c5 f1 64 c2");
	CODEGEN_TEST(xVPCMP.GTW(xmm0, xmm1, xmm2), "c5 f1 65 c2");
	CODEGEN_TEST(xVPCMP.GTD(xmm0, xmm1, xmm2), "c5 f1 66 c2");

	// Packed integer logic.
	CODEGEN_TEST(xVPAND(xmm0, xmm1, xmm2), "c5 f1 db c2");
	CODEGEN_TEST(xVPANDN(xmm0, xmm1, xmm2), "c5 f1 df c2");
	CODEGEN_TEST(xVPOR(xmm0, xmm1, xmm2), "c5 f1 eb c2");
	CODEGEN_TEST(xVPXOR(xmm0, xmm1, xmm2), "c5 f1 ef c2");

	// Sign-mask extraction into a general-purpose register.
	CODEGEN_TEST(xVMOVMSKPS(eax, xmm1), "c5 f8 50 c1");
	CODEGEN_TEST(xVMOVMSKPD(eax, xmm1), "c5 f9 50 c1");
}
|
|
|
|
// Encoding checks for the explicit xV* helpers with 256-bit (ymm) operands.
// The test sets x86Emitter::use_avx first; it does not restore the previous value.
// Compared with the xmm cases in AVXTest, the expected second VEX byte has the L bit
// set (e.g. fc instead of f8, f4 instead of f0).
TEST(CodegenTests, AVX256Test)
{
	x86Emitter::use_avx = true;

	// Aligned and unaligned moves.
	CODEGEN_TEST(xVMOVAPS(ymm0, ymm1), "c5 fc 28 c1");
	CODEGEN_TEST(xVMOVAPS(ymm0, ptr32[rdi]), "c5 fc 28 07");
	CODEGEN_TEST(xVMOVAPS(ptr32[rdi], ymm0), "c5 fc 29 07");
	CODEGEN_TEST(xVMOVUPS(ymm0, ptr32[rdi]), "c5 fc 10 07");
	CODEGEN_TEST(xVMOVUPS(ptr32[rdi], ymm0), "c5 fc 11 07");

	CODEGEN_TEST(xVZEROUPPER(), "c5 f8 77");

	// Packed floating-point arithmetic.
	CODEGEN_TEST(xVADD.PS(ymm0, ymm1, ymm2), "c5 f4 58 c2");
	CODEGEN_TEST(xVADD.PD(ymm0, ymm1, ymm2), "c5 f5 58 c2");
	CODEGEN_TEST(xVSUB.PS(ymm0, ymm1, ymm2), "c5 f4 5c c2");
	CODEGEN_TEST(xVSUB.PD(ymm0, ymm1, ymm2), "c5 f5 5c c2");
	CODEGEN_TEST(xVMUL.PS(ymm0, ymm1, ymm2), "c5 f4 59 c2");
	CODEGEN_TEST(xVMUL.PD(ymm0, ymm1, ymm2), "c5 f5 59 c2");
	CODEGEN_TEST(xVDIV.PS(ymm0, ymm1, ymm2), "c5 f4 5e c2");
	CODEGEN_TEST(xVDIV.PD(ymm0, ymm1, ymm2), "c5 f5 5e c2");

	// Packed floating-point compares; the trailing byte is the condition immediate.
	CODEGEN_TEST(xVCMP.EQ.PS(ymm0, ymm1, ymm2), "c5 f4 c2 c2 00");
	CODEGEN_TEST(xVCMP.EQ.PD(ymm0, ymm1, ymm2), "c5 f5 c2 c2 00");
	CODEGEN_TEST(xVCMP.LE.PS(ymm0, ymm1, ymm2), "c5 f4 c2 c2 02");
	CODEGEN_TEST(xVCMP.LE.PD(ymm0, ymm1, ymm2), "c5 f5 c2 c2 02");

	// Packed integer compares.
	CODEGEN_TEST(xVPCMP.EQB(ymm0, ymm1, ymm2), "c5 f5 74 c2");
	CODEGEN_TEST(xVPCMP.EQW(ymm0, ymm1, ymm2), "c5 f5 75 c2");
	CODEGEN_TEST(xVPCMP.EQD(ymm0, ymm1, ymm2), "c5 f5 76 c2");
	CODEGEN_TEST(xVPCMP.GTB(ymm0, ymm1, ymm2), "c5 f5 64 c2");
	CODEGEN_TEST(xVPCMP.GTW(ymm0, ymm1, ymm2), "c5 f5 65 c2");
	CODEGEN_TEST(xVPCMP.GTD(ymm0, ymm1, ymm2), "c5 f5 66 c2");

	// Packed integer logic.
	CODEGEN_TEST(xVPAND(ymm0, ymm1, ymm2), "c5 f5 db c2");
	CODEGEN_TEST(xVPANDN(ymm0, ymm1, ymm2), "c5 f5 df c2");
	CODEGEN_TEST(xVPOR(ymm0, ymm1, ymm2), "c5 f5 eb c2");
	CODEGEN_TEST(xVPXOR(ymm0, ymm1, ymm2), "c5 f5 ef c2");

	// Sign-mask extraction into a general-purpose register.
	CODEGEN_TEST(xVMOVMSKPS(eax, ymm1), "c5 fc 50 c1");
	CODEGEN_TEST(xVMOVMSKPD(eax, ymm1), "c5 fd 50 c1");
}
|
|
|
|
// Encoding checks for xSETL across all sixteen 8-bit low registers, to confirm
// the REX prefix is emitted exactly where the register requires one.
TEST(CodegenTests, Extended8BitTest)
{
	// al/cl/dl/bl: no prefix expected.
	CODEGEN_TEST(xSETL(al), "0f 9c c0");
	CODEGEN_TEST(xSETL(cl), "0f 9c c1");
	CODEGEN_TEST(xSETL(dl), "0f 9c c2");
	CODEGEN_TEST(xSETL(bl), "0f 9c c3");

	// spl/bpl/sil/dil: a bare REX prefix (40) is expected; without it the same
	// register numbers would select ah/ch/dh/bh.
	CODEGEN_TEST(xSETL(spl), "40 0f 9c c4");
	CODEGEN_TEST(xSETL(bpl), "40 0f 9c c5");
	CODEGEN_TEST(xSETL(sil), "40 0f 9c c6");
	CODEGEN_TEST(xSETL(dil), "40 0f 9c c7");

	// r8b-r15b: REX.B (41) is expected.
	CODEGEN_TEST(xSETL(r8b), "41 0f 9c c0");
	CODEGEN_TEST(xSETL(r9b), "41 0f 9c c1");
	CODEGEN_TEST(xSETL(r10b), "41 0f 9c c2");
	CODEGEN_TEST(xSETL(r11b), "41 0f 9c c3");
	CODEGEN_TEST(xSETL(r12b), "41 0f 9c c4");
	CODEGEN_TEST(xSETL(r13b), "41 0f 9c c5");
	CODEGEN_TEST(xSETL(r14b), "41 0f 9c c6");
	CODEGEN_TEST(xSETL(r15b), "41 0f 9c c7");
}
|