2f9dea5cc3
590c10e37 fix typo 396715a89 use github action 69a25fd92 change build status to travis-ci.com a6a9dac91 meanings of the name 8d1e41b65 test_util.cpp supports OpenBSD 77ffe7173 Merge pull request #115 from Ryan-rsm-McKenzie/master a1da3403a fix build interface include directory e0136d4ef fix add_library call with INTERFACE 3071eee0c support slightly more modern cmake e626d6209 v5.991 a49c4bc11 disable XBYAK_CONSTEXPR for g++-5 -std=c++-14 70777a699 Merge branch 'atafra-old_mac_fix' into dev 6b81678d0 fixed compile error on some older macOS versions 2c3b43f15 refactor util 91784e2b8 test_util checks AMX and AVX_VNNI 70b70c557 update to v5.99 284cc5bed refactor 6b3eb9c1e default encoding is always evex f85b1100b refactor vnni 276d09bae Merge branch 'akharito-akharito/adl_support' into dev 50df86ce3 v5.98 97ce92d58 Merge branch 'akharito/adl_support' of https://github.com/akharito/xbyak into akharito-akharito/adl_support 1f119a04a support [scale * reg] 9ee1bef9a cpuid - check that GRT CPUID leaf 7 subleaf 0 should return EAX=1 be93adb2c add AVX VNNI instruction support 0c277240a add ADL CPUID a9a5cc2e2 Add option to choose VEX or EVEX encoding 29bfd25ba fix indent a0c49fa2e Merge branch 'atafra-mac_avx512_fix' into dev ea388b3c6 fixed incorrect detection of AVX-512 on macOS ed1b8186f Merge branch 'FEX-Emu-extended_features' into dev 3dacddfec Merge branch 'extended_features' of https://github.com/FEX-Emu/xbyak into FEX-Emu-extended_features 898f78ca3 Merge branch 'kariya-mitsuru-use-sh' 0b7f1411c Merge branch 'use-sh' of https://github.com/kariya-mitsuru/xbyak into kariya-mitsuru-use-sh 99e2b13b2 Fixes extended feature support checking b0a43c7e5 Use sh instead of tcsh for test scripts 87e8f41ae remove warning of _MSC_VER git-subtree-dir: externals/xbyak git-subtree-split: 590c10e3746978dbfcf102d6da933ac2659e4544
134 lines
3.6 KiB
C++
134 lines
3.6 KiB
C++
#include <stdio.h>
|
|
#include "xbyak/xbyak_util.h"
|
|
|
|
/* Number of elements in a true array (not a pointer): total size over the size of one element. */
#define NUM_OF_ARRAY(x) (sizeof(x) / sizeof(*(x)))
|
|
|
|
/*
	Generates a tiny function `int f()` that returns the number of set bits in n,
	computed by the CPU's popcnt instruction.

	The generator is constructed with a 4096 buffer-size argument and
	Xbyak::DontSetProtectRWE, so the caller is expected to adjust the memory
	protection itself (putCPUinfo() calls setProtectModeRE() before running the
	code and setProtectModeRW() afterwards).

	@param n value whose set bits are counted; it is embedded in the generated
	         code as an immediate operand.
*/
struct PopCountTest : public Xbyak::CodeGenerator {
	PopCountTest(int n)
		: Xbyak::CodeGenerator(4096, Xbyak::DontSetProtectRWE)
	{
		// The emitted sequence must be exactly mov / popcnt / ret. Any ret()
		// emitted before the popcnt would make the function return at once
		// with whatever happened to be in eax.
		mov(eax, n);
		popcnt(eax, eax); // eax = number of 1 bits in eax
		ret();            // result is returned in eax
	}
};
|
|
|
|
void putCPUinfo()
|
|
{
|
|
using namespace Xbyak::util;
|
|
Cpu cpu;
|
|
printf("vendor %s\n", cpu.has(Cpu::tINTEL) ? "intel" : "amd");
|
|
static const struct {
|
|
Cpu::Type type;
|
|
const char *str;
|
|
} tbl[] = {
|
|
{ Cpu::tMMX, "mmx" },
|
|
{ Cpu::tMMX2, "mmx2" },
|
|
{ Cpu::tCMOV, "cmov" },
|
|
{ Cpu::tSSE, "sse" },
|
|
{ Cpu::tSSE2, "sse2" },
|
|
{ Cpu::tSSE3, "sse3" },
|
|
{ Cpu::tSSSE3, "ssse3" },
|
|
{ Cpu::tSSE41, "sse41" },
|
|
{ Cpu::tSSE42, "sse42" },
|
|
{ Cpu::tPOPCNT, "popcnt" },
|
|
{ Cpu::t3DN, "3dn" },
|
|
{ Cpu::tE3DN, "e3dn" },
|
|
{ Cpu::tSSE4a, "sse4a" },
|
|
{ Cpu::tSSE5, "sse5" },
|
|
{ Cpu::tAESNI, "aesni" },
|
|
{ Cpu::tRDTSCP, "rdtscp" },
|
|
{ Cpu::tOSXSAVE, "osxsave(xgetvb)" },
|
|
{ Cpu::tPCLMULQDQ, "pclmulqdq" },
|
|
{ Cpu::tAVX, "avx" },
|
|
{ Cpu::tFMA, "fma" },
|
|
{ Cpu::tAVX2, "avx2" },
|
|
{ Cpu::tBMI1, "bmi1" },
|
|
{ Cpu::tBMI2, "bmi2" },
|
|
{ Cpu::tLZCNT, "lzcnt" },
|
|
{ Cpu::tPREFETCHW, "prefetchw" },
|
|
{ Cpu::tENHANCED_REP, "enh_rep" },
|
|
{ Cpu::tRDRAND, "rdrand" },
|
|
{ Cpu::tADX, "adx" },
|
|
{ Cpu::tRDSEED, "rdseed" },
|
|
{ Cpu::tSMAP, "smap" },
|
|
{ Cpu::tHLE, "hle" },
|
|
{ Cpu::tRTM, "rtm" },
|
|
{ Cpu::tMPX, "mpx" },
|
|
{ Cpu::tSHA, "sha" },
|
|
{ Cpu::tPREFETCHWT1, "prefetchwt1" },
|
|
{ Cpu::tF16C, "f16c" },
|
|
{ Cpu::tMOVBE, "movbe" },
|
|
{ Cpu::tAVX512F, "avx512f" },
|
|
{ Cpu::tAVX512DQ, "avx512dq" },
|
|
{ Cpu::tAVX512IFMA, "avx512_ifma" },
|
|
{ Cpu::tAVX512PF, "avx512pf" },
|
|
{ Cpu::tAVX512ER, "avx512er" },
|
|
{ Cpu::tAVX512CD, "avx512cd" },
|
|
{ Cpu::tAVX512BW, "avx512bw" },
|
|
{ Cpu::tAVX512VL, "avx512vl" },
|
|
{ Cpu::tAVX512VBMI, "avx512_vbmi" },
|
|
{ Cpu::tAVX512_4VNNIW, "avx512_4vnniw" },
|
|
{ Cpu::tAVX512_4FMAPS, "avx512_4fmaps" },
|
|
|
|
{ Cpu::tAVX512_VBMI2, "avx512_vbmi2" },
|
|
{ Cpu::tGFNI, "gfni" },
|
|
{ Cpu::tVAES, "vaes" },
|
|
{ Cpu::tVPCLMULQDQ, "vpclmulqdq" },
|
|
{ Cpu::tAVX512_VNNI, "avx512_vnni" },
|
|
{ Cpu::tAVX512_BITALG, "avx512_bitalg" },
|
|
{ Cpu::tAVX512_VPOPCNTDQ, "avx512_vpopcntdq" },
|
|
{ Cpu::tAVX512_BF16, "avx512_bf16" },
|
|
{ Cpu::tAVX512_VP2INTERSECT, "avx512_vp2intersect" },
|
|
{ Cpu::tAMX_TILE, "amx(tile)" },
|
|
{ Cpu::tAMX_INT8, "amx(int8)" },
|
|
{ Cpu::tAMX_BF16, "amx(bf16)" },
|
|
{ Cpu::tAVX_VNNI, "avx_vnni" },
|
|
};
|
|
for (size_t i = 0; i < NUM_OF_ARRAY(tbl); i++) {
|
|
if (cpu.has(tbl[i].type)) printf(" %s", tbl[i].str);
|
|
}
|
|
printf("\n");
|
|
if (cpu.has(Cpu::tPOPCNT)) {
|
|
const int n = 0x12345678; // bitcount = 13
|
|
const int ok = 13;
|
|
PopCountTest code(n);
|
|
code.setProtectModeRE();
|
|
int (*f)() = code.getCode<int (*)()>();
|
|
int r = f();
|
|
if (r == ok) {
|
|
puts("popcnt ok");
|
|
} else {
|
|
printf("popcnt ng %d %d\n", r, ok);
|
|
}
|
|
code.setProtectModeRW();
|
|
}
|
|
/*
|
|
displayFamily displayModel
|
|
Opteron 2376 10 4
|
|
Core2 Duo T7100 6 F
|
|
Core i3-2120T 6 2A
|
|
Core i7-2600 6 2A
|
|
Xeon X5650 6 2C
|
|
Core i7-3517 6 3A
|
|
Core i7-3930K 6 2D
|
|
*/
|
|
cpu.putFamily();
|
|
if (!cpu.has(Cpu::tINTEL)) return;
|
|
for (unsigned int i = 0; i < cpu.getDataCacheLevels(); i++) {
|
|
printf("cache level=%u data cache size=%u cores sharing data cache=%u\n", i, cpu.getDataCacheSize(i), cpu.getCoresSharingDataCache(i));
|
|
}
|
|
printf("SmtLevel =%u\n", cpu.getNumCores(Xbyak::util::SmtLevel));
|
|
printf("CoreLevel=%u\n", cpu.getNumCores(Xbyak::util::CoreLevel));
|
|
}
|
|
|
|
int main()
|
|
{
|
|
#ifdef XBYAK32
|
|
puts("32bit");
|
|
#else
|
|
puts("64bit");
|
|
#endif
|
|
putCPUinfo();
|
|
}
|