Created
October 25, 2022 06:26
-
-
Save damageboy/77ec5ae48dd74c47ab9946ebd6b580d3 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
CPUID highest leaf : [20h] | |
Running as root : [YES] | |
MSR reads supported : [YES] | |
CPU pinning enabled : [YES] | |
CPU supports zeroupper: [YES] | |
CPU supports AVX2 : [YES] | |
CPU supports AVX-512F : [YES] | |
CPU supports AVX-512VL: [YES] | |
CPU supports AVX-512BW: [YES] | |
CPU supports AVX-512CD: [YES] | |
cpuid = eax = 2, ebx = 166, ecx = 38400000, edx = 0 | |
tsc_freq = 3187.2 MHz (from cpuid leaf 0x15) | |
CPU brand string: 12th Gen Intel(R) Core(TM) i9-12900K | |
16 available CPUs: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15] | |
8 physical cores: [0, 2, 4, 6, 8, 10, 12, 14] | |
Will test up to 8 CPUs | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
1 | pause_only | pause instruction | 1.000 | 3032 | 1.56 | 4980 | 1.00 | |
1 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2501 | 1.56 | 4980 | 1.00 | |
1 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2501 | 1.56 | 4980 | 1.00 | |
1 | scalar_iadd | Scalar integer adds | 1.000 | 5003 | 1.56 | 4980 | 1.00 | |
1 | avx128_iadd | 128-bit integer serial adds | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_iadd | 256-bit integer serial adds | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_iadd | 512-bit integer serial adds | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 5003 | 1.56 | 4980 | 1.00 | |
1 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 15006 | 1.56 | 4980 | 1.00 | |
1 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 14999 | 1.56 | 4980 | 1.00 | |
1 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 29438 | 1.56 | 4980 | 1.00 | |
1 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 29420 | 1.56 | 4980 | 1.00 | |
1 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 29762 | 1.56 | 4980 | 1.00 | |
1 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 5001 | 1.56 | 4980 | 1.00 | |
1 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 10005 | 1.56 | 4980 | 1.00 | |
1 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 10005 | 1.56 | 4980 | 1.00 | |
1 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 10004 | 1.56 | 4980 | 1.00 | |
1 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 10004 | 1.56 | 4980 | 1.00 | |
1 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000 | 1.56 | 4980 | 1.00 | |
1 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000 | 1.56 | 4980 | 1.00 | |
1 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000 | 1.56 | 4980 | 1.00 | |
1 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 5003 | 1.56 | 4980 | 1.00 | |
1 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 10006 | 1.56 | 4980 | 1.00 | |
1 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 10029 | 1.56 | 4980 | 1.00 | |
1 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 5001 | 1.56 | 4980 | 1.00 | |
1 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251 | 1.56 | 4980 | 1.00 | |
1 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 5002 | 1.56 | 4980 | 1.00 | |
1 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667 | 1.56 | 4980 | 1.00 | |
1 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 5001 | 1.56 | 4980 | 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
2 | pause_only | pause instruction | 1.000 | 2874, 2874 | 1.56, 1.56 | 4971, 4971 | 1.00, 1.00 | |
2 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2459, 2458 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2457, 2457 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | scalar_iadd | Scalar integer adds | 1.000 | 4614, 4615 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4457, 4464 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4460, 4458 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4874, 4878 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4460, 4457 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4459, 4461 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4898, 4898 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7501, 7487 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7510, 7496 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14819, 14795 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14828, 14806 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14846, 14865 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4614, 4611 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4615, 4607 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4611, 4611 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4618, 4609 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4613, 4613 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4611, 4608 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4899, 4898 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4900, 4899 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2263, 2257 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4843, 4817 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4821, 4830 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2259, 2263 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1250, 1251 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4824, 4831 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4824, 4833 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2256, 2272 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4614, 4608 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4609, 4615 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4610, 4609 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251, 1251 | 1.56, 1.56 | 4975, 4975 | 1.00, 1.00 | |
2 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251, 1251 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4845, 4843 | 1.56, 1.56 | 4980, 4981 | 1.00, 1.00 | |
2 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4837, 4837 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2244, 2258 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1250 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2489, 2488 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667 | 1.56, 1.56 | 4980, 4980 | 1.00, 1.00 | |
2 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2506, 2492 | 1.56, 1.56 | 4980, 4979 | 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
3 | pause_only | pause instruction | 1.000 | 2876, 2876, 3032 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2457, 2457, 2501 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2456, 2456, 2501 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | scalar_iadd | Scalar integer adds | 1.000 | 4615, 4614, 5003 | 1.55, 1.55, 1.56 | 4953, 4953, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4468, 4459, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4458, 4458, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4876, 4877, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4462, 4461, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4458, 4458, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4897, 4899, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7506, 7495, 15008 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7505, 7497, 15006 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14808, 14835, 29429 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14797, 14799, 29612 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14848, 14861, 29727 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4613, 4612, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4614, 4612, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4611, 4611, 5001 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4611, 4611, 5001 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4612, 4612, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4613, 4611, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4898, 4902, 5003 | 1.55, 1.55, 1.56 | 4950, 4950, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4898, 4899, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2253, 2276, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4825, 4817, 10005 | 1.56, 1.56, 1.56 | 4977, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4821, 4820, 10004 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2259, 2248, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251, 1250, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4828, 4822, 10008 | 1.56, 1.56, 1.56 | 4961, 4962, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4815, 4827, 10006 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2258, 2252, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4614, 4610, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4610, 4610, 5003 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4610, 4612, 5002 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251, 1251, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251, 1250, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4825, 4849, 10017 | 1.56, 1.56, 1.56 | 4968, 4968, 4980 | 1.00, 1.00, 1.00 | |
3 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4812, 4863, 10011 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2260, 2249, 5003 | 1.56, 1.56, 1.56 | 4980, 4981, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1251, 1251 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2490, 2486, 5005 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667 | 1.56, 1.56, 1.56 | 4980, 4980, 4980 | 1.00, 1.00, 1.00 | |
3 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2512, 2496, 5003 | 1.56, 1.56, 1.56 | 4979, 4981, 4980 | 1.00, 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
4 | pause_only | pause instruction | 1.000 | 2874, 2875, 2860, 2860 | 1.55, 1.55, 1.56, 1.56 | 4941, 4940, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2457, 2457, 2457, 2458 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2459, 2458, 2459, 2456 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | scalar_iadd | Scalar integer adds | 1.000 | 4611, 4617, 4616, 4615 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4466, 4457, 4461, 4463 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4460, 4457, 4463, 4464 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4875, 4877, 4878, 4878 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4458, 4460, 4457, 4458 | 1.55, 1.55, 1.55, 1.55 | 4953, 4953, 4947, 4947 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4458, 4465, 4456, 4460 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4897, 4897, 4898, 4895 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7492, 7500, 7482, 7509 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4979 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7502, 7495, 7476, 7513 | 1.56, 1.56, 1.55, 1.55 | 4980, 4980, 4948, 4948 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14795, 14808, 14819, 14797 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14808, 14797, 14810, 14793 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14857, 14854, 14868, 14848 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4610, 4609, 4607, 4614 | 1.55, 1.56, 1.56, 1.56 | 4954, 4956, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4608, 4607, 4611, 4613 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4614, 4613, 4612, 4615 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4611, 4612, 4616, 4612 | 1.55, 1.55, 1.56, 1.56 | 4942, 4941, 4979, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4608, 4612, 4613, 4610 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4611, 4612, 4612, 4612 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4898, 4898, 4898, 4900 | 1.56, 1.56, 1.56, 1.56 | 4962, 4961, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4898, 4898, 4898, 4897 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2265, 2264, 2265, 2259 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4809, 4827, 4815, 4842 | 1.56, 1.56, 1.56, 1.56 | 4980, 4978, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4833, 4834, 4827, 4829 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2250, 2255, 2250, 2252 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56 | 4971, 4971, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1250, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1250, 1250, 1250, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4825, 4829, 4857, 4844 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4975 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4826, 4830, 4834, 4816 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2247, 2265, 2259, 2259 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4609, 4610, 4612, 4613 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4979 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4610, 4615, 4611, 4612 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4609, 4612, 4609, 4613 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1250, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4839, 4827, 4829, 4831 | 1.56, 1.56, 1.56, 1.56 | 4980, 4981, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4859, 4848, 4717, 4819 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4979, 4981 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2245, 2254, 2244, 2254 | 1.56, 1.56, 1.56, 1.56 | 4979, 4980, 4981, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2492, 2489, 2489, 2488 | 1.56, 1.56, 1.56, 1.56 | 4977, 4979, 4980, 4979 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667, 1667 | 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00 | |
4 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2481, 2492, 2490, 2498 | 1.56, 1.56, 1.56, 1.56 | 4981, 4979, 4981, 4980 | 1.00, 1.00, 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
5 | pause_only | pause instruction | 1.000 | 2908, 2908, 2892, 2892, 3032 | 1.55, 1.55, 1.55, 1.55, 1.56 | 4939, 4939, 4941, 4941, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2457, 2458, 2457, 2457, 2502 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4970, 4970, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2454, 2455, 2456, 2456, 2501 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | scalar_iadd | Scalar integer adds | 1.000 | 4614, 4616, 4612, 4613, 5002 | 1.56, 1.56, 1.55, 1.55, 1.56 | 4980, 4980, 4943, 4942, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4460, 4463, 4459, 4460, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4461, 4460, 4458, 4464, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4865, 4869, 4866, 4864, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4456, 4460, 4458, 4464, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4464, 4459, 4463, 4462, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4899, 4900, 4898, 4897, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7511, 7476, 7508, 7479, 15006 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4978, 4980, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7484, 7519, 7496, 7504, 15006 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14824, 14815, 14813, 14797, 29429 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14817, 14828, 14815, 14815, 29438 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14870, 14850, 14859, 14861, 29744 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4615, 4607, 4610, 4611, 5001 | 1.55, 1.55, 1.56, 1.56, 1.56 | 4954, 4954, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4613, 4612, 4608, 4616, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4610, 4611, 4613, 4614, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4609, 4612, 4614, 4610, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4610, 4610, 4612, 4614, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4614, 4612, 4610, 4613, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4898, 4899, 4898, 4899, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4900, 4899, 4900, 4899, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2260, 2253, 2269, 2277, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4822, 4829, 4830, 4830, 10003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4980, 4980, 4979, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4823, 4825, 4827, 4835, 10003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2254, 2259, 2257, 2252, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1250, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4974, 4974, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1250, 1250, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4808, 4834, 4828, 4809, 10006 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4976, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4824, 4833, 4842, 4821, 10005 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2248, 2249, 2267, 2260, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4976, 4976, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4609, 4614, 4614, 4610, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4980, 4962, 4962, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4611, 4611, 4606, 4614, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4611, 4608, 4611, 4613, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1250 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1250, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4825, 4837, 4851, 4842, 10007 | 1.55, 1.55, 1.56, 1.56, 1.56 | 4942, 4942, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4830, 4848, 4750, 4881, 10022 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4979, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2258, 2252, 2260, 2252, 5000 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4981, 4980, 4980, 4979, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2488, 2490, 2490, 2489, 5004 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667, 1667, 1667 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
5 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2504, 2494, 2432, 2508, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4979, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
6 | pause_only | pause instruction | 1.000 | 2875, 2875, 2875, 2875, 2875, 2875 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4966, 4967, 4967, 4966, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2457, 2458, 2458, 2458, 2457, 2457 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2455, 2455, 2456, 2456, 2456, 2456 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | scalar_iadd | Scalar integer adds | 1.000 | 4614, 4615, 4616, 4610, 4613, 4613 | 1.56, 1.56, 1.55, 1.55, 1.56, 1.56 | 4980, 4980, 4950, 4950, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4466, 4458, 4463, 4463, 4466, 4459 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4968, 4968, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4459, 4462, 4458, 4464, 4463, 4459 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4873, 4874, 4872, 4875, 4873, 4873 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4460, 4460, 4458, 4469, 4455, 4464 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4978, 4980, 4979, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4460, 4462, 4457, 4462, 4456, 4460 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4897, 4897, 4898, 4898, 4898, 4899 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7491, 7505, 7505, 7501, 7501, 7496 | 1.55, 1.55, 1.55, 1.55, 1.56, 1.56 | 4948, 4948, 4942, 4942, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7509, 7484, 7494, 7501, 7497, 7488 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4963, 4962, 4958, 4958, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14832, 14804, 14795, 14824, 14815, 14795 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14795, 14824, 14815, 14808, 14826, 14826 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14846, 14870, 14868, 14850, 14872, 14850 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4612, 4607, 4614, 4611, 4611, 4613 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56 | 4954, 4954, 4979, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4613, 4609, 4611, 4611, 4611, 4611 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4611, 4608, 4610, 4615, 4611, 4611 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4612, 4609, 4610, 4609, 4616, 4612 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4979, 4980, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4612, 4611, 4613, 4614, 4611, 4613 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4612, 4611, 4615, 4610, 4614, 4611 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4900, 4898, 4899, 4900, 4898, 4896 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4967, 4967, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4898, 4897, 4899, 4899, 4896, 4899 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56 | 4940, 4940, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2267, 2258, 2252, 2259, 2274, 2272 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4830, 4833, 4824, 4817, 4824, 4803 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4960, 4959, 4977, 4980, 4978, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4835, 4804, 4807, 4834, 4833, 4824 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2252, 2257, 2259, 2243, 2262, 2255 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1250, 1250, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4799, 4837, 4817, 4810, 4838, 4812 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4977, 4977, 4980, 4966, 4967 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4826, 4837, 4869, 4846, 4817, 4832 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2251, 2260, 2259, 2255, 2258, 2244 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1001, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4972, 4972, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4611, 4612, 4606, 4614, 4609, 4615 | 1.56, 1.56, 1.55, 1.55, 1.56, 1.56 | 4980, 4979, 4943, 4943, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4608, 4613, 4609, 4613, 4614, 4608 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4614, 4611, 4610, 4610, 4610, 4607 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1250, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4976, 4976, 4970, 4970, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4843, 4826, 4851, 4856, 4827, 4820 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56 | 4943, 4943, 4980, 4980, 4980, 4977 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4834, 4838, 4844, 4832, 4831, 4823 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2228, 2257, 2261, 2259, 2250, 2249 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4981, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1250, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2486, 2487, 2490, 2494, 2488, 2489 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667, 1667, 1667, 1667 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
6 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2486, 2479, 2443, 2507, 2508, 2489 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4980, 4980, 4980, 4981, 4979 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
7 | pause_only | pause instruction | 1.000 | 2874, 2875, 2875, 2876, 2863, 2866, 3032 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56, 1.56 | 4938, 4938, 4980, 4980, 4978, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2459, 2456, 2457, 2457, 2457, 2459, 2500 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2456, 2459, 2458, 2458, 2457, 2457, 2501 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | scalar_iadd | Scalar integer adds | 1.000 | 4613, 4613, 4615, 4618, 4611, 4616, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4959, 4959, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4461, 4461, 4465, 4459, 4461, 4459, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4461, 4462, 4462, 4466, 4461, 4462, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4853, 4855, 4871, 4876, 4877, 4874, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4465, 4461, 4459, 4462, 4462, 4461, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4960 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4454, 4462, 4455, 4463, 4461, 4465, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4900, 4895, 4898, 4899, 4899, 4896, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7509, 7488, 7482, 7509, 7491, 7509, 15002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4962, 4963, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7504, 7490, 7500, 7505, 7511, 7498, 15006 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14808, 14813, 14793, 14815, 14826, 14799, 29438 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14799, 14806, 14804, 14819, 14797, 14806, 29595 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14852, 14872, 14861, 14854, 14859, 14854, 29771 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4610, 4608, 4613, 4608, 4611, 4609, 5002 | 1.56, 1.56, 1.55, 1.55, 1.56, 1.56, 1.56 | 4979, 4980, 4943, 4942, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4610, 4613, 4612, 4613, 4611, 4612, 5001 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4614, 4611, 4610, 4614, 4612, 4612, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4612, 4610, 4615, 4609, 4613, 4610, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4611, 4612, 4610, 4612, 4614, 4610, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4611, 4611, 4612, 4611, 4611, 4609, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4981, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4898, 4900, 4897, 4899, 4896, 4897, 5002 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56, 1.56 | 4945, 4945, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4898, 4897, 4898, 4899, 4900, 4899, 5002 | 1.55, 1.55, 1.56, 1.56, 1.56, 1.56, 1.56 | 4956, 4956, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2268, 2260, 2265, 2253, 2254, 2259, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4833, 4818, 4835, 4825, 4826, 4810, 10005 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4978, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4826, 4829, 4834, 4819, 4842, 4833, 10004 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2245, 2249, 2243, 2261, 2243, 2259, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1250, 1250, 1251, 1251, 1250, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4977 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1250, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251, 1250, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4817, 4828, 4830, 4823, 4849, 4805, 10006 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4961, 4959, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4829, 4835, 4836, 4824, 4823, 4813, 10005 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2256, 2245, 2244, 2262, 2246, 2252, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4974, 4974, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4610, 4611, 4611, 4614, 4610, 4610, 5002 | 1.56, 1.56, 1.55, 1.55, 1.55, 1.55, 1.56 | 4980, 4980, 4936, 4936, 4938, 4938, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4612, 4613, 4614, 4610, 4614, 4611, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4613, 4607, 4610, 4614, 4613, 4609, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251, 1250, 1251, 1251, 1251, 1250, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4969, 4969, 4976, 4976, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251, 1250 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1250, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4813, 4830, 4837, 4843, 4834, 4853, 10000 | 1.55, 1.55, 1.56, 1.56, 1.55, 1.55, 1.56 | 4944, 4937, 4981, 4980, 4936, 4937, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4827, 4851, 4841, 4842, 4873, 4882, 10008 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4979, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2258, 2250, 2239, 2244, 2243, 2248, 5002 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4981, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2488, 2488, 2492, 2481, 2488, 2491, 5004 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667, 1667, 1667, 1667, 1667 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
7 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2496, 2504, 2437, 2508, 2508, 2499, 5003 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4981, 4980, 4980, 4980, 4979, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
Cores | ID | Description | OVRLP3 | Mops | A/M-ratio | A/M-MHz | M/tsc-ratio | |
8 | pause_only | pause instruction | 1.000 | 2875, 2876, 2876, 2876, 2859, 2859, 2875, 2875 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.55, 1.55 | 4980, 4980, 4980, 4980, 4971, 4971, 4942, 4943 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | ucomis_clean | scalar ucomis (w/ vzeroupper) | 1.000 | 2457, 2458, 2458, 2457, 2457, 2458, 2456, 2457 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4959, 4958, 4963, 4963, 4959, 4959, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | ucomis_dirty | scalar ucomis (no vzeroupper) | 1.000 | 2457, 2456, 2454, 2455, 2455, 2455, 2456, 2456 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | scalar_iadd | Scalar integer adds | 1.000 | 4613, 4616, 4613, 4613, 4615, 4614, 4611, 4620 | 1.55, 1.55, 1.55, 1.55, 1.56, 1.56, 1.56, 1.56 | 4954, 4954, 4955, 4955, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_iadd | 128-bit integer serial adds | 1.000 | 4458, 4462, 4461, 4463, 4460, 4462, 4460, 4459 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_iadd | 256-bit integer serial adds | 1.000 | 4462, 4463, 4457, 4466, 4462, 4458, 4459, 4459 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_iadd | 512-bit integer serial adds | 1.000 | 4873, 4873, 4884, 4888, 4875, 4882, 4846, 4854 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_iadd16 | 128-bit integer serial adds zmm16 | 1.000 | 4463, 4456, 4462, 4460, 4459, 4460, 4456, 4461 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4960, 4960, 4968, 4968, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_iadd16 | 256-bit integer serial adds zmm16 | 1.000 | 4460, 4459, 4463, 4464, 4460, 4465, 4452, 4462 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_iadd16 | 512-bit integer serial adds zmm16 | 1.000 | 4897, 4896, 4896, 4896, 4898, 4898, 4897, 4898 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_iadd_t | 128-bit integer parallel adds | 1.000 | 7506, 7493, 7500, 7486, 7513, 7484, 7511, 7477 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4978, 4980, 4979, 4980, 4979, 4980, 4978, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_iadd_t | 256-bit integer parallel adds | 1.000 | 7475, 7515, 7515, 7485, 7488, 7509, 7513, 7492 | 1.56, 1.56, 1.56, 1.56, 1.55, 1.55, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4954, 4956, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_xor_zero | 128-bit zeroing xor | 1.000 | 14826, 14795, 14826, 14804, 14810, 14802, 14806, 14839 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_xor_zero | 256-bit zeroing xor | 1.000 | 14821, 14799, 14806, 14824, 14795, 14808, 14797, 14819 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_xor_zero | 512-bit zeroing xord | 1.000 | 14865, 14852, 14846, 14872, 14857, 14857, 14872, 14872 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_mov_sparse | 128-bit reg-reg mov | 1.000 | 4612, 4612, 4611, 4611, 4610, 4610, 4611, 4609 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4979, 4980, 4980, 4979, 4980, 4980, 4980, 4979 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_mov_sparse | 256-bit reg-reg mov | 1.000 | 4611, 4612, 4607, 4614, 4614, 4611, 4611, 4612 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4961, 4960, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_mov_sparse | 512-bit reg-reg mov | 1.000 | 4616, 4609, 4616, 4609, 4609, 4609, 4613, 4609 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_merge_sparse | 128-bit reg-reg merge mov | 1.000 | 4610, 4615, 4611, 4611, 4611, 4611, 4614, 4612 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4957, 4957 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_merge_sparse | 256-bit reg-reg merge mov | 1.000 | 4611, 4612, 4614, 4609, 4612, 4612, 4611, 4614 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_merge_sparse | 512-bit reg-reg merge mov | 1.000 | 4612, 4611, 4611, 4612, 4613, 4611, 4615, 4611 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_vshift | 128-bit variable shift (vpsrlvd) | 1.000 | 4900, 4898, 4899, 4899, 4899, 4900, 4898, 4900 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4968, 4968, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_vshift | 256-bit variable shift (vpsrlvd) | 1.000 | 4898, 4898, 4897, 4898, 4900, 4896, 4901, 4899 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vshift | 512-bit variable shift (vpsrlvd) | 1.000 | 2251, 2267, 2262, 2262, 2263, 2258, 2256, 2275 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_vshift_t | 128-bit variable shift (vpsrlvd) | 1.000 | 4826, 4814, 4837, 4819, 4823, 4838, 4829, 4822 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4978, 4980, 4980, 4979, 4980, 4980, 4978, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_vshift_t | 256-bit variable shift (vpsrlvd) | 1.000 | 4823, 4832, 4826, 4836, 4817, 4831, 4846, 4804 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4962, 4962, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vshift_t | 512-bit variable shift (vpsrlvd) | 1.000 | 2254, 2261, 2256, 2246, 2248, 2250, 2256, 2251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_vlzcnt | 128-bit lzcnt (vplzcntd) | 1.000 | 1250, 1250, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4968, 4968, 4980, 4980, 4974, 4974, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_vlzcnt | 256-bit lzcnt (vplzcntd) | 1.000 | 1250, 1251, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vlzcnt | 512-bit lzcnt (vplzcntd) | 1.000 | 1251, 1251, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_vlzcnt_t | 128-bit lzcnt (vplzcntd) | 1.000 | 4829, 4848, 4830, 4836, 4840, 4832, 4832, 4820 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4979, 4980, 4980, 4980, 4974, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_vlzcnt_t | 256-bit lzcnt (vplzcntd) | 1.000 | 4831, 4815, 4837, 4850, 4819, 4833, 4827, 4807 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vlzcnt_t | 512-bit lzcnt (vplzcntd) | 1.000 | 2265, 2264, 2253, 2257, 2269, 2268, 2246, 2251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_imul | 128-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4975, 4975, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_imul | 256-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_imul | 512-bit integer muls (vpmuldq) | 1.000 | 1000, 1000, 1000, 1000, 1000, 1000, 1000, 1000 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_fma_sparse | 128-bit 64-bit sparse FMAs | 1.000 | 4614, 4610, 4608, 4610, 4612, 4613, 4608, 4616 | 1.56, 1.56, 1.56, 1.56, 1.55, 1.55, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4942, 4943, 4980, 4979 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_fma_sparse | 256-bit 64-bit sparse FMAs | 1.000 | 4612, 4608, 4609, 4611, 4610, 4610, 4613, 4612 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_fma_sparse | 512-bit 64-bit sparse FMAs | 1.000 | 4610, 4613, 4609, 4614, 4609, 4614, 4611, 4613 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_fma | 128-bit serial DP FMAs | 1.000 | 1251, 1250, 1251, 1251, 1251, 1250, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4974, 4974, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_fma | 256-bit serial DP FMAs | 1.000 | 1251, 1250, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_fma | 512-bit serial DP FMAs | 1.000 | 1251, 1251, 1251, 1251, 1251, 1250, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx128_fma_t | 128-bit parallel DP FMAs | 1.000 | 4842, 4859, 4830, 4830, 4852, 4845, 4846, 4840 | 1.56, 1.56, 1.55, 1.55, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4935, 4947, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx256_fma_t | 256-bit parallel DP FMAs | 1.000 | 4848, 4837, 4850, 4824, 4836, 4851, 4848, 4854 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4979, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_fma_t | 512-bit parallel DP FMAs | 1.000 | 2254, 2256, 2232, 2242, 2249, 2255, 2253, 2260 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4979, 4981, 4980, 4979, 4981, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vpermw | 512-bit serial WORD permute | 1.000 | 1250, 1251, 1251, 1251, 1251, 1251, 1251, 1251 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vpermw_t | 512-bit parallel WORD permute | 1.000 | 2487, 2494, 2494, 2492, 2493, 2489, 2485, 2489 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4979, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vpermd | 512-bit serial DWORD permute | 1.000 | 1667, 1667, 1667, 1667, 1667, 1667, 1667, 1667 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4980, 4980, 4980, 4980, 4980 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 | |
8 | avx512_vpermd_t | 512-bit parallel DWORD permute | 1.000 | 2483, 2505, 2513, 2504, 2452, 2495, 2507, 2500 | 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56, 1.56 | 4980, 4980, 4980, 4979, 4979, 4980, 4980, 4981 | 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00, 1.00 |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment