Created
December 11, 2016 09:32
-
-
Save nkurz/6e797e8b635931d2a0e4f32af6a12d1a to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
gcc-4.8 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=48 sd=0.02% | |
64 min=176 mean=176 sd=0.08% | |
256 min=896 mean=896 sd=0.04% | |
1024 min=4790 mean=4794 sd=0.07% | |
4096 min=32083 mean=32162 sd=0.13% | |
16384 min=194866 mean=194966 sd=0.03% | |
65536 min=1058338 mean=1059307 sd=0.05% | |
262144 min=4922740 mean=4929473 sd=0.12% | |
1048576 min=38757666 mean=38915279 sd=0.18% | |
gcc-4.8 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.04% | |
64 min=175 mean=176 sd=0.21% | |
256 min=883 mean=884 sd=0.07% | |
1024 min=4747 mean=4751 sd=0.06% | |
4096 min=32106 mean=32223 sd=0.71% | |
16384 min=192640 mean=192851 sd=0.07% | |
65536 min=1054922 mean=1056044 sd=0.07% | |
262144 min=4885094 mean=4892426 sd=0.12% | |
1048576 min=37589429 mean=37681476 sd=0.18% | |
gcc-4.8 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.11% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4771 mean=4783 sd=0.19% | |
4096 min=32064 mean=32132 sd=0.14% | |
16384 min=194179 mean=194275 sd=0.03% | |
65536 min=1053685 mean=1054441 sd=0.03% | |
262144 min=4998435 mean=5008326 sd=0.11% | |
1048576 min=38468560 mean=38567220 sd=0.21% | |
gcc-4.8 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.09% | |
256 min=863 mean=864 sd=0.07% | |
1024 min=4665 mean=4673 sd=0.12% | |
4096 min=32224 mean=32259 sd=0.06% | |
16384 min=198684 mean=198736 sd=0.02% | |
65536 min=1041438 mean=1041821 sd=0.02% | |
262144 min=4810739 mean=4823106 sd=0.12% | |
1048576 min=38912965 mean=39084602 sd=0.25% | |
gcc-4.8 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.12% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4666 mean=4670 sd=0.06% | |
4096 min=31981 mean=32015 sd=0.10% | |
16384 min=192241 mean=192360 sd=0.04% | |
65536 min=1052094 mean=1052420 sd=0.02% | |
262144 min=4879758 mean=4888145 sd=0.12% | |
1048576 min=39325396 mean=39558492 sd=0.29% | |
gcc-4.8 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.13% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=175 sd=0.18% | |
256 min=873 mean=875 sd=0.12% | |
1024 min=4716 mean=4720 sd=0.04% | |
4096 min=32030 mean=32091 sd=0.15% | |
16384 min=192265 mean=192376 sd=0.04% | |
65536 min=1040228 mean=1040667 sd=0.03% | |
262144 min=4848977 mean=4859544 sd=0.20% | |
1048576 min=39220137 mean=39414494 sd=0.35% | |
gcc-4.8 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.08% | |
256 min=902 mean=908 sd=0.41% | |
1024 min=4677 mean=4680 sd=0.05% | |
4096 min=34984 mean=35219 sd=0.42% | |
16384 min=196031 mean=196170 sd=0.03% | |
65536 min=1033650 mean=1033881 sd=0.02% | |
262144 min=4928774 mean=4938207 sd=0.09% | |
1048576 min=37992977 mean=38117990 sd=0.14% | |
gcc-4.8 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.00% | |
16 min=47 mean=47 sd=0.12% | |
64 min=175 mean=176 sd=0.11% | |
256 min=879 mean=880 sd=0.11% | |
1024 min=4685 mean=4698 sd=0.17% | |
4096 min=32215 mean=32255 sd=0.07% | |
16384 min=193378 mean=193534 sd=0.05% | |
65536 min=1059356 mean=1059948 sd=0.03% | |
262144 min=4901205 mean=4907895 sd=0.12% | |
1048576 min=35922567 mean=35991696 sd=0.18% | |
gcc-4.8 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.16% | |
256 min=873 mean=875 sd=0.11% | |
1024 min=4684 mean=4690 sd=0.06% | |
4096 min=45945 mean=45986 sd=0.08% | |
16384 min=198910 mean=199113 sd=0.07% | |
65536 min=1046070 mean=1046454 sd=0.03% | |
262144 min=4812898 mean=4818908 sd=0.09% | |
1048576 min=38662613 mean=38802101 sd=0.20% | |
gcc-4.8 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.13% | |
64 min=175 mean=176 sd=0.19% | |
256 min=874 mean=876 sd=0.07% | |
1024 min=4735 mean=4739 sd=0.07% | |
4096 min=32021 mean=32065 sd=0.10% | |
16384 min=193762 mean=193928 sd=0.03% | |
65536 min=1048962 mean=1049723 sd=0.06% | |
262144 min=4727678 mean=4734806 sd=0.09% | |
1048576 min=39469380 mean=39706822 sd=0.27% | |
------------------------ | |
gcc-4.9 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=48 sd=0.02% | |
64 min=175 mean=176 sd=0.13% | |
256 min=895 mean=897 sd=0.06% | |
1024 min=4770 mean=4780 sd=0.11% | |
4096 min=34446 mean=34671 sd=0.43% | |
16384 min=196612 mean=196741 sd=0.05% | |
65536 min=1045810 mean=1046179 sd=0.02% | |
262144 min=4823771 mean=4837792 sd=0.13% | |
1048576 min=37271396 mean=37349234 sd=0.17% | |
gcc-4.9 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=48 mean=48 sd=0.02% | |
64 min=176 mean=176 sd=0.11% | |
256 min=873 mean=875 sd=0.19% | |
1024 min=4729 mean=4734 sd=0.05% | |
4096 min=32201 mean=32249 sd=0.11% | |
16384 min=195673 mean=195736 sd=0.02% | |
65536 min=1064126 mean=1065207 sd=0.05% | |
262144 min=4914402 mean=4921511 sd=0.13% | |
1048576 min=35906443 mean=36008913 sd=0.22% | |
gcc-4.9 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.08% | |
256 min=864 mean=869 sd=0.72% | |
1024 min=4661 mean=4669 sd=0.09% | |
4096 min=32030 mean=32137 sd=0.16% | |
16384 min=193967 mean=194041 sd=0.04% | |
65536 min=1052680 mean=1053055 sd=0.03% | |
262144 min=4962321 mean=4981647 sd=0.20% | |
1048576 min=38942176 mean=39070362 sd=0.23% | |
gcc-4.9 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.30% | |
256 min=959 mean=960 sd=0.05% | |
1024 min=4686 mean=4690 sd=0.09% | |
4096 min=32423 mean=32510 sd=0.12% | |
16384 min=192984 mean=193131 sd=0.05% | |
65536 min=1068713 mean=1069383 sd=0.03% | |
262144 min=4902529 mean=4911127 sd=0.11% | |
1048576 min=34290544 mean=34450862 sd=0.24% | |
gcc-4.9 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.36% | |
16 min=47 mean=47 sd=0.03% | |
64 min=171 mean=172 sd=0.06% | |
256 min=864 mean=865 sd=0.12% | |
1024 min=4770 mean=4782 sd=0.13% | |
4096 min=31989 mean=32026 sd=0.07% | |
16384 min=194620 mean=194703 sd=0.03% | |
65536 min=1044870 mean=1045159 sd=0.02% | |
262144 min=4943415 mean=4952558 sd=0.12% | |
1048576 min=39516715 mean=39672901 sd=0.31% | |
gcc-4.9 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=174 mean=175 sd=0.28% | |
256 min=875 mean=877 sd=0.38% | |
1024 min=4750 mean=4759 sd=0.14% | |
4096 min=32488 mean=32538 sd=0.11% | |
16384 min=193758 mean=193917 sd=0.04% | |
65536 min=1043740 mean=1044089 sd=0.02% | |
262144 min=4916994 mean=4928359 sd=0.14% | |
1048576 min=36845482 mean=36930448 sd=0.22% | |
gcc-4.9 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=176 mean=176 sd=0.13% | |
256 min=890 mean=890 sd=0.04% | |
1024 min=4693 mean=4706 sd=0.11% | |
4096 min=32228 mean=32281 sd=0.13% | |
16384 min=197705 mean=197811 sd=0.05% | |
65536 min=1047724 mean=1048269 sd=0.03% | |
262144 min=4910197 mean=4917191 sd=0.12% | |
1048576 min=35418295 mean=35685565 sd=0.27% | |
gcc-4.9 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.34% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4677 mean=4685 sd=0.15% | |
4096 min=32604 mean=32680 sd=0.17% | |
16384 min=200173 mean=200377 sd=0.07% | |
65536 min=1049404 mean=1049997 sd=0.04% | |
262144 min=4903346 mean=4916740 sd=0.16% | |
1048576 min=34144087 mean=34251989 sd=0.22% | |
gcc-4.9 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.42% | |
256 min=884 mean=886 sd=0.17% | |
1024 min=4770 mean=4778 sd=0.07% | |
4096 min=32104 mean=32183 sd=0.21% | |
16384 min=196297 mean=196424 sd=0.05% | |
65536 min=1057860 mean=1059021 sd=0.06% | |
262144 min=4920777 mean=4926921 sd=0.09% | |
1048576 min=39172052 mean=39476681 sd=0.42% | |
gcc-4.9 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.42% | |
256 min=875 mean=876 sd=0.06% | |
1024 min=4726 mean=4733 sd=0.07% | |
4096 min=32394 mean=32498 sd=0.18% | |
16384 min=198075 mean=198218 sd=0.07% | |
65536 min=1051465 mean=1052079 sd=0.02% | |
262144 min=4805842 mean=4817821 sd=0.14% | |
1048576 min=34730104 mean=34851278 sd=0.24% | |
------------------------ | |
gcc-5 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=48 mean=48 sd=0.03% | |
64 min=176 mean=176 sd=0.12% | |
256 min=875 mean=876 sd=0.07% | |
1024 min=4738 mean=4742 sd=0.05% | |
4096 min=32162 mean=32236 sd=0.18% | |
16384 min=199138 mean=199279 sd=0.04% | |
65536 min=1043348 mean=1043779 sd=0.03% | |
262144 min=4895893 mean=4905251 sd=0.10% | |
1048576 min=37157191 mean=37280805 sd=0.26% | |
gcc-5 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=48 sd=0.02% | |
64 min=176 mean=176 sd=0.12% | |
256 min=882 mean=883 sd=0.07% | |
1024 min=4711 mean=4714 sd=0.06% | |
4096 min=32020 mean=32095 sd=0.16% | |
16384 min=192817 mean=192893 sd=0.03% | |
65536 min=1041303 mean=1041852 sd=0.04% | |
262144 min=4828981 mean=4834945 sd=0.10% | |
1048576 min=35624842 mean=35847361 sd=0.40% | |
gcc-5 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.06% | |
256 min=865 mean=865 sd=0.03% | |
1024 min=4708 mean=4712 sd=0.05% | |
4096 min=32744 mean=32794 sd=0.09% | |
16384 min=193724 mean=193809 sd=0.03% | |
65536 min=1050222 mean=1050808 sd=0.03% | |
262144 min=4895098 mean=4904418 sd=0.12% | |
1048576 min=38762514 mean=38911682 sd=0.32% | |
gcc-5 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.00% | |
64 min=176 mean=176 sd=0.10% | |
256 min=876 mean=880 sd=0.66% | |
1024 min=4739 mean=4754 sd=0.12% | |
4096 min=32180 mean=32206 sd=0.09% | |
16384 min=195960 mean=196171 sd=0.06% | |
65536 min=1038492 mean=1039007 sd=0.04% | |
262144 min=4813623 mean=4827724 sd=0.13% | |
1048576 min=37059288 mean=37209768 sd=0.33% | |
gcc-5 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.13% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.27% | |
256 min=896 mean=900 sd=0.19% | |
1024 min=4755 mean=4762 sd=0.10% | |
4096 min=32278 mean=32330 sd=0.10% | |
16384 min=196404 mean=196548 sd=0.05% | |
65536 min=1050353 mean=1050800 sd=0.03% | |
262144 min=4902667 mean=4910330 sd=0.11% | |
1048576 min=37543673 mean=37655905 sd=0.24% | |
gcc-5 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.10% | |
256 min=863 mean=865 sd=0.10% | |
1024 min=4630 mean=4637 sd=0.11% | |
4096 min=32195 mean=32281 sd=0.38% | |
16384 min=192850 mean=192993 sd=0.03% | |
65536 min=1054787 mean=1055286 sd=0.03% | |
262144 min=4837477 mean=4852825 sd=0.21% | |
1048576 min=37430839 mean=37610524 sd=0.24% | |
gcc-5 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.13% | |
64 min=175 mean=176 sd=0.15% | |
256 min=873 mean=876 sd=0.18% | |
1024 min=4748 mean=4760 sd=0.13% | |
4096 min=32143 mean=32175 sd=0.06% | |
16384 min=191792 mean=192184 sd=0.37% | |
65536 min=1034334 mean=1035234 sd=0.08% | |
262144 min=4918035 mean=4926013 sd=0.09% | |
1048576 min=33388946 mean=33543536 sd=0.33% | |
gcc-5 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=176 mean=176 sd=0.12% | |
256 min=882 mean=884 sd=0.10% | |
1024 min=4716 mean=4719 sd=0.05% | |
4096 min=32071 mean=32179 sd=0.16% | |
16384 min=196058 mean=196225 sd=0.05% | |
65536 min=1048948 mean=1049276 sd=0.02% | |
262144 min=4910085 mean=4920057 sd=0.14% | |
1048576 min=38377229 mean=38493085 sd=0.15% | |
gcc-5 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.00% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.11% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4655 mean=4662 sd=0.09% | |
4096 min=31997 mean=32040 sd=0.09% | |
16384 min=202369 mean=202627 sd=0.06% | |
65536 min=1043509 mean=1045249 sd=0.35% | |
262144 min=4821160 mean=4835019 sd=0.12% | |
1048576 min=39522736 mean=39738556 sd=0.28% | |
gcc-5 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=52 mean=52 sd=0.05% | |
64 min=175 mean=176 sd=0.19% | |
256 min=873 mean=876 sd=0.11% | |
1024 min=4799 mean=4803 sd=0.06% | |
4096 min=32970 mean=33030 sd=0.11% | |
16384 min=194918 mean=195123 sd=0.07% | |
65536 min=1044277 mean=1045938 sd=0.37% | |
262144 min=4784487 mean=4799786 sd=0.16% | |
1048576 min=34751941 mean=34913229 sd=0.23% | |
------------------------ | |
gcc-5 -flto -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.09% | |
256 min=866 mean=867 sd=0.14% | |
1024 min=4669 mean=4682 sd=0.20% | |
4096 min=32104 mean=32149 sd=0.11% | |
16384 min=195137 mean=195219 sd=0.03% | |
65536 min=1048797 mean=1050752 sd=0.37% | |
262144 min=4909217 mean=4919075 sd=0.10% | |
1048576 min=37752300 mean=38012626 sd=0.30% | |
gcc-5 -flto -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.18% | |
256 min=864 mean=866 sd=0.16% | |
1024 min=4684 mean=4693 sd=0.12% | |
4096 min=32007 mean=32134 sd=0.22% | |
16384 min=193653 mean=193725 sd=0.03% | |
65536 min=1036900 mean=1038613 sd=0.34% | |
262144 min=4982987 mean=4993351 sd=0.13% | |
1048576 min=36885592 mean=37047455 sd=0.30% | |
gcc-5 -flto -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.00% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.23% | |
256 min=874 mean=875 sd=0.10% | |
1024 min=4705 mean=4708 sd=0.04% | |
4096 min=32176 mean=32232 sd=0.11% | |
16384 min=192186 mean=192294 sd=0.03% | |
65536 min=1054258 mean=1056042 sd=0.40% | |
262144 min=4827871 mean=4838273 sd=0.15% | |
1048576 min=34117207 mean=34234653 sd=0.20% | |
gcc-5 -flto -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.07% | |
256 min=864 mean=865 sd=0.04% | |
1024 min=4658 mean=4667 sd=0.13% | |
4096 min=33524 mean=33553 sd=0.08% | |
16384 min=194962 mean=195121 sd=0.06% | |
65536 min=1061271 mean=1061770 sd=0.04% | |
262144 min=4778762 mean=4799832 sd=0.45% | |
1048576 min=34481890 mean=34603479 sd=0.28% | |
gcc-5 -flto -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.12% | |
256 min=864 mean=865 sd=0.07% | |
1024 min=4655 mean=4664 sd=0.13% | |
4096 min=32109 mean=32170 sd=0.08% | |
16384 min=196094 mean=196288 sd=0.05% | |
65536 min=1054529 mean=1055485 sd=0.06% | |
262144 min=4915166 mean=4920772 sd=0.07% | |
1048576 min=34592613 mean=34723468 sd=0.20% | |
gcc-5 -flto -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.24% | |
256 min=875 mean=876 sd=0.06% | |
1024 min=4687 mean=4694 sd=0.07% | |
4096 min=32019 mean=32084 sd=0.16% | |
16384 min=196110 mean=196347 sd=0.05% | |
65536 min=1036130 mean=1036746 sd=0.04% | |
262144 min=4824574 mean=4834370 sd=0.14% | |
1048576 min=35336157 mean=35487643 sd=0.40% | |
gcc-5 -flto -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.00% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.18% | |
256 min=874 mean=876 sd=0.10% | |
1024 min=5274 mean=5285 sd=0.13% | |
4096 min=33605 mean=33677 sd=0.14% | |
16384 min=192546 mean=192778 sd=0.13% | |
65536 min=1041712 mean=1042004 sd=0.02% | |
262144 min=4897756 mean=4910172 sd=0.15% | |
1048576 min=35642955 mean=35804579 sd=0.32% | |
gcc-5 -flto -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.07% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4676 mean=4683 sd=0.08% | |
4096 min=32188 mean=32216 sd=0.07% | |
16384 min=193878 mean=194017 sd=0.06% | |
65536 min=1060084 mean=1061105 sd=0.06% | |
262144 min=4916624 mean=4923962 sd=0.08% | |
1048576 min=34155721 mean=34253301 sd=0.25% | |
gcc-5 -flto -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.15% | |
256 min=873 mean=875 sd=0.12% | |
1024 min=4754 mean=4758 sd=0.08% | |
4096 min=32227 mean=32295 sd=0.13% | |
16384 min=192123 mean=192340 sd=0.07% | |
65536 min=1049262 mean=1050040 sd=0.11% | |
262144 min=4819654 mean=4830520 sd=0.19% | |
1048576 min=36157369 mean=36322239 sd=0.38% | |
gcc-5 -flto -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.04% | |
64 min=171 mean=172 sd=0.07% | |
256 min=864 mean=865 sd=0.09% | |
1024 min=4676 mean=4682 sd=0.13% | |
4096 min=32207 mean=32241 sd=0.07% | |
16384 min=195777 mean=196024 sd=0.06% | |
65536 min=1067209 mean=1068259 sd=0.13% | |
262144 min=4793623 mean=4807412 sd=0.12% | |
1048576 min=34832407 mean=34947159 sd=0.17% | |
------------------------ | |
gcc-6 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=48 sd=0.05% | |
64 min=176 mean=176 sd=0.08% | |
256 min=875 mean=876 sd=0.06% | |
1024 min=4729 mean=4733 sd=0.05% | |
4096 min=32230 mean=32266 sd=0.11% | |
16384 min=196710 mean=196949 sd=0.07% | |
65536 min=1053526 mean=1053975 sd=0.03% | |
262144 min=4900647 mean=4911060 sd=0.14% | |
1048576 min=34407601 mean=34499279 sd=0.20% | |
gcc-6 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.09% | |
256 min=864 mean=866 sd=0.16% | |
1024 min=4656 mean=4672 sd=0.17% | |
4096 min=32130 mean=32173 sd=0.09% | |
16384 min=192784 mean=192866 sd=0.03% | |
65536 min=1049139 mean=1049566 sd=0.03% | |
262144 min=4896432 mean=4911819 sd=0.14% | |
1048576 min=38369997 mean=38541929 sd=0.35% | |
gcc-6 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.10% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4701 mean=4704 sd=0.05% | |
4096 min=32371 mean=32476 sd=0.13% | |
16384 min=199098 mean=199288 sd=0.07% | |
65536 min=1060126 mean=1060527 sd=0.03% | |
262144 min=4797743 mean=4807762 sd=0.15% | |
1048576 min=34930900 mean=35028688 sd=0.18% | |
gcc-6 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.00% | |
64 min=171 mean=172 sd=0.52% | |
256 min=882 mean=889 sd=0.51% | |
1024 min=4689 mean=4696 sd=0.08% | |
4096 min=32219 mean=32243 sd=0.04% | |
16384 min=193769 mean=193988 sd=0.06% | |
65536 min=1043065 mean=1043535 sd=0.02% | |
262144 min=4893521 mean=4901724 sd=0.12% | |
1048576 min=35740670 mean=35810840 sd=0.14% | |
gcc-6 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=174 mean=175 sd=0.33% | |
256 min=881 mean=898 sd=0.75% | |
1024 min=4757 mean=4762 sd=0.05% | |
4096 min=32122 mean=32178 sd=0.10% | |
16384 min=195805 mean=195906 sd=0.04% | |
65536 min=1041365 mean=1041545 sd=0.01% | |
262144 min=4794807 mean=4804543 sd=0.12% | |
1048576 min=38744389 mean=38962086 sd=0.35% | |
gcc-6 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.07% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4706 mean=4717 sd=0.13% | |
4096 min=32238 mean=32281 sd=0.08% | |
16384 min=195849 mean=195979 sd=0.05% | |
65536 min=1053162 mean=1053839 sd=0.04% | |
262144 min=4798310 mean=4811955 sd=0.11% | |
1048576 min=34947857 mean=35025157 sd=0.22% | |
gcc-6 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.39% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.09% | |
256 min=863 mean=864 sd=0.14% | |
1024 min=4755 mean=4759 sd=0.06% | |
4096 min=32377 mean=32416 sd=0.09% | |
16384 min=193882 mean=194013 sd=0.03% | |
65536 min=1052496 mean=1053005 sd=0.04% | |
262144 min=4926307 mean=4937327 sd=0.15% | |
1048576 min=35376837 mean=35541974 sd=0.37% | |
gcc-6 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.36% | |
64 min=171 mean=171 sd=0.07% | |
256 min=864 mean=865 sd=0.07% | |
1024 min=4672 mean=4680 sd=0.14% | |
4096 min=32211 mean=32313 sd=0.16% | |
16384 min=192281 mean=192444 sd=0.04% | |
65536 min=1050983 mean=1051820 sd=0.06% | |
262144 min=4889165 mean=4900273 sd=0.14% | |
1048576 min=38198458 mean=38332192 sd=0.25% | |
gcc-6 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.09% | |
256 min=863 mean=864 sd=0.07% | |
1024 min=4643 mean=4653 sd=0.14% | |
4096 min=32125 mean=32211 sd=0.18% | |
16384 min=197840 mean=198019 sd=0.06% | |
65536 min=1056341 mean=1057001 sd=0.06% | |
262144 min=4819247 mean=4828567 sd=0.12% | |
1048576 min=35904719 mean=35981753 sd=0.11% | |
gcc-6 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.09% | |
256 min=863 mean=864 sd=0.08% | |
1024 min=4691 mean=4697 sd=0.07% | |
4096 min=31975 mean=32036 sd=0.15% | |
16384 min=196192 mean=196271 sd=0.03% | |
65536 min=1035653 mean=1036302 sd=0.07% | |
262144 min=4801736 mean=4808866 sd=0.07% | |
1048576 min=34885387 mean=35029149 sd=0.26% | |
------------------------ | |
gcc-6 -flto -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=172 mean=172 sd=0.07% | |
256 min=865 mean=868 sd=0.21% | |
1024 min=4675 mean=4691 sd=0.26% | |
4096 min=32532 mean=32611 sd=0.15% | |
16384 min=193346 mean=193458 sd=0.03% | |
65536 min=1051180 mean=1051642 sd=0.04% | |
262144 min=4871459 mean=4878724 sd=0.10% | |
1048576 min=33990927 mean=34102144 sd=0.27% | |
gcc-6 -flto -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=48 mean=48 sd=0.02% | |
64 min=176 mean=176 sd=0.07% | |
256 min=874 mean=876 sd=0.14% | |
1024 min=4779 mean=4792 sd=0.12% | |
4096 min=32305 mean=32339 sd=0.09% | |
16384 min=198397 mean=198503 sd=0.04% | |
65536 min=1047898 mean=1048407 sd=0.04% | |
262144 min=4809628 mean=4819152 sd=0.10% | |
1048576 min=39430475 mean=39559243 sd=0.20% | |
gcc-6 -flto -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=176 mean=176 sd=0.14% | |
256 min=874 mean=876 sd=0.10% | |
1024 min=4698 mean=4706 sd=0.09% | |
4096 min=32182 mean=32221 sd=0.10% | |
16384 min=190320 mean=190372 sd=0.03% | |
65536 min=1037374 mean=1037798 sd=0.02% | |
262144 min=4909578 mean=4916495 sd=0.12% | |
1048576 min=34531603 mean=34638136 sd=0.16% | |
gcc-6 -flto -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.11% | |
256 min=874 mean=876 sd=0.10% | |
1024 min=4698 mean=4702 sd=0.06% | |
4096 min=31926 mean=31982 sd=0.11% | |
16384 min=192175 mean=192278 sd=0.03% | |
65536 min=1047601 mean=1048006 sd=0.02% | |
262144 min=4766002 mean=4776115 sd=0.15% | |
1048576 min=39558267 mean=39720935 sd=0.25% | |
gcc-6 -flto -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.19% | |
256 min=873 mean=876 sd=0.33% | |
1024 min=4697 mean=4703 sd=0.07% | |
4096 min=32207 mean=32278 sd=0.16% | |
16384 min=193652 mean=193825 sd=0.15% | |
65536 min=1044607 mean=1045045 sd=0.03% | |
262144 min=4775850 mean=4786947 sd=0.11% | |
1048576 min=38202159 mean=38335822 sd=0.22% | |
gcc-6 -flto -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.17% | |
256 min=874 mean=876 sd=0.09% | |
1024 min=4700 mean=4709 sd=0.14% | |
4096 min=31971 mean=32029 sd=0.10% | |
16384 min=193732 mean=193840 sd=0.03% | |
65536 min=1056856 mean=1057522 sd=0.03% | |
262144 min=4896396 mean=4905727 sd=0.13% | |
1048576 min=34918522 mean=35015662 sd=0.19% | |
gcc-6 -flto -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.10% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4690 mean=4693 sd=0.04% | |
4096 min=32002 mean=32044 sd=0.09% | |
16384 min=196097 mean=196345 sd=0.07% | |
65536 min=1047147 mean=1048561 sd=0.09% | |
262144 min=4874748 mean=4891069 sd=0.16% | |
1048576 min=35756699 mean=35894708 sd=0.22% | |
gcc-6 -flto -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.10% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4685 mean=4692 sd=0.11% | |
4096 min=32100 mean=32134 sd=0.08% | |
16384 min=197028 mean=197064 sd=0.02% | |
65536 min=1047362 mean=1047706 sd=0.02% | |
262144 min=4793651 mean=4802553 sd=0.11% | |
1048576 min=38046812 mean=38155264 sd=0.23% | |
gcc-6 -flto -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.16% | |
256 min=875 mean=876 sd=0.09% | |
1024 min=4741 mean=4753 sd=0.12% | |
4096 min=32070 mean=32114 sd=0.08% | |
16384 min=193682 mean=193805 sd=0.04% | |
65536 min=1049561 mean=1050042 sd=0.02% | |
262144 min=4795785 mean=4806186 sd=0.12% | |
1048576 min=34536380 mean=34635924 sd=0.28% | |
gcc-6 -flto -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.05% | |
256 min=864 mean=865 sd=0.09% | |
1024 min=4680 mean=4689 sd=0.35% | |
4096 min=32290 mean=32351 sd=0.12% | |
16384 min=190279 mean=190380 sd=0.03% | |
65536 min=1053302 mean=1054364 sd=0.13% | |
262144 min=4788034 mean=4799775 sd=0.17% | |
1048576 min=34512910 mean=34616538 sd=0.24% | |
------------------------ | |
icc-16 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.00% | |
16 min=48 mean=48 sd=0.01% | |
64 min=173 mean=173 sd=0.07% | |
256 min=866 mean=868 sd=0.10% | |
1024 min=4701 mean=4712 sd=0.13% | |
4096 min=32025 mean=32107 sd=0.13% | |
16384 min=194410 mean=194493 sd=0.03% | |
65536 min=1047313 mean=1047670 sd=0.02% | |
262144 min=4825120 mean=4838436 sd=0.15% | |
1048576 min=37193058 mean=37312231 sd=0.20% | |
icc-16 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.21% | |
16 min=48 mean=48 sd=0.02% | |
64 min=177 mean=177 sd=0.19% | |
256 min=877 mean=878 sd=0.10% | |
1024 min=4724 mean=4731 sd=0.10% | |
4096 min=31973 mean=32017 sd=0.11% | |
16384 min=193711 mean=193764 sd=0.01% | |
65536 min=1058795 mean=1059251 sd=0.03% | |
262144 min=4765798 mean=4774941 sd=0.10% | |
1048576 min=37270517 mean=37377241 sd=0.22% | |
icc-16 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.13% | |
64 min=175 mean=176 sd=0.18% | |
256 min=873 mean=876 sd=0.17% | |
1024 min=4694 mean=4702 sd=0.10% | |
4096 min=31959 mean=32000 sd=0.10% | |
16384 min=193254 mean=193569 sd=0.37% | |
65536 min=1041609 mean=1041921 sd=0.02% | |
262144 min=4859827 mean=4865687 sd=0.11% | |
1048576 min=38125004 mean=38267950 sd=0.25% | |
icc-16 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=174 mean=176 sd=0.28% | |
256 min=873 mean=875 sd=0.14% | |
1024 min=4750 mean=4759 sd=0.11% | |
4096 min=32141 mean=32191 sd=0.07% | |
16384 min=193729 mean=193839 sd=0.04% | |
65536 min=1065304 mean=1065586 sd=0.02% | |
262144 min=4768996 mean=4782863 sd=0.13% | |
1048576 min=39070171 mean=39251783 sd=0.29% | |
icc-16 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.25% | |
256 min=873 mean=875 sd=0.14% | |
1024 min=4713 mean=4717 sd=0.05% | |
4096 min=32191 mean=32237 sd=0.09% | |
16384 min=195528 mean=195738 sd=0.05% | |
65536 min=1049183 mean=1049586 sd=0.02% | |
262144 min=4773643 mean=4787586 sd=0.18% | |
1048576 min=37640412 mean=37759026 sd=0.19% | |
icc-16 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=176 mean=176 sd=0.07% | |
256 min=884 mean=887 sd=0.17% | |
1024 min=4777 mean=4781 sd=0.07% | |
4096 min=32320 mean=32353 sd=0.08% | |
16384 min=193861 mean=193980 sd=0.04% | |
65536 min=1047984 mean=1049887 sd=0.33% | |
262144 min=4801125 mean=4808950 sd=0.12% | |
1048576 min=38905850 mean=39141926 sd=0.29% | |
icc-16 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.09% | |
256 min=862 mean=864 sd=0.09% | |
1024 min=4661 mean=4672 sd=0.16% | |
4096 min=32415 mean=32464 sd=0.10% | |
16384 min=194823 mean=194876 sd=0.02% | |
65536 min=1039403 mean=1040078 sd=0.03% | |
262144 min=4784139 mean=4798441 sd=0.14% | |
1048576 min=37044009 mean=37119166 sd=0.18% | |
icc-16 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=174 mean=175 sd=0.22% | |
256 min=875 mean=876 sd=0.17% | |
1024 min=4685 mean=4690 sd=0.11% | |
4096 min=32976 mean=33071 sd=0.16% | |
16384 min=191853 mean=191938 sd=0.03% | |
65536 min=1034972 mean=1035388 sd=0.02% | |
262144 min=4792165 mean=4797617 sd=0.09% | |
1048576 min=37187244 mean=37305344 sd=0.30% | |
icc-16 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.15% | |
256 min=875 mean=877 sd=0.12% | |
1024 min=4770 mean=4774 sd=0.10% | |
4096 min=32069 mean=32159 sd=0.18% | |
16384 min=194575 mean=194696 sd=0.04% | |
65536 min=1056485 mean=1057037 sd=0.03% | |
262144 min=4890761 mean=4902503 sd=0.12% | |
1048576 min=34408416 mean=34488179 sd=0.21% | |
icc-16 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.07% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4707 mean=4711 sd=0.06% | |
4096 min=32169 mean=32252 sd=0.16% | |
16384 min=199490 mean=199662 sd=0.05% | |
65536 min=1034725 mean=1035058 sd=0.02% | |
262144 min=4893211 mean=4901529 sd=0.11% | |
1048576 min=35245570 mean=35341259 sd=0.15% | |
------------------------ | |
icc-16 -ipo -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.19% | |
16 min=48 mean=48 sd=0.01% | |
64 min=172 mean=173 sd=0.06% | |
256 min=865 mean=867 sd=0.11% | |
1024 min=4675 mean=4680 sd=0.08% | |
4096 min=32456 mean=32501 sd=0.08% | |
16384 min=203901 mean=203975 sd=0.03% | |
65536 min=1035751 mean=1036319 sd=0.03% | |
262144 min=4821844 mean=4831573 sd=0.11% | |
1048576 min=35089139 mean=35204741 sd=0.36% | |
icc-16 -ipo -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.22% | |
16 min=48 mean=48 sd=0.02% | |
64 min=176 mean=176 sd=0.16% | |
256 min=874 mean=878 sd=0.19% | |
1024 min=4696 mean=4704 sd=0.14% | |
4096 min=32038 mean=32073 sd=0.08% | |
16384 min=196544 mean=196580 sd=0.01% | |
65536 min=1035583 mean=1036213 sd=0.03% | |
262144 min=4863336 mean=4870225 sd=0.11% | |
1048576 min=38654180 mean=38849223 sd=0.29% | |
icc-16 -ipo -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.18% | |
256 min=874 mean=876 sd=0.12% | |
1024 min=4715 mean=4719 sd=0.04% | |
4096 min=31920 mean=32008 sd=0.17% | |
16384 min=191408 mean=191560 sd=0.11% | |
65536 min=1049257 mean=1049560 sd=0.02% | |
262144 min=4960936 mean=4967385 sd=0.09% | |
1048576 min=38764751 mean=38862308 sd=0.21% | |
icc-16 -ipo -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.17% | |
256 min=873 mean=877 sd=0.33% | |
1024 min=4765 mean=4773 sd=0.11% | |
4096 min=32199 mean=32237 sd=0.07% | |
16384 min=191737 mean=191824 sd=0.03% | |
65536 min=1049634 mean=1049815 sd=0.01% | |
262144 min=4754288 mean=4773359 sd=0.20% | |
1048576 min=37435502 mean=37628445 sd=0.38% | |
icc-16 -ipo -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.13% | |
256 min=873 mean=875 sd=0.12% | |
1024 min=4688 mean=4695 sd=0.08% | |
4096 min=32791 mean=32822 sd=0.08% | |
16384 min=191976 mean=192121 sd=0.07% | |
65536 min=1058717 mean=1059342 sd=0.03% | |
262144 min=4848715 mean=4862228 sd=0.14% | |
1048576 min=34749847 mean=34916547 sd=0.35% | |
icc-16 -ipo -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.00% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=171 sd=0.11% | |
256 min=863 mean=865 sd=0.09% | |
1024 min=4665 mean=4677 sd=0.15% | |
4096 min=33879 mean=33949 sd=0.17% | |
16384 min=195847 mean=196085 sd=0.08% | |
65536 min=1052975 mean=1053365 sd=0.02% | |
262144 min=4905791 mean=4913855 sd=0.15% | |
1048576 min=34462198 mean=34576137 sd=0.23% | |
icc-16 -ipo -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=183 mean=187 sd=1.24% | |
256 min=873 mean=878 sd=0.37% | |
1024 min=4753 mean=4768 sd=0.16% | |
4096 min=32441 mean=32504 sd=0.08% | |
16384 min=196485 mean=196705 sd=0.05% | |
65536 min=1044382 mean=1044932 sd=0.03% | |
262144 min=4795707 mean=4804891 sd=0.12% | |
1048576 min=36215588 mean=36327559 sd=0.18% | |
icc-16 -ipo -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=174 mean=175 sd=0.23% | |
256 min=885 mean=886 sd=0.04% | |
1024 min=4691 mean=4695 sd=0.07% | |
4096 min=32239 mean=32308 sd=0.15% | |
16384 min=195920 mean=196013 sd=0.05% | |
65536 min=1047177 mean=1047487 sd=0.02% | |
262144 min=4789451 mean=4801335 sd=0.17% | |
1048576 min=39599935 mean=39757089 sd=0.28% | |
icc-16 -ipo -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=176 mean=176 sd=0.09% | |
256 min=875 mean=876 sd=0.09% | |
1024 min=11031 mean=11036 sd=0.04% | |
4096 min=32308 mean=32365 sd=0.09% | |
16384 min=197141 mean=197234 sd=0.03% | |
65536 min=1052465 mean=1052938 sd=0.02% | |
262144 min=4876275 mean=4885881 sd=0.10% | |
1048576 min=35275071 mean=35399965 sd=0.24% | |
icc-16 -ipo -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.13% | |
16 min=47 mean=47 sd=0.01% | |
64 min=176 mean=176 sd=0.09% | |
256 min=885 mean=894 sd=0.43% | |
1024 min=4743 mean=4748 sd=0.06% | |
4096 min=32201 mean=32255 sd=0.09% | |
16384 min=197968 mean=198222 sd=0.07% | |
65536 min=1058485 mean=1059243 sd=0.04% | |
262144 min=4874405 mean=4881044 sd=0.11% | |
1048576 min=36895616 mean=37033530 sd=0.23% | |
------------------------ | |
icc-17 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.17% | |
16 min=48 mean=48 sd=0.03% | |
64 min=176 mean=177 sd=0.19% | |
256 min=877 mean=879 sd=0.11% | |
1024 min=4719 mean=4722 sd=0.06% | |
4096 min=33891 mean=33942 sd=0.13% | |
16384 min=196077 mean=196166 sd=0.03% | |
65536 min=1049547 mean=1050182 sd=0.03% | |
262144 min=4792904 mean=4798968 sd=0.12% | |
1048576 min=37108409 mean=37259480 sd=0.25% | |
icc-17 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.27% | |
16 min=48 mean=48 sd=0.01% | |
64 min=173 mean=173 sd=0.15% | |
256 min=868 mean=869 sd=0.08% | |
1024 min=4687 mean=4689 sd=0.03% | |
4096 min=32062 mean=32108 sd=0.10% | |
16384 min=192745 mean=192853 sd=0.04% | |
65536 min=1049665 mean=1050401 sd=0.04% | |
262144 min=4772367 mean=4779350 sd=0.08% | |
1048576 min=35012764 mean=35146662 sd=0.21% | |
icc-17 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=176 mean=176 sd=0.21% | |
256 min=874 mean=876 sd=0.09% | |
1024 min=4702 mean=4708 sd=0.08% | |
4096 min=31986 mean=32018 sd=0.09% | |
16384 min=193305 mean=193432 sd=0.06% | |
65536 min=1056080 mean=1056555 sd=0.03% | |
262144 min=4833338 mean=4838814 sd=0.09% | |
1048576 min=34929217 mean=35071403 sd=0.19% | |
icc-17 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.03% | |
64 min=175 mean=176 sd=0.09% | |
256 min=879 mean=881 sd=0.16% | |
1024 min=4744 mean=4752 sd=0.14% | |
4096 min=32191 mean=32254 sd=0.15% | |
16384 min=193595 mean=193680 sd=0.03% | |
65536 min=1051794 mean=1052503 sd=0.03% | |
262144 min=4935312 mean=4945130 sd=0.12% | |
1048576 min=34742182 mean=34850701 sd=0.24% | |
icc-17 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.37% | |
64 min=171 mean=172 sd=0.07% | |
256 min=863 mean=864 sd=0.06% | |
1024 min=4640 mean=4652 sd=0.25% | |
4096 min=32281 mean=32349 sd=0.13% | |
16384 min=194712 mean=194794 sd=0.03% | |
65536 min=1050320 mean=1051062 sd=0.05% | |
262144 min=4839224 mean=4850537 sd=0.16% | |
1048576 min=38837008 mean=38998541 sd=0.25% | |
icc-17 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.41% | |
256 min=876 mean=876 sd=0.04% | |
1024 min=4715 mean=4721 sd=0.07% | |
4096 min=32101 mean=32184 sd=0.19% | |
16384 min=191707 mean=191775 sd=0.03% | |
65536 min=1045560 mean=1045915 sd=0.04% | |
262144 min=4916270 mean=4922517 sd=0.11% | |
1048576 min=33978519 mean=34086617 sd=0.28% | |
icc-17 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.26% | |
256 min=875 mean=876 sd=0.08% | |
1024 min=4769 mean=4774 sd=0.09% | |
4096 min=32320 mean=32365 sd=0.10% | |
16384 min=197284 mean=197438 sd=0.05% | |
65536 min=1048943 mean=1049203 sd=0.02% | |
262144 min=4846744 mean=4862920 sd=0.20% | |
1048576 min=33696984 mean=33844829 sd=0.36% | |
icc-17 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.15% | |
256 min=875 mean=882 sd=0.85% | |
1024 min=4777 mean=4814 sd=0.27% | |
4096 min=32123 mean=32178 sd=0.09% | |
16384 min=190429 mean=190574 sd=0.04% | |
65536 min=1048061 mean=1048248 sd=0.01% | |
262144 min=4773521 mean=4789231 sd=0.16% | |
1048576 min=38358290 mean=38541396 sd=0.33% | |
icc-17 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.08% | |
256 min=864 mean=865 sd=0.08% | |
1024 min=4681 mean=4688 sd=0.12% | |
4096 min=32158 mean=32257 sd=0.15% | |
16384 min=191847 mean=191945 sd=0.04% | |
65536 min=1044494 mean=1044743 sd=0.02% | |
262144 min=4868322 mean=4878141 sd=0.12% | |
1048576 min=39550829 mean=39723231 sd=0.26% | |
icc-17 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.22% | |
256 min=863 mean=865 sd=0.09% | |
1024 min=4691 mean=4696 sd=0.06% | |
4096 min=32098 mean=32195 sd=0.15% | |
16384 min=196628 mean=196911 sd=0.07% | |
65536 min=1048424 mean=1048849 sd=0.02% | |
262144 min=4908673 mean=4916802 sd=0.10% | |
1048576 min=33701294 mean=33861685 sd=0.36% | |
------------------------ | |
icc-17 -ipo -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.22% | |
16 min=48 mean=48 sd=0.12% | |
64 min=172 mean=173 sd=0.11% | |
256 min=865 mean=868 sd=0.22% | |
1024 min=4687 mean=4700 sd=0.13% | |
4096 min=32103 mean=32134 sd=0.08% | |
16384 min=194224 mean=194627 sd=0.39% | |
65536 min=1052157 mean=1052954 sd=0.06% | |
262144 min=4781997 mean=4797994 sd=0.14% | |
1048576 min=35695388 mean=35776103 sd=0.17% | |
icc-17 -ipo -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=19 mean=19 sd=0.19% | |
16 min=48 mean=48 sd=0.01% | |
64 min=173 mean=173 sd=0.12% | |
256 min=866 mean=868 sd=0.10% | |
1024 min=4679 mean=4687 sd=0.10% | |
4096 min=32196 mean=32304 sd=0.23% | |
16384 min=191524 mean=191833 sd=0.37% | |
65536 min=1064101 mean=1064649 sd=0.04% | |
262144 min=4776166 mean=4795321 sd=0.21% | |
1048576 min=36423467 mean=36558875 sd=0.27% | |
icc-17 -ipo -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=176 mean=176 sd=0.25% | |
256 min=876 mean=877 sd=0.07% | |
1024 min=4701 mean=4709 sd=0.09% | |
4096 min=32198 mean=32228 sd=0.12% | |
16384 min=193236 mean=193305 sd=0.03% | |
65536 min=1050999 mean=1051655 sd=0.03% | |
262144 min=4870323 mean=4888583 sd=0.20% | |
1048576 min=37721715 mean=37898257 sd=0.26% | |
icc-17 -ipo -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=175 sd=0.13% | |
256 min=899 mean=900 sd=0.08% | |
1024 min=4760 mean=4768 sd=0.11% | |
4096 min=32091 mean=32156 sd=0.12% | |
16384 min=194049 mean=194196 sd=0.05% | |
65536 min=1073212 mean=1073849 sd=0.03% | |
262144 min=4814006 mean=4826569 sd=0.13% | |
1048576 min=37401758 mean=37546346 sd=0.22% | |
icc-17 -ipo -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.09% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4612 mean=4627 sd=0.28% | |
4096 min=32192 mean=32251 sd=0.12% | |
16384 min=192791 mean=192934 sd=0.04% | |
65536 min=1044926 mean=1045217 sd=0.02% | |
262144 min=4910397 mean=4923834 sd=0.46% | |
1048576 min=38537544 mean=38683478 sd=0.29% | |
icc-17 -ipo -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.14% | |
256 min=863 mean=864 sd=0.09% | |
1024 min=4702 mean=4713 sd=0.15% | |
4096 min=32206 mean=32254 sd=0.12% | |
16384 min=197320 mean=197408 sd=0.03% | |
65536 min=1049449 mean=1049754 sd=0.02% | |
262144 min=4892760 mean=4903506 sd=0.40% | |
1048576 min=36074416 mean=36202949 sd=0.29% | |
icc-17 -ipo -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=176 mean=176 sd=0.07% | |
256 min=875 mean=880 sd=0.36% | |
1024 min=4761 mean=4770 sd=0.16% | |
4096 min=32241 mean=32308 sd=0.12% | |
16384 min=193581 mean=193659 sd=0.03% | |
65536 min=1047644 mean=1047909 sd=0.02% | |
262144 min=4752623 mean=4769552 sd=0.15% | |
1048576 min=39208966 mean=39315415 sd=0.20% | |
icc-17 -ipo -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.07% | |
256 min=863 mean=864 sd=0.07% | |
1024 min=4694 mean=4700 sd=0.19% | |
4096 min=31994 mean=32061 sd=0.13% | |
16384 min=193943 mean=194020 sd=0.02% | |
65536 min=1053122 mean=1053893 sd=0.04% | |
262144 min=4805329 mean=4818054 sd=0.18% | |
1048576 min=36793717 mean=36954812 sd=0.25% | |
icc-17 -ipo -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=174 mean=177 sd=1.43% | |
256 min=863 mean=864 sd=0.06% | |
1024 min=4700 mean=4707 sd=0.08% | |
4096 min=32720 mean=32798 sd=0.12% | |
16384 min=191078 mean=191171 sd=0.03% | |
65536 min=1053978 mean=1054850 sd=0.06% | |
262144 min=4848433 mean=4855945 sd=0.09% | |
1048576 min=38467435 mean=38628216 sd=0.34% | |
icc-17 -ipo -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.13% | |
256 min=864 mean=865 sd=0.08% | |
1024 min=4665 mean=4669 sd=0.07% | |
4096 min=32138 mean=32237 sd=0.26% | |
16384 min=192695 mean=192791 sd=0.03% | |
65536 min=1055380 mean=1055733 sd=0.03% | |
262144 min=4860588 mean=4866786 sd=0.09% | |
1048576 min=38675404 mean=38780668 sd=0.16% | |
------------------------ | |
clang-4.0 -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=48 mean=48 sd=0.02% | |
64 min=177 mean=177 sd=0.05% | |
256 min=875 mean=876 sd=0.08% | |
1024 min=4772 mean=4780 sd=0.09% | |
4096 min=32159 mean=32234 sd=0.24% | |
16384 min=195092 mean=195321 sd=0.04% | |
65536 min=1043926 mean=1044289 sd=0.02% | |
262144 min=4749236 mean=4765547 sd=0.15% | |
1048576 min=34541012 mean=34612756 sd=0.16% | |
clang-4.0 -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.06% | |
16 min=48 mean=48 sd=0.06% | |
64 min=171 mean=171 sd=0.14% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4709 mean=4716 sd=0.11% | |
4096 min=32200 mean=32288 sd=0.25% | |
16384 min=194531 mean=194614 sd=0.03% | |
65536 min=1058554 mean=1058835 sd=0.02% | |
262144 min=4856730 mean=4863840 sd=0.08% | |
1048576 min=33910789 mean=34070913 sd=0.34% | |
clang-4.0 -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.08% | |
256 min=864 mean=864 sd=0.07% | |
1024 min=4697 mean=4705 sd=0.12% | |
4096 min=38230 mean=38311 sd=0.18% | |
16384 min=191597 mean=191761 sd=0.06% | |
65536 min=1051194 mean=1052048 sd=0.03% | |
262144 min=4836443 mean=4847817 sd=0.16% | |
1048576 min=38984373 mean=39122783 sd=0.26% | |
clang-4.0 -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.23% | |
256 min=875 mean=876 sd=0.07% | |
1024 min=4697 mean=4700 sd=0.04% | |
4096 min=31966 mean=32045 sd=0.25% | |
16384 min=189698 mean=189821 sd=0.04% | |
65536 min=1061335 mean=1061706 sd=0.02% | |
262144 min=4723954 mean=4737297 sd=0.18% | |
1048576 min=38038958 mean=38158495 sd=0.27% | |
clang-4.0 -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.14% | |
256 min=864 mean=865 sd=0.04% | |
1024 min=4664 mean=4669 sd=0.05% | |
4096 min=32133 mean=32199 sd=0.17% | |
16384 min=189889 mean=190019 sd=0.04% | |
65536 min=1054775 mean=1055636 sd=0.06% | |
262144 min=4799844 mean=4809442 sd=0.20% | |
1048576 min=37363501 mean=37481119 sd=0.20% | |
clang-4.0 -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.25% | |
256 min=874 mean=876 sd=0.10% | |
1024 min=4697 mean=4713 sd=0.14% | |
4096 min=32419 mean=32463 sd=0.15% | |
16384 min=191312 mean=191443 sd=0.04% | |
65536 min=1066708 mean=1067178 sd=0.03% | |
262144 min=4782455 mean=4793902 sd=0.11% | |
1048576 min=37570285 mean=37718289 sd=0.28% | |
clang-4.0 -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=172 sd=0.48% | |
256 min=864 mean=865 sd=0.02% | |
1024 min=4705 mean=4709 sd=0.06% | |
4096 min=32131 mean=32188 sd=0.22% | |
16384 min=193911 mean=193984 sd=0.04% | |
65536 min=1044802 mean=1045243 sd=0.03% | |
262144 min=4768817 mean=4780161 sd=0.23% | |
1048576 min=39456333 mean=39610953 sd=0.27% | |
clang-4.0 -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=175 sd=0.19% | |
256 min=874 mean=876 sd=0.12% | |
1024 min=4710 mean=4715 sd=0.07% | |
4096 min=34858 mean=35040 sd=0.65% | |
16384 min=192522 mean=192629 sd=0.03% | |
65536 min=1049267 mean=1049685 sd=0.02% | |
262144 min=4787709 mean=4809667 sd=0.25% | |
1048576 min=38506532 mean=38636433 sd=0.21% | |
clang-4.0 -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=175 mean=176 sd=0.13% | |
256 min=874 mean=875 sd=0.11% | |
1024 min=4709 mean=4720 sd=0.13% | |
4096 min=34253 mean=34287 sd=0.05% | |
16384 min=193202 mean=193356 sd=0.05% | |
65536 min=1050892 mean=1051440 sd=0.05% | |
262144 min=4752501 mean=4765067 sd=0.13% | |
1048576 min=38089855 mean=38362035 sd=0.34% | |
clang-4.0 -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.07% | |
256 min=949 mean=949 sd=0.02% | |
1024 min=4663 mean=4670 sd=0.11% | |
4096 min=32289 mean=32342 sd=0.06% | |
16384 min=191938 mean=192230 sd=0.15% | |
65536 min=1049918 mean=1050352 sd=0.04% | |
262144 min=4832042 mean=4840957 sd=0.14% | |
1048576 min=37942245 mean=38151352 sd=0.28% | |
------------------------ | |
clang-4.0 -flto -O0 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=48 mean=48 sd=0.03% | |
64 min=177 mean=177 sd=0.05% | |
256 min=875 mean=876 sd=0.14% | |
1024 min=4706 mean=4711 sd=0.04% | |
4096 min=31998 mean=32092 sd=0.15% | |
16384 min=191723 mean=191962 sd=0.13% | |
65536 min=1051391 mean=1051880 sd=0.02% | |
262144 min=4856748 mean=4862138 sd=0.07% | |
1048576 min=34968430 mean=35116763 sd=0.25% | |
clang-4.0 -flto -O0 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.22% | |
16 min=47 mean=48 sd=0.02% | |
64 min=171 mean=171 sd=0.05% | |
256 min=864 mean=865 sd=0.07% | |
1024 min=4613 mean=4621 sd=0.15% | |
4096 min=31972 mean=32059 sd=0.15% | |
16384 min=195094 mean=195257 sd=0.12% | |
65536 min=1055860 mean=1056521 sd=0.07% | |
262144 min=4838024 mean=4848831 sd=0.10% | |
1048576 min=34255313 mean=34378157 sd=0.33% | |
clang-4.0 -flto -O1 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.08% | |
256 min=865 mean=865 sd=0.03% | |
1024 min=4646 mean=4651 sd=0.11% | |
4096 min=38418 mean=38492 sd=0.13% | |
16384 min=193196 mean=193401 sd=0.13% | |
65536 min=1059756 mean=1060029 sd=0.03% | |
262144 min=4764165 mean=4774396 sd=0.14% | |
1048576 min=37383556 mean=37437254 sd=0.13% | |
clang-4.0 -flto -O1 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.02% | |
64 min=175 mean=176 sd=0.09% | |
256 min=874 mean=875 sd=0.10% | |
1024 min=4698 mean=4702 sd=0.05% | |
4096 min=32117 mean=32140 sd=0.07% | |
16384 min=197803 mean=198013 sd=0.12% | |
65536 min=1047778 mean=1048376 sd=0.03% | |
262144 min=4855357 mean=4866418 sd=0.12% | |
1048576 min=36671287 mean=36834387 sd=0.28% | |
clang-4.0 -flto -O2 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.06% | |
256 min=864 mean=865 sd=0.03% | |
1024 min=4900 mean=4906 sd=0.09% | |
4096 min=32586 mean=32646 sd=0.17% | |
16384 min=198363 mean=198733 sd=0.12% | |
65536 min=1061351 mean=1061809 sd=0.02% | |
262144 min=4793395 mean=4801621 sd=0.13% | |
1048576 min=39129701 mean=39282996 sd=0.28% | |
clang-4.0 -flto -O2 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.02% | |
64 min=171 mean=172 sd=0.11% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4656 mean=4669 sd=0.17% | |
4096 min=40032 mean=40086 sd=0.09% | |
16384 min=194326 mean=194661 sd=0.15% | |
65536 min=1061353 mean=1061776 sd=0.02% | |
262144 min=4785557 mean=4794235 sd=0.13% | |
1048576 min=38030266 mean=38164632 sd=0.18% | |
clang-4.0 -flto -O3 fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.04% | |
256 min=864 mean=865 sd=0.05% | |
1024 min=4687 mean=4691 sd=0.04% | |
4096 min=32144 mean=32243 sd=0.11% | |
16384 min=194794 mean=194998 sd=0.13% | |
65536 min=1055720 mean=1056722 sd=0.05% | |
262144 min=4785085 mean=4799322 sd=0.14% | |
1048576 min=35234914 mean=35341889 sd=0.20% | |
clang-4.0 -flto -O3 -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.02% | |
64 min=174 mean=175 sd=0.26% | |
256 min=873 mean=875 sd=0.14% | |
1024 min=4693 mean=4696 sd=0.05% | |
4096 min=34472 mean=34606 sd=0.29% | |
16384 min=201542 mean=201719 sd=0.13% | |
65536 min=1054263 mean=1054716 sd=0.03% | |
262144 min=4852508 mean=4860416 sd=0.10% | |
1048576 min=38470514 mean=38646777 sd=0.36% | |
clang-4.0 -flto -Ofast fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.01% | |
16 min=47 mean=47 sd=0.01% | |
64 min=171 mean=171 sd=0.08% | |
256 min=864 mean=865 sd=0.06% | |
1024 min=4699 mean=4705 sd=0.07% | |
4096 min=32232 mean=32333 sd=0.17% | |
16384 min=196574 mean=196722 sd=0.14% | |
65536 min=1046890 mean=1047374 sd=0.02% | |
262144 min=4813586 mean=4824912 sd=0.13% | |
1048576 min=34627022 mean=34799847 sd=0.31% | |
clang-4.0 -flto -Ofast -march=native fft-test-asm | |
Self-test passed | |
Size Time per FFT (ns) | |
4 min=18 mean=18 sd=0.02% | |
16 min=47 mean=47 sd=0.01% | |
64 min=170 mean=171 sd=0.10% | |
256 min=864 mean=864 sd=0.05% | |
1024 min=4648 mean=4655 sd=0.12% | |
4096 min=32223 mean=32313 sd=0.20% | |
16384 min=191956 mean=192211 sd=0.15% | |
65536 min=1046127 mean=1046375 sd=0.02% | |
262144 min=4772847 mean=4783577 sd=0.16% | |
1048576 min=37877161 mean=38016011 sd=0.24% |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment