Implementation notes: amd64, genji346, crypto_core/multsntrup653

Computer: genji346
Architecture: amd64
CPU ID: AuthenticAMD-00830f10-178bfbff
SUPERCOP version: 20191017
Operation: crypto_core
Primitive: multsntrup653
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
1560016728 32 033142 904 768avxicc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102520191017
1560016728 32 033142 904 768avxicc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102520191017
1562016728 32 033142 904 768avxicc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102520191017
1562016856 32 032006 904 768avxicc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102520191017
1566016792 32 033606 904 768avxicc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102520191017
1568016728 32 033142 904 768avxicc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102520191017
1570016792 32 033606 904 768avxicc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102520191017
1570016840 32 032046 904 768avxicc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102520191017
1570016792 32 033606 904 768avxicc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102520191017
1574016792 32 033606 904 768avxicc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102520191017
1594015798 0 029081 816 800avxgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
1812014781 0 025660 808 800avxgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
1860014869 0 025972 808 800avxgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
2104015326 0 025388 800 800avxgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
2310019224 32 035670 904 768avxicc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102520191017
2310019224 32 035670 904 768avxicc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102520191017
2312019224 32 035670 904 768avxicc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102520191017
2324019224 32 035670 904 768avxicc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102520191017
2334019272 32 035686 904 768avxicc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102520191017
2346019272 32 035686 904 768avxicc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102520191017
2348019272 32 035686 904 768avxicc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102520191017
2348019272 32 035686 904 768avxicc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102520191017
1362204273 0 017545 816 800refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
1404602453 0 015219 808 776refclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2019102520191017
1406002453 0 015219 808 776refclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2019102520191017
1412203061 0 016451 808 776refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2019102520191017
2984203424 0 020190 864 768reficc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102520191017
2987803424 0 020190 864 768reficc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102520191017
2990003424 0 020190 864 768reficc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102520191017
2992003424 0 020190 864 768reficc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102520191017
3000603552 0 019918 864 768reficc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102520191017
3005603552 0 019918 864 768reficc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102520191017
3005603552 0 019918 864 768reficc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102520191017
3008603552 0 019918 864 768reficc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102520191017
3248402976 0 018118 864 768reficc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102520191017
3261002904 0 019302 864 768reficc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102520191017
3261202904 0 019302 864 768reficc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102520191017
3263002904 0 019302 864 768reficc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102520191017
3264402904 0 019302 864 768reficc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102520191017
3266202904 0 019270 864 768reficc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102520191017
3266802904 0 019270 864 768reficc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102520191017
3270202904 0 019270 864 768reficc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102520191017
3275602904 0 019270 864 768reficc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102520191017
3525002944 0 018030 864 768reficc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102520191017
4026603635 0 016787 808 760refclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2019102520191017
1102080596 0 010721 800 760refclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2019102520191017
1144280466 0 010492 800 800refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
1157000537 0 011388 808 800refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017
1184940606 0 011660 808 800refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102520191017

Test failure

Implementation: crypto_core/multsntrup653/avx
Compiler: icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 12, namely:
Compiler | Implementations
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer avx ref
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer avx ref
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer avx ref
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer avx ref
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer avx ref
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer avx ref

Compiler output

Implementation: crypto_core/multsntrup653/avx
Compiler: clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE
mult768.c: In file included from mult768.c:2:
mult768.c: In file included from /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/immintrin.h:27:
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:55:72: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline void __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:61:72: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline void __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:68:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:74:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:84:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:90:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:97:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ^
mult768.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/mmintrin.h:103:74: warning: unknown attribute '__artificial__' ignored [-Wunknown-attributes]
mult768.c: extern __inline __m64 __attribute__((__gnu_inline__, __always_inline__, __artificial__))
mult768.c: ...

Number of similar (compiler,implementation) pairs: 5, namely:
Compiler | Implementations
clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE avx
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE avx
clang -march=native -O -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE avx
clang -march=native -Os -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE avx
clang -mcpu=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE avx

Compiler output

Implementation: crypto_core/multsntrup653/avx
Compiler: icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer
mult768.c: mult768.c(196): warning #167: argument of type "int16={int16_t={short}} (*)[512]" is incompatible with parameter of type "const int16={int16_t={short}} (*)[512]"
mult768.c: ungood(h_7681,hpad);
mult768.c: ^
mult768.c:
mult768.c: mult768.c(224): warning #167: argument of type "int16={int16_t={short}} (*)[512]" is incompatible with parameter of type "const int16={int16_t={short}} (*)[512]"
mult768.c: ungood(h_10753,hpad);
mult768.c: ^
mult768.c:

Number of similar (compiler,implementation) pairs: 24, namely:
Compiler | Implementations
icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer avx
icc -march=broadwell -mtune=broadwell -O3 -fomit-frame-pointer avx
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer avx
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer avx
icc -march=core-avx-i -mtune=core-avx-i -O2 -fomit-frame-pointer avx
icc -march=core-avx-i -mtune=core-avx-i -O3 -fomit-frame-pointer avx
icc -march=core-avx2 -mtune=core-avx2 -O2 -fomit-frame-pointer avx
icc -march=core-avx2 -mtune=core-avx2 -O3 -fomit-frame-pointer avx
icc -march=corei7-avx -mtune=corei7-avx -O2 -fomit-frame-pointer avx
icc -march=corei7-avx -mtune=corei7-avx -O3 -fomit-frame-pointer avx
icc -march=corei7 -mtune=corei7 -O2 -fomit-frame-pointer avx
icc -march=corei7 -mtune=corei7 -O3 -fomit-frame-pointer avx
icc -march=haswell -mtune=haswell -O2 -fomit-frame-pointer avx
icc -march=haswell -mtune=haswell -O3 -fomit-frame-pointer avx
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer avx
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer avx
icc -march=ivybridge -mtune=ivybridge -O2 -fomit-frame-pointer avx
icc -march=ivybridge -mtune=ivybridge -O3 -fomit-frame-pointer avx
icc -march=sandybridge -mtune=sandybridge -O2 -fomit-frame-pointer avx
icc -march=sandybridge -mtune=sandybridge -O3 -fomit-frame-pointer avx
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer avx
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer avx
icc -march=skylake -mtune=skylake -O2 -fomit-frame-pointer avx
icc -march=skylake -mtune=skylake -O3 -fomit-frame-pointer avx