Implementation notes: amd64, genji548, crypto_kem/ntskem1264

Computer: genji548
Architecture: amd64
CPU ID: GenuineIntel-00050654-bfebfbff
SUPERCOP version: 20191017
Operation: crypto_kem
Primitive: ntskem1264
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
40060493735 6228 16123629 7120 1640avx2gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
42211865341 6228 1692557 7120 1640avx2gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
42227666913 6228 1694253 7120 1640avx2gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
43753087024 6228 16116965 7120 1640sse2gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
45289660481 6228 1687821 7120 1640sse2gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
46257658966 6228 1686181 7120 1640sse2gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
50633859492 6228 1685892 7112 1608avx2gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
57250654691 6228 1681156 7112 1608sse2gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
697274187144 6276 16221981 7192 1640opticc_-march=icelake-client_-mtune=icelake-client_-O3_-fomit-frame-pointer2019102020191017
698388155408 6276 16189373 7192 1608opticc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102020191017
698436155408 6276 16189373 7192 1608opticc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102020191017
700676155408 6276 16189373 7192 1608opticc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102020191017
702342155120 6276 16189621 7192 1640opticc_-march=skylake-avx512_-mtune=skylake-avx512_-O3_-fomit-frame-pointer2019102020191017
703592155408 6276 16189373 7192 1608opticc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102020191017
715990150616 6276 16185229 7192 1640opticc_-march=skylake-avx512_-mtune=skylake-avx512_-O2_-fomit-frame-pointer2019102020191017
71828488476 6228 16119965 7120 1640optgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
725830179696 6276 16214885 7192 1640opticc_-march=icelake-client_-mtune=icelake-client_-O2_-fomit-frame-pointer2019102020191017
737662150832 6276 16185197 7192 1608opticc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102020191017
740550150848 6276 16185213 7192 1608opticc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102020191017
741132150832 6276 16185197 7192 1608opticc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102020191017
741510150832 6276 16185197 7192 1608opticc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102020191017
76205855520 6228 1684509 7120 1640optgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
774022120592 6276 16154589 7192 1608opticc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102020191017
775736120592 6276 16154589 7192 1608opticc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102020191017
776708120592 6276 16154589 7192 1608opticc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102020191017
778284120592 6276 16154589 7192 1608opticc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102020191017
781210120224 6276 16152973 7192 1608opticc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102020191017
783856121792 6276 16155821 7192 1608opticc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102020191017
784542121792 6276 16155821 7192 1608opticc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102020191017
784748121792 6276 16155821 7192 1608opticc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102020191017
785422121008 6276 16153813 7192 1608opticc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102020191017
785630121792 6276 16155821 7192 1608opticc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102020191017
84643053949 6228 1682725 7120 1640optgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
90305849459 6228 1677284 7112 1608optgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
5971136108256 100 16142613 1016 1608reficc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102020191017
5978014108256 100 16142613 1016 1608reficc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102020191017
6014046108272 100 16142629 1016 1608reficc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102020191017
6015970108272 100 16142629 1016 1608reficc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102020191017
6019756108632 100 16143269 1016 1640reficc_-march=skylake-avx512_-mtune=skylake-avx512_-O2_-fomit-frame-pointer2019102020191017
6039388135648 100 16170829 1016 1640reficc_-march=icelake-client_-mtune=icelake-client_-O2_-fomit-frame-pointer2019102020191017
6077914112848 100 16147373 1016 1640reficc_-march=skylake-avx512_-mtune=skylake-avx512_-O3_-fomit-frame-pointer2019102020191017
6113622111800 100 16145757 1016 1608reficc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102020191017
6121686111800 100 16145757 1016 1608reficc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102020191017
6128070111800 100 16145757 1016 1608reficc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102020191017
6152666143376 100 16178205 1016 1640reficc_-march=icelake-client_-mtune=icelake-client_-O3_-fomit-frame-pointer2019102020191017
6169724111800 100 16145757 1016 1608reficc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102020191017
623669678352 100 16111149 1016 1608reficc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102020191017
624520075888 100 16109877 1016 1608reficc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102020191017
624649676368 100 16109109 1016 1608reficc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102020191017
625075275888 100 16109877 1016 1608reficc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102020191017
626064875888 100 16109877 1016 1608reficc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102020191017
626209475888 100 16109877 1016 1608reficc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102020191017
627494478256 100 16112277 1016 1608reficc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102020191017
628051678256 100 16112277 1016 1608reficc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102020191017
628148478256 100 16112277 1016 1608reficc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102020191017
628493678256 100 16112277 1016 1608reficc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102020191017
632962447774 76 1679405 944 1640refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
637178224543 76 1653517 944 1640refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
668671822830 76 1651597 944 1640refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017
798477419286 76 1647100 936 1608refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102020191017

Test failure

Implementation: opt
Security model: unknown
Compiler: icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer opt
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer opt
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer ref
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer ref

Compiler output

Implementation: avx2
Security model: unknown
Compiler: icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer
nts_kem.c: nts_kem.c(717): error: expression must have integral type
nts_kem.c: v[i] = ~v[i];
nts_kem.c: ^
nts_kem.c:
nts_kem.c: compilation aborted for nts_kem.c (code 2)

Number of similar (compiler,implementation) pairs: 38, namely:
Compiler | Implementations
icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer avx2
icc -march=broadwell -mtune=broadwell -O3 -fomit-frame-pointer avx2
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer avx2
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer avx2
icc -march=core-avx2 -mtune=core-avx2 -O2 -fomit-frame-pointer avx2
icc -march=core-avx2 -mtune=core-avx2 -O3 -fomit-frame-pointer avx2
icc -march=haswell -mtune=haswell -O2 -fomit-frame-pointer avx2
icc -march=haswell -mtune=haswell -O3 -fomit-frame-pointer avx2
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer avx2
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer avx2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer avx2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer avx2
icc -march=skylake -mtune=skylake -O2 -fomit-frame-pointer avx2
icc -march=skylake -mtune=skylake -O3 -fomit-frame-pointer avx2
icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer sse2
icc -march=broadwell -mtune=broadwell -O3 -fomit-frame-pointer sse2
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer sse2
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer sse2
icc -march=core-avx-i -mtune=core-avx-i -O2 -fomit-frame-pointer sse2
icc -march=core-avx-i -mtune=core-avx-i -O3 -fomit-frame-pointer sse2
icc -march=core-avx2 -mtune=core-avx2 -O2 -fomit-frame-pointer sse2
icc -march=core-avx2 -mtune=core-avx2 -O3 -fomit-frame-pointer sse2
icc -march=corei7-avx -mtune=corei7-avx -O2 -fomit-frame-pointer sse2
icc -march=corei7-avx -mtune=corei7-avx -O3 -fomit-frame-pointer sse2
icc -march=corei7 -mtune=corei7 -O2 -fomit-frame-pointer sse2
icc -march=corei7 -mtune=corei7 -O3 -fomit-frame-pointer sse2
icc -march=haswell -mtune=haswell -O2 -fomit-frame-pointer sse2
icc -march=haswell -mtune=haswell -O3 -fomit-frame-pointer sse2
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer sse2
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer sse2
icc -march=ivybridge -mtune=ivybridge -O2 -fomit-frame-pointer sse2
icc -march=ivybridge -mtune=ivybridge -O3 -fomit-frame-pointer sse2
icc -march=sandybridge -mtune=sandybridge -O2 -fomit-frame-pointer sse2
icc -march=sandybridge -mtune=sandybridge -O3 -fomit-frame-pointer sse2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer sse2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer sse2
icc -march=skylake -mtune=skylake -O2 -fomit-frame-pointer sse2
icc -march=skylake -mtune=skylake -O3 -fomit-frame-pointer sse2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: icc -march=core-avx-i -mtune=core-avx-i -O2 -fomit-frame-pointer
ff.c: ff.c(104): warning #167: argument of type "vector *" is incompatible with parameter of type "__m256i *"
ff.c: bitslice_mul12_256(c, a, b);
ff.c: ^
ff.c:
ff.c: ff.c(104): warning #167: argument of type "const vector *" is incompatible with parameter of type "const __m256i *"
ff.c: bitslice_mul12_256(c, a, b);
ff.c: ^
ff.c:
ff.c: ff.c(104): warning #167: argument of type "const vector *" is incompatible with parameter of type "const __m256i *"
ff.c: bitslice_mul12_256(c, a, b);
ff.c: ^
ff.c:
nts_kem.c: nts_kem.c(373): error: a value of type "union __m256i" cannot be assigned to an entity of type "vector"
nts_kem.c: Q[i][NTS_KEM_PARAM_R_VEC-1] = _mm256_setzero_si256();
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(409): error: a value of type "union __m256i" cannot be assigned to an entity of type "vector"
nts_kem.c: c_c[i] = _mm256_setzero_si256();
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(517): error: a value of type "union __m256i" cannot be used to initialize an entity of type "vector"
nts_kem.c: vector allones = _mm256_set1_epi64x(-1);
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(592): warning #167: argument of type "vector (*)[12]" is incompatible with parameter of type "__m256i (*)[12]"
nts_kem.c: bitslice_fft(evals, sigma, -(1ULL-extended_error));
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(608): warning #167: argument of type "vector *" is incompatible with parameter of type "const __m256i *"
nts_kem.c: error[i] = vector_ff_or(evals[i]);
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(608): error: a value of type "__m256i" cannot be assigned to an entity of type "vector"
nts_kem.c: error[i] = vector_ff_or(evals[i]);
nts_kem.c: ^
nts_kem.c:
nts_kem.c: nts_kem.c(609): error: argument of type "vector" is incompatible with parameter of type "union __m256i"
nts_kem.c: ...

Number of similar (compiler,implementation) pairs: 10, namely:
Compiler | Implementations
icc -march=core-avx-i -mtune=core-avx-i -O2 -fomit-frame-pointer avx2
icc -march=core-avx-i -mtune=core-avx-i -O3 -fomit-frame-pointer avx2
icc -march=corei7-avx -mtune=corei7-avx -O2 -fomit-frame-pointer avx2
icc -march=corei7-avx -mtune=corei7-avx -O3 -fomit-frame-pointer avx2
icc -march=corei7 -mtune=corei7 -O2 -fomit-frame-pointer avx2
icc -march=corei7 -mtune=corei7 -O3 -fomit-frame-pointer avx2
icc -march=ivybridge -mtune=ivybridge -O2 -fomit-frame-pointer avx2
icc -march=ivybridge -mtune=ivybridge -O3 -fomit-frame-pointer avx2
icc -march=sandybridge -mtune=sandybridge -O2 -fomit-frame-pointer avx2
icc -march=sandybridge -mtune=sandybridge -O3 -fomit-frame-pointer avx2