Implementation notes: aarch64, hikey960, crypto_kem/ntskem13136

Computer: hikey960
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_kem
Primitive: ntskem13136
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
365132496320 84 16115201 1048 1616optgcc_-funroll-loops_-O3_-fomit-frame-pointer2019121020190816
395560179580 84 1698209 1040 1584optgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
404176579100 84 1697953 1040 1584optgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
409108258420 84 1673969 1040 1584optgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
409108255245 84 1670172 1024 1584optgcc_-funroll-loops_-Os_-fomit-frame-pointer2019121020190816
412439774121 84 1690482 944 1600optclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019121020190816
416612759116 84 1674769 1040 1584optgcc_-O_-fomit-frame-pointer2019121020190816
420165959116 84 1674769 1040 1584optgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
448642079100 84 1697953 1040 1584optgcc_-funroll-loops_-O_-fomit-frame-pointer2019121020190816
504833396844 84 16115705 1048 1616optgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
647685057604 84 1673209 1040 1584optgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019121020190816
662670078732 84 1695945 1048 1616optgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019121020190816
687544274457 84 1690794 944 1600optclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019121020190816
743812979012 84 1697601 1040 1584optgcc_-funroll-loops_-O2_-fomit-frame-pointer2019121020190816
774597680504 84 1697737 1048 1616optgcc_-O3_-fomit-frame-pointer2019121020190816
776722574121 84 1690482 944 1600optclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019121020190816
805688157656 84 1673257 1040 1584optgcc_-O2_-fomit-frame-pointer2019121020190816
824175055205 84 1670116 1024 1584optgcc_-Os_-fomit-frame-pointer2019121020190816
844202181276 84 1698481 1048 1616optgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
931265355245 84 1670172 1024 1584optgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
982792555205 84 1670116 1024 1584optgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
1046836074121 84 1690482 944 1600optclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019121020190816
1083625959292 84 1674945 1040 1584optgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019121020190816
14616401525096 84 16543757 1024 1584optgcc_-funroll-loops2019121020190816
1568737825477 76 1641898 936 1600refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019121020190816
1637136934288 76 1652857 1032 1584refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019121020190816
1862109955197 84 1670108 1024 1584optgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019121020190816
19067285525096 84 16543757 1024 1584optgcc2019121020190816
2180776532072 76 1650897 1032 1584refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
2258534935104 76 1652297 1032 1616refgcc_-O3_-fomit-frame-pointer2019121020190816
2402851520104 76 1635681 1032 1584refgcc_-O2_-fomit-frame-pointer2019121020190816
2408896649780 76 1668593 1032 1616refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
2438880149960 76 1668809 1032 1616refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019121020190816
2518391920108 76 1635737 1032 1584refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019121020190816
2594724317445 76 1632332 1016 1584refgcc_-Os_-fomit-frame-pointer2019121020190816
2616338033992 76 1652593 1032 1584refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
2874538825477 76 1641898 936 1600refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019121020190816
2878785025477 76 1641898 936 1600refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019121020190816
3189307525649 76 1642066 936 1600refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019121020190816
4219942517489 76 1632396 1016 1584refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
4295700032884 76 1650057 1032 1616refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019121020190816
4355746934960 76 1652137 1032 1616refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
4437058520144 76 1635721 1032 1584refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019121020190816
4628700032072 76 1650897 1032 1584refgcc_-funroll-loops_-O_-fomit-frame-pointer2019121020190816
4644517520008 76 1635545 1032 1584refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
4681980020072 76 1635697 1032 1584refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
4723605020072 76 1635697 1032 1584refgcc_-O_-fomit-frame-pointer2019121020190816
4800691517489 76 1632396 1016 1584refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019121020190816
51290442525096 84 16543757 1024 1584optcc2019121020190816
5515454717409 76 1632292 1016 1584refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019121020190816
7729986639656 76 1658293 1016 1584refgcc2019121020190816
8875932317445 76 1632332 1016 1584refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
10445383339656 76 1658293 1016 1584refcc2019121020190816
17793537339656 76 1658293 1016 1584refgcc_-funroll-loops2019121020190816

Compiler output

Implementation: avx2
Security model: unknown
Compiler: cc
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.h:18:23: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c: #include <immintrin.h>
bitslice_bma_128.c: ^
bitslice_bma_128.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler | Implementations
cc avx2
gcc avx2
gcc -O2 -fomit-frame-pointer avx2
gcc -O3 -fomit-frame-pointer avx2
gcc -O -fomit-frame-pointer avx2
gcc -Os -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -funroll-loops avx2
gcc -funroll-loops -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -O -fomit-frame-pointer avx2
gcc -funroll-loops -Os -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:81:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packuswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:87:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhbw((__v8qi)__m1, (__v8qi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:93:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhwd((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:99:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhdq((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:105:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx2

Compiler output

Implementation: sse2
Security model: unknown
Compiler: cc
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.h: At top level:
bitslice_bma_128.c: bitslice_bma_128.h:18:23: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c: #include <immintrin.h>
bitslice_bma_128.c: ^
bitslice_bma_128.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler | Implementations
cc sse2
gcc sse2
gcc -O2 -fomit-frame-pointer sse2
gcc -O3 -fomit-frame-pointer sse2
gcc -O -fomit-frame-pointer sse2
gcc -Os -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O2 -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O3 -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O -fomit-frame-pointer sse2
gcc -fno-schedule-insns -Os -fomit-frame-pointer sse2
gcc -funroll-loops sse2
gcc -funroll-loops -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -O -fomit-frame-pointer sse2
gcc -funroll-loops -Os -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer sse2
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv sse2

Compiler output

Implementation: sse2
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: ./bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments sse2