Implementation notes: aarch64, hikey960, crypto_kem/ntskem1380

Computer: hikey960
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_kem
Primitive: ntskem1380
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
95936473832 84 1692425 1040 1584optgcc_-funroll-loops_-O2_-fomit-frame-pointer2019121020190816
195637569808 84 1687049 1048 1616optgcc_-O3_-fomit-frame-pointer2019121020190816
196470052880 84 1668489 1040 1584optgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019121020190816
208957554540 84 1670193 1040 1584optgcc_-O_-fomit-frame-pointer2019121020190816
209790054540 84 1670193 1040 1584optgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
212287550697 84 1665628 1024 1584optgcc_-funroll-loops_-Os_-fomit-frame-pointer2019121020190816
235597586468 84 16105337 1048 1616optgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
237869153500 84 1669049 1040 1584optgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
248917568541 84 1684898 944 1600optclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019121020190816
270931550601 84 1665508 1024 1584optgcc_-Os_-fomit-frame-pointer2019121020190816
289986468873 84 1685210 944 1600optclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019121020190816
297202570636 84 1687841 1048 1616optgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121020190816
299096050589 84 1665500 1024 1584optgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019121020190816
358975150697 84 1665628 1024 1584optgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
373870052872 84 1668473 1040 1584optgcc_-O2_-fomit-frame-pointer2019121020190816
373870074556 84 1693409 1040 1584optgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019121020190816
437062568541 84 1684898 944 1600optclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019121020190816
437895068541 84 1684898 944 1600optclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019121020190816
476663574260 84 1692897 1040 1584optgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121020190816
497478550601 84 1665508 1024 1584optgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121020190816
513652585852 84 16104737 1048 1616optgcc_-funroll-loops_-O3_-fomit-frame-pointer2019121020190816
552780074556 84 1693409 1040 1584optgcc_-funroll-loops_-O_-fomit-frame-pointer2019121020190816
561937554656 84 1670313 1040 1584optgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019121020190816
701797568152 84 1685369 1048 1616optgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019121020190816
782592325537 76 1641962 936 1600refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019121120190816
811017925537 76 1641962 936 1600refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019121120190816
816883825537 76 1641962 936 1600refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019121120190816
907842617449 76 1632332 1016 1584refgcc_-Os_-fomit-frame-pointer2019121020190816
9157500515504 84 16534165 1024 1584optcc2019121020190816
929932749348 76 1668161 1032 1616refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121120190816
1144130434484 76 1651657 1032 1616refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019121120190816
1375290032412 76 1649577 1032 1616refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019121020190816
1383615034624 76 1651817 1032 1616refgcc_-O3_-fomit-frame-pointer2019121020190816
1397295935700 76 1654305 1032 1584refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121120190816
14546092515504 84 16534165 1024 1584optgcc_-funroll-loops2019121020190816
1502662525709 76 1642130 936 1600refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019121120190816
1603395020044 76 1635673 1032 1584refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019121020190816
1626705017413 76 1632300 1016 1584refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019121020190816
1906654049520 76 1668361 1032 1616refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019121120190816
1916415020084 76 1635657 1032 1584refgcc_-O2_-fomit-frame-pointer2019121120190816
2121210017449 76 1632332 1016 1584refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121120190816
2164586634084 76 1652913 1032 1584refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019121120190816
2327533319992 76 1635529 1032 1584refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019121120190816
3049447520124 76 1635697 1032 1584refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019121020190816
3428230536004 76 1654577 1032 1584refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019121120190816
3490523639636 76 1658269 1016 1584refgcc2019121120190816
3710214919996 76 1635625 1032 1584refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019121120190816
4125116717493 76 1632396 1016 1584refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019121120190816
4478017517493 76 1632396 1016 1584refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019121120190816
4530465034084 76 1652913 1032 1584refgcc_-funroll-loops_-O_-fomit-frame-pointer2019121120190816
46137150515504 84 16534165 1024 1584optgcc2019121020190816
5061600019996 76 1635625 1032 1584refgcc_-O_-fomit-frame-pointer2019121120190816
6515977539636 76 1658269 1016 1584refcc2019121120190816
6769057539636 76 1658269 1016 1584refgcc_-funroll-loops2019121120190816

Compiler output

Implementation: avx2
Security model: unknown
Compiler: cc
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bitslice_bma_128.h:18:23: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c: #include <immintrin.h>
bitslice_bma_128.c: ^
bitslice_bma_128.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler Implementations
cc avx2
gcc avx2
gcc -O2 -fomit-frame-pointer avx2
gcc -O3 -fomit-frame-pointer avx2
gcc -O -fomit-frame-pointer avx2
gcc -Os -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -funroll-loops avx2
gcc -funroll-loops -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -O -fomit-frame-pointer avx2
gcc -funroll-loops -Os -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:81:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packuswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:87:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhbw((__v8qi)__m1, (__v8qi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:93:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhwd((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:99:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_punpckhdq((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:105:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx2

Compiler output

Implementation: sse2
Security model: unknown
Compiler: cc
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.h: At top level:
bitslice_bma_128.c: bitslice_bma_128.h:18:23: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c: #include <immintrin.h>
bitslice_bma_128.c: ^
bitslice_bma_128.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler Implementations
cc sse2
gcc sse2
gcc -O2 -fomit-frame-pointer sse2
gcc -O3 -fomit-frame-pointer sse2
gcc -O -fomit-frame-pointer sse2
gcc -Os -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O2 -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O3 -fomit-frame-pointer sse2
gcc -fno-schedule-insns -O -fomit-frame-pointer sse2
gcc -fno-schedule-insns -Os -fomit-frame-pointer sse2
gcc -funroll-loops sse2
gcc -funroll-loops -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -O -fomit-frame-pointer sse2
gcc -funroll-loops -Os -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer sse2
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer sse2
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv sse2
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv sse2

Compiler output

Implementation: sse2
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: ./bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^
bitslice_bma_128.c: ./bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments sse2
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments sse2