Implementation notes: aarch64, hikey960, crypto_decode/761x4591

Computer: hikey960
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_decode
Primitive: 761x4591
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
02172 0 012992 816 752int16clang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
124894696 0 015504 816 752int16clang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
166502308 0 012046 904 736int16gcc_-O2_-fomit-frame-pointer2019112520190816
166502304 0 011466 888 736int16gcc_-Os_-fomit-frame-pointer2019112520190816
166502732 0 014135 912 768int16gcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
166502176 0 012006 904 736int16gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
166504236 0 015032 816 752portableclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
166502240 0 011974 904 736portablegcc_-O2_-fomit-frame-pointer2019112520190816
166522228 0 011926 904 736portablegcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
166522660 0 014063 912 768portablegcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
166522240 0 011974 904 736portablegcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
177662852 0 016094 904 736portablegcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
233862172 0 012992 816 752int16clang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
249753140 0 016134 904 736int16gcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
249753140 0 016399 912 768int16gcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
249752468 0 013887 912 768int16gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
249752380 0 013200 816 752portableclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
249753472 0 016847 912 768portablegcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
249753440 0 016430 904 736portablegcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
291412172 0 012992 816 752int16clang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
291412092 0 011830 904 736int16gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
333002764 0 014191 912 768int16gcc_-O3_-fomit-frame-pointer2019112520190816
333002404 0 012230 904 736int16gcc_-O_-fomit-frame-pointer2019112520190816
333002404 0 012230 904 736int16gcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
333003188 0 016230 904 736int16gcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
333002304 0 011498 888 736int16gcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
333003224 0 016462 904 736int16gcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
333002304 0 011498 888 736int16gcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
333002692 0 014119 912 768portablegcc_-O3_-fomit-frame-pointer2019112520190816
333002852 0 016094 904 736portablegcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
333003440 0 016695 912 768portablegcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
333001052 0 012479 912 768refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
333042308 0 012006 904 736int16gcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
333042304 0 011466 888 736int16gcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
333043188 0 016567 912 768int16gcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
333041436 0 010626 888 736portablegcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
350792104 0 011266 888 736int16gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
355321404 0 010562 888 736portablegcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
355321404 0 010562 888 736portablegcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
416252380 0 013200 816 752portableclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
416252380 0 013200 816 752portableclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
416251140 0 011960 816 752refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
416251840 0 015078 904 736refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
444151132 0 011928 816 752refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
44415812 0 09994 888 736refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
46641812 0 09994 888 736refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
467263224 0 016462 904 736int16gcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
467262692 0 014111 912 768portablegcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
499501828 0 014830 904 736refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
499563472 0 016510 904 736portablegcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
582751560 0 011390 904 736portablegcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
58275812 0 09962 888 736refgcc_-Os_-fomit-frame-pointer2019112520190816
666081404 0 010562 888 736portablegcc_-Os_-fomit-frame-pointer2019112520190816
666081436 0 010626 888 736portablegcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
749251560 0 011390 904 736portablegcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
749251044 0 012471 912 768refgcc_-O3_-fomit-frame-pointer2019112520190816
749251044 0 012455 912 768refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
749251844 0 014894 904 736refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
749251976 0 015247 912 768refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
832501140 0 011960 816 752refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
832501140 0 011960 816 752refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
83250988 0 010726 904 736refgcc_-O2_-fomit-frame-pointer2019112520190816
83250988 0 010686 904 736refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
83250996 0 010734 904 736refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
91586808 0 09962 888 736refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
99900972 0 010798 904 736refgcc_-O_-fomit-frame-pointer2019112520190816
99900972 0 010798 904 736refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
99900988 0 010822 904 736refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
1052371560 0 011390 904 736portablegcc_-O_-fomit-frame-pointer2019112520190816
1052371992 0 015375 912 768refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
1082253052 0 015234 888 736portablecc2019112520190816
1082253052 0 015234 888 736portablegcc2019112520190816
128623812 0 09962 888 736refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
1403161840 0 015078 904 736refgcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
1498502544 0 014722 888 736refcc2019112520190816
1665203052 0 015234 888 736portablegcc_-funroll-loops2019112520190816
1831286652 0 018834 888 736int16cc2019112520190816
1831506652 0 018834 888 736int16gcc2019112520190816
1831506652 0 018834 888 736int16gcc_-funroll-loops2019112520190816
3538552544 0 014722 888 736refgcc2019112520190816
3579752544 0 014722 888 736refgcc_-funroll-loops2019112520190816

Compiler output

Implementation: avx
Security model: unknown
Compiler: cc
decode.c: decode.c:3:23: fatal error: immintrin.h: No such file or directory
decode.c: #include <immintrin.h>
decode.c: ^
decode.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler | Implementations
cc avx
gcc avx
gcc -O2 -fomit-frame-pointer avx
gcc -O3 -fomit-frame-pointer avx
gcc -O -fomit-frame-pointer avx
gcc -Os -fomit-frame-pointer avx
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops avx
gcc -funroll-loops -O2 -fomit-frame-pointer avx
gcc -funroll-loops -O3 -fomit-frame-pointer avx
gcc -funroll-loops -O -fomit-frame-pointer avx
gcc -funroll-loops -Os -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
decode.c: In file included from decode.c:3:
decode.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:81:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packuswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:87:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:93:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhwd((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:99:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhdq((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:105:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpcklbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx