Implementation notes: aarch64, hikey960, crypto_decode/653x1541

Computer: hikey960
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_decode
Primitive: 653x1541
Time, Object size, Test size, Implementation, Compiler, Benchmark date, SUPERCOP version
83251904 0 011638 904 736int16gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
88832156 0 011982 904 736int16gcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
116934532 0 015336 816 752int16clang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
116932016 0 012832 816 752int16clang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
124891912 0 011074 888 736int16gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
155472516 0 015678 904 736portablegcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
166503508 0 014935 912 768int16gcc_-O3_-fomit-frame-pointer2019112520190816
166502080 0 011242 888 736int16gcc_-Os_-fomit-frame-pointer2019112520190816
166503820 0 017063 912 768int16gcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
166503792 0 016967 912 768int16gcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
166502080 0 011274 888 736int16gcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
166502156 0 012976 816 752portableclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
166502156 0 012976 816 752portableclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
166502028 0 011766 904 736portablegcc_-O2_-fomit-frame-pointer2019112520190816
166502492 0 013895 912 768portablegcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
166502984 0 015886 904 736portablegcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
166502984 0 016223 912 768portablegcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
166502948 0 015862 904 736portablegcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
166502948 0 016127 912 768portablegcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
166502024 0 011758 904 736portablegcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
177662080 0 011242 888 736int16gcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
177661156 0 012583 912 768refgcc_-O3_-fomit-frame-pointer2019112520190816
17766820 0 09970 888 736refgcc_-Os_-fomit-frame-pointer2019112520190816
211313916 0 017078 904 736int16gcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
233633820 0 016726 904 736int16gcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
233862076 0 011774 904 736int16gcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
233864068 0 014864 816 752portableclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
249752016 0 012832 816 752int16clang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
249753484 0 014887 912 768int16gcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
249752080 0 011274 888 736int16gcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
249753144 0 014559 912 768int16gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
249751960 0 011790 904 736int16gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
249752508 0 013935 912 768portablegcc_-O3_-fomit-frame-pointer2019112520190816
249751320 0 010482 888 736portablegcc_-Os_-fomit-frame-pointer2019112520190816
249751320 0 010482 888 736portablegcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
249751260 0 012080 816 752refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019112520190816
249752072 0 015263 912 768refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
249751148 0 012575 912 768refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
266492016 0 012832 816 752int16clang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
268943916 0 017078 904 736int16gcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
333002156 0 012976 816 752portableclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
333002020 0 011718 904 736portablegcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
333002504 0 013919 912 768portablegcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019112520190816
33300996 0 010694 904 736refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
333002024 0 014934 904 736refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019112520190816
333002028 0 015190 904 736refgcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
333002028 0 015190 904 736refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
333001000 0 010742 904 736refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019112520190816
333152516 0 015678 904 736portablegcc_-funroll-loops_-O_-fomit-frame-pointer2019112520190816
350792008 0 014926 904 736refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
441833792 0 016702 904 736int16gcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019112520190816
44415820 0 09970 888 736refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
457931320 0 010482 888 736portablegcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
467722156 0 011982 904 736int16gcc_-O_-fomit-frame-pointer2019112520190816
467721260 0 012080 816 752refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019112520190816
467721260 0 012080 816 752refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019112520190816
499501252 0 012048 816 752refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019112520190816
582751480 0 011310 904 736portablegcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
582751352 0 010546 888 736portablegcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
582751480 0 011310 904 736portablegcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
58275980 0 010806 904 736refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019112520190816
624451480 0 011310 904 736portablegcc_-O_-fomit-frame-pointer2019112520190816
666005972 0 018154 888 736int16gcc2019112520190816
666005972 0 018154 888 736int16gcc_-funroll-loops2019112520190816
666001156 0 012567 912 768refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019112520190816
701582088 0 011822 904 736int16gcc_-O2_-fomit-frame-pointer2019112520190816
70158996 0 010734 904 736refgcc_-O2_-fomit-frame-pointer2019112520190816
74925820 0 010002 888 736refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019112520190816
83250980 0 010806 904 736refgcc_-O_-fomit-frame-pointer2019112520190816
83250996 0 010830 904 736refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019112520190816
934601352 0 010546 888 736portablegcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
935445972 0 018154 888 736int16cc2019112520190816
935442088 0 015343 912 768refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019112520190816
105237816 0 09970 888 736refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019112520190816
1248902564 0 014746 888 736refgcc2019112520190816
1415252884 0 015066 888 736portablegcc_-funroll-loops2019112520190816
198781820 0 010002 888 736refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019112520190816
2164502564 0 014746 888 736refgcc_-funroll-loops2019112520190816
2923252884 0 015066 888 736portablecc2019112520190816
3829502884 0 015066 888 736portablegcc2019112520190816
6036352564 0 014746 888 736refcc2019112520190816

Compiler output

Implementation: avx
Security model: unknown
Compiler: cc
decode.c: decode.c:3:23: fatal error: immintrin.h: No such file or directory
decode.c: #include <immintrin.h>
decode.c: ^
decode.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler Implementations
cc avx
gcc avx
gcc -O2 -fomit-frame-pointer avx
gcc -O3 -fomit-frame-pointer avx
gcc -O -fomit-frame-pointer avx
gcc -Os -fomit-frame-pointer avx
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops avx
gcc -funroll-loops -O2 -fomit-frame-pointer avx
gcc -funroll-loops -O3 -fomit-frame-pointer avx
gcc -funroll-loops -O -fomit-frame-pointer avx
gcc -funroll-loops -Os -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
decode.c: In file included from decode.c:3:
decode.c: In file included from /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/immintrin.h:27:
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:45:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:69:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:75:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:81:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packuswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:87:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:93:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhwd((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:99:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhdq((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/mmintrin.h:105:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpcklbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx